mirror of
https://github.com/microsoft/mscclpp.git
synced 2026-05-22 22:08:28 +00:00
Do not check value of __HIP_PLATFORM_AMD__ (#240)
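According to the [HIP porting guide](https://rocm.docs.amd.com/projects/HIP/en/docs-6.0.0/user_guide/hip_porting_guide.html#compiler-defines-summary), `__HIP_PLATFORM_AMD__` takes effect simply by being defined, so only `defined(__HIP_PLATFORM_AMD__)` should be tested and its value should not be checked.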
This commit is contained in:
@@ -74,7 +74,7 @@ __device__ void localAllGather(DeviceHandle<mscclpp::SimpleProxyChannel> proxyCh
|
||||
if ((remoteRank % nranksPerNode) == ((rank - i + nranksPerNode) % nranksPerNode)) {
|
||||
if ((threadIdx.x % 32) == 0) proxyChan.wait();
|
||||
}
|
||||
#if defined(__HIP_PLATFORM_AMD__) && (__HIP_PLATFORM_AMD__ == 1)
|
||||
#if defined(__HIP_PLATFORM_AMD__)
|
||||
// NOTE: we actually need a group barrier here for better performance, but __syncthreads() is still correct.
|
||||
__syncthreads();
|
||||
#else
|
||||
|
||||
Reference in New Issue
Block a user