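Remove __CUDA_ARCH__-guarded fp8 (e4m3/e5m2) cudaErrorNotSupported branch from NVLS zero-copy allreduce dispatch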

2026-05-11 17:00:22 +00:00 · 2026-05-08 03:43:34 +00:00
parent 113d859d13
commit 9ff7e1c2c3
1 changed files with 1 additions and 8 deletions
--- a/src/ext/collectives/allreduce/allreduce_nvls_zero_copy.cu
+++ b/src/ext/collectives/allreduce/allreduce_nvls_zero_copy.cu
@@ -82,14 +82,7 @@ struct NvlsAdapter {
    } else if constexpr (std::is_same_v<T, __fp8_e4m3b15>) {
      // fp8_e4m3b15 is a software-only type with no hardware NVLS support.
      return cudaErrorNotSupported;
-    } else
-#if defined(__CUDA_ARCH__) && \
-    ((!defined(__CUDA_ARCH_SPECIFIC__) && !defined(__CUDA_ARCH_FAMILY_SPECIFIC__)) || (__CUDA_ARCH__ < 1000))
-        if constexpr (std::is_same_v<T, __fp8_e4m3> || std::is_same_v<T, __fp8_e5m2>) {
-      return cudaErrorNotSupported;
-    } else
-#endif
-    {
+    } else {
      using ChannelType = DeviceHandle<mscclpp::BaseMemoryChannel>;
      allreduceNvls<T, AccumT><<<nBlocks, nThreadsPerBlock, 0, stream>>>(
          (ChannelType*)memoryChannels, nvlsChannels, nvlsOutChannels, channelInOffset, channelOutOffset, inputSize,