Fix Python bindings and tests (#690)

Minimal fix to get the Python bindings and tests working again. A more
careful follow-up is still needed to prevent nanobind from silently falling
back when it fails to (properly) construct a C++ STL object with mscclpp instances.
This commit is contained in:
Changho Hwang
2025-11-21 12:53:12 -08:00
committed by GitHub
parent 060c35fec6
commit 8b8593ba51
8 changed files with 73 additions and 63 deletions

View File

@@ -453,7 +453,10 @@ class MscclppAllReduce6:
)
# create a MemoryDevice2DeviceSemaphore for each remote neighbor
self.semaphores = group.make_semaphore(self.nvlink_connections, MemoryDevice2DeviceSemaphore)
self.semaphores = {
rank: MemoryDevice2DeviceSemaphore(sema)
for rank, sema in group.make_semaphores(self.nvlink_connections).items()
}
file_dir = os.path.dirname(os.path.abspath(__file__))
self.kernel = KernelBuilder(
file="allreduce.cu",