Add group barrier before correctness check

This commit is contained in:
Ubuntu
2026-04-07 01:40:15 +00:00
parent 812f6cfded
commit 3f2ade22cb

View File

@@ -230,6 +230,8 @@ def main(
# Count how many elements changed
changed = cp.count_nonzero(result_buf != cp.float16(123.0)).item()
print("changed elements:", changed, "out of", result_buf.size)
cp.cuda.runtime.deviceSynchronize()
mscclpp_group.barrier()
bench_correctness(
collective,