diff --git a/python/test/executor_test.py b/python/test/executor_test.py index eeace1a1..1175d629 100644 --- a/python/test/executor_test.py +++ b/python/test/executor_test.py @@ -230,6 +230,8 @@ def main( # Count how many elements changed changed = cp.count_nonzero(result_buf != cp.float16(123.0)).item() print("changed elements:", changed, "out of", result_buf.size) + cp.cuda.runtime.deviceSynchronize() + mscclpp_group.barrier() bench_correctness( collective,