Fix multi-nodes test failure (#262)

Fix the multi-node CI pipeline.

Co-authored-by: Changho Hwang <changhohwang@microsoft.com>
This commit is contained in:
Binyang Li
2024-02-07 18:21:05 -08:00
committed by GitHub
parent 2101f5251e
commit 7c229fbdd8

View File

@@ -165,9 +165,8 @@ def run_benchmark(
memory_out = cp.zeros(nelem, dtype=data_type)
cp.cuda.runtime.deviceSynchronize()
proxy_service = None
proxy_service = ProxyService()
if MPI.COMM_WORLD.size // N_GPUS_PER_NODE == 1:
proxy_service = ProxyService()
if memory.nbytes < 2**20:
mscclpp_algos = [MscclppAllReduce2(mscclpp_group, memory, memory_out)]
else: