mirror of
https://github.com/microsoft/mscclpp.git
synced 2026-05-12 09:17:06 +00:00
tests/ep: HT benches also print per_rank_bw
Align the HT benches with NCCL-EP ep_bench in the same way as the LL test: report both per-rank (agg/num_ranks) and aggregate throughput.
This commit is contained in:
@@ -338,11 +338,15 @@ def main():
|
||||
flush=True,
|
||||
)
|
||||
print(
|
||||
f" dispatch: {disp_us_t.item():.1f}us (max) agg_bw={disp_bw_t.item():.2f} GB/s",
|
||||
f" dispatch: {disp_us_t.item():.1f}us (max) "
|
||||
f"per_rank_bw={disp_bw_t.item() / num_ranks:.2f} GB/s "
|
||||
f"agg_bw={disp_bw_t.item():.2f} GB/s",
|
||||
flush=True,
|
||||
)
|
||||
print(
|
||||
f" combine : {comb_us_t.item():.1f}us (max) agg_bw={comb_bw_t.item():.2f} GB/s",
|
||||
f" combine : {comb_us_t.item():.1f}us (max) "
|
||||
f"per_rank_bw={comb_bw_t.item() / num_ranks:.2f} GB/s "
|
||||
f"agg_bw={comb_bw_t.item():.2f} GB/s",
|
||||
flush=True,
|
||||
)
|
||||
|
||||
|
||||
@@ -285,11 +285,15 @@ def main():
|
||||
flush=True,
|
||||
)
|
||||
print(
|
||||
f" dispatch: {disp_us_t.item():.1f}us (max) agg_bw={disp_bw_t.item():.2f} GB/s",
|
||||
f" dispatch: {disp_us_t.item():.1f}us (max) "
|
||||
f"per_rank_bw={disp_bw_t.item() / num_ranks:.2f} GB/s "
|
||||
f"agg_bw={disp_bw_t.item():.2f} GB/s",
|
||||
flush=True,
|
||||
)
|
||||
print(
|
||||
f" combine : {comb_us_t.item():.1f}us (max) agg_bw={comb_bw_t.item():.2f} GB/s",
|
||||
f" combine : {comb_us_t.item():.1f}us (max) "
|
||||
f"per_rank_bw={comb_bw_t.item() / num_ranks:.2f} GB/s "
|
||||
f"agg_bw={comb_bw_t.item():.2f} GB/s",
|
||||
flush=True,
|
||||
)
|
||||
|
||||
|
||||
Reference in New Issue
Block a user