From 81fd2b0ee0df11f5d7db486d7bf1180f4f5bd196 Mon Sep 17 00:00:00 2001 From: Zhengyi Lai Date: Thu, 23 Oct 2025 12:20:54 +0800 Subject: [PATCH] =?UTF-8?q?fix(deepep):=20resolve=20benchmark=20failure=20?= =?UTF-8?q?on=204=C3=97IB-card=20setup=20by=20aligning=20tuning=20config?= =?UTF-8?q?=20with=20DeepEP=20commit=20bdd119f8=20(#11965)?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- benchmark/kernels/deepep/tuning_deepep.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/benchmark/kernels/deepep/tuning_deepep.py b/benchmark/kernels/deepep/tuning_deepep.py index bb900a875..db08a8f14 100644 --- a/benchmark/kernels/deepep/tuning_deepep.py +++ b/benchmark/kernels/deepep/tuning_deepep.py @@ -381,8 +381,8 @@ def test_main( # Tune combine performance best_time, best_results = 1e10, None - for nvl_chunk_size in range(1, 5, 1): - for rdma_chunk_size in range(8, 33, 4): + for nvl_chunk_size in range(1, 8, 1): + for rdma_chunk_size in range(12 if num_nodes == 2 else 8, 33, 4): config_kwargs = { "num_sms": num_sms, "num_max_nvl_chunked_send_tokens": nvl_chunk_size,