From 8e72758645571800cb5d35edd28a2c86d0d07688 Mon Sep 17 00:00:00 2001 From: offline893 <158537145+offline893@users.noreply.github.com> Date: Fri, 7 Nov 2025 17:43:23 +0800 Subject: [PATCH] [BugFix]Fix grouplist type of mc2. (#4049) ### What this PR does / why we need it? Fix an accuracy problem in EPLB caused by the PTA upgrade. This is a backport of #4047. ### How was this patch tested? Main: baseline: | dataset | version | metric | mode | vllm-api-general-chat | |----- | ----- | ----- | ----- | -----| | aime2024 | 604a78 | accuracy | gen | 87.50 | EPLB: | dataset | version | metric | mode | vllm-api-general-chat | |----- | ----- | ----- | ----- | -----| | aime2024 | 604a78 | accuracy | gen | 87.50 | - vLLM version: v0.11.0 - vLLM main: https://github.com/vllm-project/vllm/commit/83f478bb19489b41e9d208b47b4bb5a95ac171ac Signed-off-by: offline0806 <3337230449@qq.com> Co-authored-by: offline0806 <3337230449@qq.com> --- vllm_ascend/ops/moe/token_dispatcher.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/vllm_ascend/ops/moe/token_dispatcher.py b/vllm_ascend/ops/moe/token_dispatcher.py index 88c8cb6..5182e9e 100644 --- a/vllm_ascend/ops/moe/token_dispatcher.py +++ b/vllm_ascend/ops/moe/token_dispatcher.py @@ -212,7 +212,7 @@ class TokenDispatcherWithMC2(MoETokenDispatcher): if shared_experts is not None: shared_gate_up, _ = shared_experts.gate_up_proj(hidden_states) self.shared_act = shared_experts.act_fn(shared_gate_up) - group_list_type = 1 if dynamic_eplb else 0 + group_list_type = 0 return { "group_list_type": group_list_type, "hidden_states": expand_x,