[MOE Refactor] Remove QuantType in prepare_finalize.py (#6534)

### What this PR does / why we need it? To prevent confusion between different QuantType classes, we remove QuantType from prepare_finalize.py. - vLLM version: v0.15.0 - vLLM main: https://github.com/vllm-project/vllm/commit/v0.15.0 Signed-off-by: shenchuxiaofugui <1311027364@qq.com>
2026-02-10 15:59:58 +08:00
parent 34eecacace
commit 7cf285a77a
4 changed files with 9 additions and 24 deletions
--- a/vllm_ascend/ops/fused_moe/moe_comm_method.py
+++ b/vllm_ascend/ops/fused_moe/moe_comm_method.py
@@ -30,7 +30,6 @@ from vllm_ascend.ops.fused_moe.prepare_finalize import (
    PrepareAndFinalizeWithAll2All,
    PrepareAndFinalizeWithAllGather,
    PrepareAndFinalizeWithMC2,
-    QuantType,
 )
 from vllm_ascend.ops.fused_moe.token_dispatcher import (
    MoETokenDispatcher,
@@ -38,6 +37,7 @@ from vllm_ascend.ops.fused_moe.token_dispatcher import (
    TokenDispatcherWithAllGather,
    TokenDispatcherWithMC2,
 )
+from vllm_ascend.quantization.methods.base import QuantType

 _MoECommMethods: dict[MoECommType | None, MoECommMethod] = {}