diff --git a/vllm_ascend/ascend_forward_context.py b/vllm_ascend/ascend_forward_context.py index 8106c935..6f402ca8 100644 --- a/vllm_ascend/ascend_forward_context.py +++ b/vllm_ascend/ascend_forward_context.py @@ -249,11 +249,7 @@ def select_moe_comm_method(num_tokens: int, vllm_config.parallel_config.pipeline_parallel_size >= 16): moe_comm_type = MoECommType.MC2 else: - # Currently, w4a8_dynamic does not support allgatherep - if quant_type == "w4a8_dynamic": - moe_comm_type = MoECommType.ALLTOALL - else: - moe_comm_type = MoECommType.ALLGATHER + moe_comm_type = MoECommType.ALLGATHER elif soc_version in {AscendDeviceType.A3}: ascend_config = get_ascend_config()