diff --git a/tests/e2e/multicard/test_data_parallel.py b/tests/e2e/multicard/test_data_parallel.py
index 6edeeb37..6b4df381 100644
--- a/tests/e2e/multicard/test_data_parallel.py
+++ b/tests/e2e/multicard/test_data_parallel.py
@@ -28,16 +28,14 @@ from unittest.mock import patch
 import pytest
 
 MODELS = [
-    "Qwen/Qwen3-0.6B",
-    "Qwen/Qwen3-30B-A3B",
-    # FIXME(Potabk): Skip this case for now
-    # "vllm-ascend/Qwen3-30B-A3B-W8A8"
+    "Qwen/Qwen3-0.6B", "Qwen/Qwen3-30B-A3B", "vllm-ascend/Qwen3-30B-A3B-W8A8"
 ]
 
 
 @pytest.mark.parametrize("model", MODELS)
 @pytest.mark.parametrize("max_tokens", [32])
 @patch.dict(os.environ, {"ASCEND_RT_VISIBLE_DEVICES": "0,1"})
+@patch.dict(os.environ, {"HCCL_BUFFSIZE": "1024"})
 def test_qwen3_inference_dp2(model, max_tokens):
     moe_models = ["Qwen/Qwen3-30B-A3B", "vllm-ascend/Qwen3-30B-A3B-W8A8"]
     quantization_models = ["vllm-ascend/Qwen3-30B-A3B-W8A8"]