[CI] recover e2e test (#2688)

1. recover the skipped test.
2. remove pangu eager mode test, it's tested by torchair mode already.
3. skip pangu test util the bug is fixed.

- vLLM version: v0.10.1.1
- vLLM main:
56d04089ef

Signed-off-by: wangxiyuan <wangxiyuan1007@gmail.com>
This commit is contained in:
wangxiyuan
2025-09-02 18:49:17 +08:00
committed by GitHub
parent f023bd52bf
commit 0829b4873f
6 changed files with 8 additions and 45 deletions

View File

@@ -22,8 +22,9 @@ Run `pytest tests/multicard/test_torchair_graph_mode.py`.
import os
from typing import Dict
import pytest
from tests.e2e.conftest import VllmRunner
from vllm_ascend.ascend_config import clear_ascend_config
os.environ["PYTORCH_NPU_ALLOC_CONF"] = "max_split_size_mb:256"
@@ -85,8 +86,6 @@ def test_e2e_deepseekv3_with_torchair():
}
_deepseek_torchair_test_fixture(additional_config)
clear_ascend_config()
def test_e2e_deepseekv3_with_torchair_ms_mla():
additional_config = {
@@ -97,8 +96,6 @@ def test_e2e_deepseekv3_with_torchair_ms_mla():
}
_deepseek_torchair_test_fixture(additional_config)
clear_ascend_config()
def test_e2e_deepseekv3_with_torchair_v1scheduler():
additional_config = {
@@ -108,8 +105,6 @@ def test_e2e_deepseekv3_with_torchair_v1scheduler():
}
_deepseek_torchair_test_fixture(additional_config, use_v1_schduler=True)
clear_ascend_config()
def _pangu_torchair_test_fixture(
additional_config: Dict,
@@ -160,6 +155,7 @@ def _pangu_torchair_test_fixture(
print(f"Generated text: {vllm_output[i][1]!r}")
@pytest.mark.skip("pangu doesn't work, fix me")
def test_e2e_pangu_with_torchair():
additional_config = {
"torchair_graph_config": {
@@ -168,8 +164,6 @@ def test_e2e_pangu_with_torchair():
}
_pangu_torchair_test_fixture(additional_config)
clear_ascend_config()
def _qwen_torchair_test_fixture(
model,
@@ -228,9 +222,6 @@ def _qwen_torchair_test_fixture(
def test_e2e_qwen2_with_torchair():
_qwen_torchair_test_fixture("Qwen/Qwen2.5-0.5B-Instruct", 2, False)
clear_ascend_config()
def test_e2e_qwen3_moe_with_torchair():
_qwen_torchair_test_fixture("Qwen/Qwen3-30B-A3B", 2, True)
clear_ascend_config()