diff --git a/.github/workflows/_e2e_test.yaml b/.github/workflows/_e2e_test.yaml index be5b43e6..0dd57b70 100644 --- a/.github/workflows/_e2e_test.yaml +++ b/.github/workflows/_e2e_test.yaml @@ -171,7 +171,10 @@ jobs: if: ${{ inputs.type == 'light' }} run: | pytest -sv tests/e2e/multicard/test_qwen3_moe.py::test_models_distributed_Qwen3_MOE_TP2_WITH_EP + pytest -sv tests/e2e/multicard/test_torchair_graph_mode.py::test_e2e_qwen3_moe_with_torchair pytest -sv tests/e2e/multicard/test_torchair_graph_mode.py::test_e2e_deepseekv2lite_with_torchair + pytest -sv tests/e2e/multicard/test_torchair_graph_mode.py::test_e2e_deepseekv2lite_with_torchair_v1scheduler + pytest -sv tests/e2e/multicard/test_torchair_graph_mode.py::test_e2e_deepseekv2lite_with_nz - name: Run vllm-project/vllm-ascend test (full) env: diff --git a/tests/e2e/multicard/test_torchair_graph_mode.py b/tests/e2e/multicard/test_torchair_graph_mode.py index e55d3466..a6f3f16d 100644 --- a/tests/e2e/multicard/test_torchair_graph_mode.py +++ b/tests/e2e/multicard/test_torchair_graph_mode.py @@ -288,3 +288,14 @@ def test_e2e_deepseekv2lite_with_torchair_v1scheduler(): } _deepseek_v2_lite_torchair_test_fixure(additional_config, use_v1_schduler=True) + + +# e2e test with enable_kv_nz turned on in torchair_graph_config +def test_e2e_deepseekv2lite_with_nz(): + additional_config = { + "torchair_graph_config": { + "enabled": True, + "enable_kv_nz": True, + }, + } + _deepseek_v2_lite_torchair_test_fixure(additional_config)