diff --git a/tests/e2e/nightly/models/test_deepseek_r1_0528_w8a8.py b/tests/e2e/nightly/models/test_deepseek_r1_0528_w8a8.py index 38f54a04..c9126577 100644 --- a/tests/e2e/nightly/models/test_deepseek_r1_0528_w8a8.py +++ b/tests/e2e/nightly/models/test_deepseek_r1_0528_w8a8.py @@ -32,6 +32,7 @@ MODES = [ "torchair", "single", "aclgraph", + "aclgraph_mlapo", "no_chunkprefill", ] @@ -108,6 +109,9 @@ async def test_models(model: str, mode: str) -> None: additional_config["torchair_graph_config"] = {"enabled": False} if mode == "aclgraph": additional_config["torchair_graph_config"] = {"enabled": False} + if mode == "aclgraph_mlapo": + env_dict["VLLM_ASCEND_ENABLE_MLAPO"] = "1" + additional_config["torchair_graph_config"] = {"enabled": False} if mode == "no_chunkprefill": additional_config["ascend_scheduler_config"] = {"enabled": True} i = server_args.index("--max-num-batched-tokens") + 1