[TEST] Add MLAPO for aclgraph in nightly test (#3894)
### What this PR does / why we need it?
This PR adds an MLAPO mode for the DeepSeek aclgraph test, which we need to run nightly.
### Does this PR introduce _any_ user-facing change?
No
### How was this patch tested?
By running the test
- vLLM version: v0.11.0
- vLLM main:
83f478bb19
---------
Signed-off-by: jiangyunfan1 <jiangyunfan1@h-partners.com>
This commit is contained in:
@@ -32,6 +32,7 @@ MODES = [
|
|||||||
"torchair",
|
"torchair",
|
||||||
"single",
|
"single",
|
||||||
"aclgraph",
|
"aclgraph",
|
||||||
|
"aclgraph_mlapo",
|
||||||
"no_chunkprefill",
|
"no_chunkprefill",
|
||||||
]
|
]
|
||||||
|
|
||||||
@@ -108,6 +109,9 @@ async def test_models(model: str, mode: str) -> None:
|
|||||||
additional_config["torchair_graph_config"] = {"enabled": False}
|
additional_config["torchair_graph_config"] = {"enabled": False}
|
||||||
if mode == "aclgraph":
|
if mode == "aclgraph":
|
||||||
additional_config["torchair_graph_config"] = {"enabled": False}
|
additional_config["torchair_graph_config"] = {"enabled": False}
|
||||||
|
if mode == "aclgraph_mlapo":
|
||||||
|
env_dict["VLLM_ASCEND_ENABLE_MLAPO"] = "1"
|
||||||
|
additional_config["torchair_graph_config"] = {"enabled": False}
|
||||||
if mode == "no_chunkprefill":
|
if mode == "no_chunkprefill":
|
||||||
additional_config["ascend_scheduler_config"] = {"enabled": True}
|
additional_config["ascend_scheduler_config"] = {"enabled": True}
|
||||||
i = server_args.index("--max-num-batched-tokens") + 1
|
i = server_args.index("--max-num-batched-tokens") + 1
|
||||||
|
|||||||
Reference in New Issue
Block a user