[TEST] Add initial multimodal cases for nightly test and deepseek-r1 tests (#3631)

### What this PR does / why we need it? This PR adds the initial multimodal model cases to the nightly tests: 3 cases for Qwen2.5-vl-7b accuracy/performance tests on A3, which need to be run daily. It also includes 8 cases for deepseek-r1-0528-w8a8 functional, accuracy, and performance tests. ### Does this PR introduce _any_ user-facing change? No ### How was this patch tested? By running the tests. - vLLM version: v0.11.0rc3 - vLLM main: https://github.com/vllm-project/vllm/commit/v0.11.0 --------- Signed-off-by: jiangyunfan1 <jiangyunfan1@h-partners.com>
2025-10-23 17:18:49 +08:00
parent 427b17e2da
commit 9434f24ded
4 changed files with 192 additions and 25 deletions
--- a/tests/e2e/nightly/models/test_qwen3_32b_int8.py
+++ b/tests/e2e/nightly/models/test_qwen3_32b_int8.py
@@ -51,6 +51,15 @@ VLLM_CI_RUNNER = os.getenv("VLLM_CI_RUNNER", "linux-aarch64-a2-4")
 performance_batch_size = batch_size_dict.get(VLLM_CI_RUNNER, 1)

 aisbench_cases = [{
+    "case_type": "accuracy",
+    "dataset_path": "vllm-ascend/aime2024",
+    "request_conf": "vllm_api_general_chat",
+    "dataset_conf": "aime2024/aime2024_gen_0_shot_chat_prompt",
+    "max_out_len": 32768,
+    "batch_size": 32,
+    "baseline": 83.33,
+    "threshold": 17
+}, {
    "case_type": "performance",
    "dataset_path": "vllm-ascend/GSM8K-in3500-bs400",
    "request_conf": "vllm_api_stream_chat",
@@ -60,15 +69,6 @@ aisbench_cases = [{
    "batch_size": performance_batch_size,
    "baseline": 1,
    "threshold": 0.97
-}, {
-    "case_type": "accuracy",
-    "dataset_path": "vllm-ascend/aime2024",
-    "request_conf": "vllm_api_general_chat",
-    "dataset_conf": "aime2024/aime2024_gen_0_shot_chat_prompt",
-    "max_out_len": 32768,
-    "batch_size": 32,
-    "baseline": 83.33,
-    "threshold": 17
 }]