[TEST]Update nightly acc test standard (#4032)
### What this PR does / why we need it?
This PR updates the accuracy (acc) test standard, i.e. the baselines and thresholds, for some nightly cases. We need it to
better maintain accuracy.
### Does this PR introduce _any_ user-facing change?
No
### How was this patch tested?
By running the test.
- vLLM version: v0.11.0
- vLLM main:
83f478bb19
Signed-off-by: jiangyunfan1 <jiangyunfan1@h-partners.com>
This commit is contained in:
@@ -45,7 +45,7 @@ aisbench_cases = [{
|
|||||||
"dataset_conf": "textvqa/textvqa_gen_base64",
|
"dataset_conf": "textvqa/textvqa_gen_base64",
|
||||||
"max_out_len": 2048,
|
"max_out_len": 2048,
|
||||||
"batch_size": 128,
|
"batch_size": 128,
|
||||||
"baseline": 76,
|
"baseline": 76.22,
|
||||||
"temperature": 0,
|
"temperature": 0,
|
||||||
"top_k": -1,
|
"top_k": -1,
|
||||||
"top_p": 1,
|
"top_p": 1,
|
||||||
|
|||||||
@@ -45,7 +45,7 @@ aisbench_cases = [{
|
|||||||
"dataset_conf": "textvqa/textvqa_gen_base64",
|
"dataset_conf": "textvqa/textvqa_gen_base64",
|
||||||
"max_out_len": 2048,
|
"max_out_len": 2048,
|
||||||
"batch_size": 128,
|
"batch_size": 128,
|
||||||
"baseline": 81,
|
"baseline": 82.05,
|
||||||
"threshold": 5
|
"threshold": 5
|
||||||
}, {
|
}, {
|
||||||
"case_type": "performance",
|
"case_type": "performance",
|
||||||
|
|||||||
@@ -58,7 +58,7 @@ aisbench_cases = [{
|
|||||||
"max_out_len": 32768,
|
"max_out_len": 32768,
|
||||||
"batch_size": 32,
|
"batch_size": 32,
|
||||||
"baseline": 83.33,
|
"baseline": 83.33,
|
||||||
"threshold": 17
|
"threshold": 7
|
||||||
}, {
|
}, {
|
||||||
"case_type": "performance",
|
"case_type": "performance",
|
||||||
"dataset_path": "vllm-ascend/GSM8K-in3500-bs400",
|
"dataset_path": "vllm-ascend/GSM8K-in3500-bs400",
|
||||||
|
|||||||
Reference in New Issue
Block a user