Clean up server_args.py to have a dedicated function for model specific adjustments (#8983)
This commit is contained in:
@@ -15,7 +15,7 @@ from sglang.test.test_utils import (
|
||||
|
||||
TEST_MODEL_MATRIX = {
|
||||
"Qwen/Qwen2.5-7B-Instruct": {
|
||||
"accuracy": 0.85,
|
||||
"accuracy": 0.84,
|
||||
"latency": 150,
|
||||
"output_throughput": 30,
|
||||
},
|
||||
|
||||
Reference in New Issue
Block a user