Quick Fix GLM (#9264)

This commit is contained in:
Stefan He
2025-08-16 23:43:41 -07:00
committed by GitHub
parent bb10e3a1c3
commit e47800e176
2 changed files with 6 additions and 1 deletions

View File

@@ -30,7 +30,7 @@ MODEL_SCORE_THRESHOLDS = {
"neuralmagic/Meta-Llama-3.1-8B-Instruct-FP8": 0.83,
"neuralmagic/Mistral-7B-Instruct-v0.3-FP8": 0.54,
"neuralmagic/DeepSeek-Coder-V2-Lite-Instruct-FP8": 0.84,
"zai-org/GLM-4.5-Air-FP8": 0.94,
"zai-org/GLM-4.5-Air-FP8": 0.78,
# The threshold of neuralmagic/gemma-2-2b-it-FP8 should be 0.6, but this model has some accuracy regression.
# The fix is tracked at https://github.com/sgl-project/sglang/issues/4324, we set it to 0.50, for now, to make CI green.
"neuralmagic/gemma-2-2b-it-FP8": 0.50,