chore: tune mem fraction static for vlm (#6881)

This commit is contained in:
Mick
2025-07-19 08:19:27 +08:00
committed by GitHub
parent 9c7a46180c
commit 3964b352c3
4 changed files with 57 additions and 13 deletions

View File

@@ -22,7 +22,7 @@ class TestPixtralServer(TestOpenAIVisionServer):
other_args=[
"--trust-remote-code",
"--mem-fraction-static",
-"0.73",
+"0.70",
],
)
cls.base_url += "/v1"
@@ -44,7 +44,7 @@ class TestMistral3_1Server(TestOpenAIVisionServer):
other_args=[
"--trust-remote-code",
"--mem-fraction-static",
-"0.8",
+"0.75",
],
)
cls.base_url += "/v1"
@@ -88,7 +88,7 @@ class TestJanusProServer(TestOpenAIVisionServer):
other_args=[
"--trust-remote-code",
"--mem-fraction-static",
-"0.4",
+"0.35",
],
)
cls.base_url += "/v1"
@@ -197,7 +197,7 @@ class TestPhi4MMServer(TestOpenAIVisionServer):
other_args=[
"--trust-remote-code",
"--mem-fraction-static",
-"0.75",
+"0.70",
"--disable-radix-cache",
"--max-loras-per-batch",
"1",