fix: Gemma 3 does not use softcap (#5622)

This commit is contained in:
Yineng Zhang
2025-04-22 01:16:08 -07:00
committed by GitHub
parent 506be6b892
commit 04f2abcb34
4 changed files with 17 additions and 2 deletions

View File

@@ -154,6 +154,7 @@ class ServerArgs:
disable_outlines_disk_cache: bool = False
disable_custom_all_reduce: bool = False
enable_llama4_multimodal: Optional[bool] = None
enable_gemma3_multimodal: Optional[bool] = None
disable_overlap_schedule: bool = False
enable_mixed_chunk: bool = False
enable_dp_attention: bool = False
@@ -285,7 +286,9 @@ class ServerArgs:
if self.grammar_backend is None:
self.grammar_backend = "xgrammar"
self.enable_multimodal: Optional[bool] = self.enable_llama4_multimodal
self.enable_multimodal: Optional[bool] = (
self.enable_llama4_multimodal or self.enable_gemma3_multimodal
)
# Data parallelism attention
if self.enable_dp_attention:
@@ -984,6 +987,12 @@ class ServerArgs:
action="store_true",
help="Enable the multimodal functionality for Llama-4.",
)
parser.add_argument(
"--enable-gemma3-multimodal",
default=ServerArgs.enable_gemma3_multimodal,
action="store_true",
help="Enable the multimodal functionality for Gemma-3.",
)
parser.add_argument(
"--disable-overlap-schedule",
action="store_true",