From c36a6693f3ef2d79f491f7fb1bbb4fe0520766b5 Mon Sep 17 00:00:00 2001 From: Xinyuan Tong <115166877+JustinTong0323@users.noreply.github.com> Date: Thu, 7 Aug 2025 00:44:44 -0700 Subject: [PATCH] Disable gemma3 for SWA due to CUDA illegal memory access error (#8895) Signed-off-by: Xinyuan Tong --- python/sglang/srt/server_args.py | 2 ++ 1 file changed, 2 insertions(+) diff --git a/python/sglang/srt/server_args.py b/python/sglang/srt/server_args.py index 442403307..27362ad27 100644 --- a/python/sglang/srt/server_args.py +++ b/python/sglang/srt/server_args.py @@ -2037,6 +2037,8 @@ class ServerArgs: if model_arch in [ "Gemma2ForCausalLM", + "Gemma3ForCausalLM", + "Gemma3ForConditionalGeneration", "Gemma3nForCausalLM", "Gemma3nForConditionalGeneration", ]: