diff --git a/python/sglang/srt/models/glm4_moe.py b/python/sglang/srt/models/glm4_moe.py index 9716557f4..f080beb50 100644 --- a/python/sglang/srt/models/glm4_moe.py +++ b/python/sglang/srt/models/glm4_moe.py @@ -795,6 +795,7 @@ class Glm4MoeForCausalLM(DeepseekV2ForCausalLM): elif ( self.quant_config.get_name() == "fp8" or self.quant_config.get_name() == "blockwise_int8" + or self.quant_config.get_name() == "compressed_tensors" ): suffix_list = [ "down_proj.weight",