diff --git a/python/sglang/srt/models/glm4v_moe.py b/python/sglang/srt/models/glm4v_moe.py index 86cca4ab2..2a17e04b0 100644 --- a/python/sglang/srt/models/glm4v_moe.py +++ b/python/sglang/srt/models/glm4v_moe.py @@ -74,6 +74,9 @@ class Glm4vMoeForConditionalGeneration(Glm4vForConditionalGeneration): self.pooler = Pooler(pooling_type=PoolingType.LAST, normalize=True) self.is_mrope_enabled = "mrope_section" in self.config.rope_scaling + # For EAGLE3 support + self.capture_aux_hidden_states = False + def determine_num_fused_shared_experts( self, architecture: str = "Glm4MoeForCausalLM" ):