diff --git a/python/sglang/srt/speculative/eagle_draft_extend_cuda_graph_runner.py b/python/sglang/srt/speculative/eagle_draft_extend_cuda_graph_runner.py index b4ffde60e..7057c502d 100644 --- a/python/sglang/srt/speculative/eagle_draft_extend_cuda_graph_runner.py +++ b/python/sglang/srt/speculative/eagle_draft_extend_cuda_graph_runner.py @@ -84,7 +84,15 @@ class EAGLEDraftExtendCudaGraphRunner: self.hidden_states = torch.zeros( ( self.max_num_token, - self.model_runner.model_config.hidden_size * 3, + ( + self.model_runner.model_config.hf_config.target_hidden_size + * 3 + if hasattr( + self.model_runner.model_config.hf_config, + "target_hidden_size", + ) + else self.model_runner.model_config.hidden_size * 3 + ), ), dtype=self.model_runner.dtype, )