Fix dtype for idle input in spec decoding (#7456)

This commit is contained in:
Cheng Wan
2025-06-23 11:23:25 -07:00
committed by GitHub
parent 34b6b8426f
commit f8d48fd311
2 changed files with 5 additions and 3 deletions

View File

@@ -498,6 +498,7 @@ class EAGLEWorker(TpModelWorker):
batch.spec_info = EagleDraftInput.create_idle_input(
device=self.device,
hidden_size=self.model_config.hidden_size,
dtype=self.model_config.dtype,
topk=self.topk,
capture_hidden_mode=CaptureHiddenMode.LAST,
)
@@ -838,6 +839,7 @@ class EAGLEWorker(TpModelWorker):
batch.spec_info = EagleDraftInput.create_idle_input(
device=self.device,
hidden_size=self.model_config.hidden_size,
dtype=self.model_config.dtype,
topk=self.topk,
capture_hidden_mode=CaptureHiddenMode.LAST,
)