Revert "Check eagle server args" (#4242)

This commit is contained in:
Lianmin Zheng
2025-03-09 18:53:33 -07:00
committed by GitHub
parent eb06dbcbf8
commit 4a05bdfa86

View File

@@ -284,13 +284,9 @@ class ServerArgs:
"Overlap scheduler are disabled because of using " "Overlap scheduler are disabled because of using "
"eagle speculative decoding." "eagle speculative decoding."
) )
# The token generated from the verify step is counted in speculative_num_draft_tokens. # The token generated from the verify step is counted.
# If speculative_num_steps >= speculative_num_draft_tokens, the additional tokens will definitely be discarded. # If speculative_num_steps >= speculative_num_draft_tokens, the additional tokens will definitely be discarded.
assert self.speculative_num_steps < self.speculative_num_draft_tokens # assert self.speculative_num_steps < self.speculative_num_draft_tokens
assert (
self.speculative_num_draft_tokens - 1
<= self.speculative_num_steps * self.speculative_eagle_topk
)
# GGUF # GGUF
if ( if (