[EAGLE] remove a wrong adjustment for page_size > 1 & topk > 1 in server_args.py (#7643)
This commit is contained in:
@@ -486,12 +486,6 @@ class ServerArgs:
|
|||||||
self.speculative_num_draft_tokens,
|
self.speculative_num_draft_tokens,
|
||||||
) = auto_choose_speculative_params(self)
|
) = auto_choose_speculative_params(self)
|
||||||
|
|
||||||
if self.page_size > 1 and self.speculative_eagle_topk > 1:
|
|
||||||
self.speculative_eagle_topk = 1
|
|
||||||
logger.warning(
|
|
||||||
"speculative_eagle_topk is adjusted to 1 when page_size > 1"
|
|
||||||
)
|
|
||||||
|
|
||||||
if (
|
if (
|
||||||
self.speculative_eagle_topk == 1
|
self.speculative_eagle_topk == 1
|
||||||
and self.speculative_num_draft_tokens != self.speculative_num_steps + 1
|
and self.speculative_num_draft_tokens != self.speculative_num_steps + 1
|
||||||
|
|||||||
Reference in New Issue
Block a user