add deepseekv3 and llama4
This commit is contained in:
@@ -159,9 +159,11 @@ class MLUSpecDecodeWorker(LoraNotSupportedWorkerBase):
                         draft_worker_kwargs[
                             "model_runner_cls"] = MLUTP1DraftModelRunner
                 else:
-                    if draft_model_config.hf_config.model_type == "eagle":
+                    if draft_model_config.hf_config.model_type in (
+                            "eagle", "deepseek_mtp"):
                         raise NotImplementedError(
-                            "EAGLE does not support TP > 1 yet")
+                            f"{draft_model_config.hf_config.model_type} "
+                            "does not support TP > 1 yet")
 
                     allow_zero_draft_token_step = False
                 proposer_worker = MLUMultiStepWorker(**draft_worker_kwargs)
Reference in New Issue
Block a user