Add DeepSeek-V3 and Llama 4 support

2026-02-11 15:27:19 +08:00
parent 9b05d7285e
commit f6d6f69abc
2 changed files with 9 additions and 4 deletions
--- a/vllm-v0.6.2/vllm/spec_decode/mlu_spec_decode_worker.py
+++ b/vllm-v0.6.2/vllm/spec_decode/mlu_spec_decode_worker.py
@@ -159,9 +159,11 @@ class MLUSpecDecodeWorker(LoraNotSupportedWorkerBase):
                    draft_worker_kwargs[
                        "model_runner_cls"] = MLUTP1DraftModelRunner
                else:
-                    if draft_model_config.hf_config.model_type == "eagle":
+                    if draft_model_config.hf_config.model_type in (
+                            "eagle", "deepseek_mtp"):
                        raise NotImplementedError(
-                            "EAGLE does not support TP > 1 yet")
+                            f"{draft_model_config.hf_config.model_type} "
+                            "does not support TP > 1 yet")

                    allow_zero_draft_token_step = False
                proposer_worker = MLUMultiStepWorker(**draft_worker_kwargs)