forked from EngineX-Cambricon/enginex-mlu370-vllm
Add DeepSeek V3 MTP and Llama 4 model support
This commit is contained in:
@@ -1,5 +1,4 @@
|
||||
"""Inference-only DeepSeek V3 Multi-Token Prediction (MTP) model."""
|
||||
import re
|
||||
from typing import Iterable, List, Optional, Tuple
|
||||
|
||||
import torch
|
||||
@@ -18,7 +17,6 @@ from vllm.model_executor.sampling_metadata import SamplingMetadata
|
||||
from vllm.sequence import IntermediateTensors
|
||||
|
||||
from .deepseek_v2 import DeepseekV2DecoderLayer
|
||||
from .utils import maybe_prefix
|
||||
|
||||
|
||||
class SharedHead(nn.Module):
|
||||
@@ -240,6 +238,11 @@ class DeepSeekMTP(nn.Module):
|
||||
and ".layers" not in name):
|
||||
continue
|
||||
|
||||
# Strip "model." prefix since DeepSeekMTP holds
|
||||
# embed_tokens and layers directly (no .model wrapper)
|
||||
if name.startswith("model."):
|
||||
name = name[len("model."):]
|
||||
|
||||
self._load_single_weight(
|
||||
name, loaded_weight, stacked_params_mapping,
|
||||
params_dict)
|
||||
|
||||
Reference in New Issue
Block a user