diff --git a/vllm-v0.6.2/vllm/model_executor/models/deepseek_v2.py b/vllm-v0.6.2/vllm/model_executor/models/deepseek_v2.py
index 4fb1eed..2649139 100644
--- a/vllm-v0.6.2/vllm/model_executor/models/deepseek_v2.py
+++ b/vllm-v0.6.2/vllm/model_executor/models/deepseek_v2.py
@@ -611,3 +611,7 @@ class DeepseekV2ForCausalLM(nn.Module, SupportsPP):
                     weight_loader = getattr(param, "weight_loader",
                                             default_weight_loader)
                     weight_loader(param, loaded_weight)
+
+
+class DeepseekV3ForCausalLM(DeepseekV2ForCausalLM):
+    pass
diff --git a/vllm-v0.6.2/vllm/model_executor/models/registry.py b/vllm-v0.6.2/vllm/model_executor/models/registry.py
index 2cfa0df..75fc5d2 100644
--- a/vllm-v0.6.2/vllm/model_executor/models/registry.py
+++ b/vllm-v0.6.2/vllm/model_executor/models/registry.py
@@ -48,6 +48,7 @@ _TEXT_GENERATION_MODELS = {
     "DeciLMForCausalLM": ("decilm", "DeciLMForCausalLM"),
     "DeepseekForCausalLM": ("deepseek", "DeepseekForCausalLM"),
     "DeepseekV2ForCausalLM": ("deepseek_v2", "DeepseekV2ForCausalLM"),
+    "DeepseekV3ForCausalLM": ("deepseek_v2", "DeepseekV3ForCausalLM"),
     "ExaoneForCausalLM": ("exaone", "ExaoneForCausalLM"),
     "FalconForCausalLM": ("falcon", "FalconForCausalLM"),
     "GemmaForCausalLM": ("gemma", "GemmaForCausalLM"),