From 5c980830a0ec0d7a1c2a02db78917533fc600938 Mon Sep 17 00:00:00 2001
From: Chranos <826995883@qq.com>
Date: Wed, 11 Feb 2026 14:37:00 +0800
Subject: [PATCH] add deepseekv3 and llama4: import maybe_remap_kv_scale_name in llama4.py

---
 vllm-v0.6.2/vllm_mlu/vllm_mlu/model_executor/models/llama4.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/vllm-v0.6.2/vllm_mlu/vllm_mlu/model_executor/models/llama4.py b/vllm-v0.6.2/vllm_mlu/vllm_mlu/model_executor/models/llama4.py
index 604086f..495b2a4 100644
--- a/vllm-v0.6.2/vllm_mlu/vllm_mlu/model_executor/models/llama4.py
+++ b/vllm-v0.6.2/vllm_mlu/vllm_mlu/model_executor/models/llama4.py
@@ -9,7 +9,8 @@ from vllm.model_executor.layers.layernorm import RMSNorm
 from vllm_mlu.model_executor.layers.feed_forward import FeedForward
 from vllm_mlu.mlu_hijack_utils import MluHijackObject
 from vllm.distributed import tensor_model_parallel_all_reduce
-from vllm.model_executor.model_loader.weight_utils import default_weight_loader
+from vllm.model_executor.model_loader.weight_utils import (
+    default_weight_loader, maybe_remap_kv_scale_name)
 from vllm.model_executor.models.llama4 import (
     Llama4Attention, Llama4DecoderLayer, Llama4ForCausalLM,
     Llama4Model, Llama4MoE)