From 8aa5ae6b042f09d9beb2b0e814ea9c2311b6c2b6 Mon Sep 17 00:00:00 2001 From: yilian49 <43861414+yilian49@users.noreply.github.com> Date: Fri, 18 Jul 2025 00:41:32 -0400 Subject: [PATCH] load draft model fix (#7506) --- python/sglang/srt/model_loader/loader.py | 8 +++++++- 1 file changed, 7 insertions(+), 1 deletion(-) diff --git a/python/sglang/srt/model_loader/loader.py b/python/sglang/srt/model_loader/loader.py index 733e6df9e..2e2f71078 100644 --- a/python/sglang/srt/model_loader/loader.py +++ b/python/sglang/srt/model_loader/loader.py @@ -575,7 +575,13 @@ class DummyModelLoader(BaseModelLoader): # 2. Post-processing of weights, including assigning specific member variables. # For `dummy_init`, only the second stage is required. if hasattr(model, "post_load_weights"): - model.post_load_weights() + if ( + model_config.hf_config.architectures[0] + == "DeepseekV3ForCausalLMNextN" + ): + model.post_load_weights(is_nextn=True) + else: + model.post_load_weights() return model.eval()