From 451ffe74d9071a2f67194e2497152643b0b809b0 Mon Sep 17 00:00:00 2001 From: Pan Lyu Date: Mon, 9 Jun 2025 16:32:49 +0800 Subject: [PATCH] support qwen3 embedding (#6990) --- python/sglang/srt/models/qwen3.py | 2 ++ test/srt/models/test_embedding_models.py | 1 + 2 files changed, 3 insertions(+) diff --git a/python/sglang/srt/models/qwen3.py b/python/sglang/srt/models/qwen3.py index de7db4c32..ae7bbfd4c 100644 --- a/python/sglang/srt/models/qwen3.py +++ b/python/sglang/srt/models/qwen3.py @@ -333,6 +333,8 @@ class Qwen3ForCausalLM(nn.Module): params_dict = dict(self.named_parameters()) for name, loaded_weight in weights: + if "Embedding" in self.config.name_or_path: + name = add_prefix(name, "model") layer_id = get_layer_id(name) if ( layer_id is not None diff --git a/test/srt/models/test_embedding_models.py b/test/srt/models/test_embedding_models.py index 069f69c34..b56e952d7 100644 --- a/test/srt/models/test_embedding_models.py +++ b/test/srt/models/test_embedding_models.py @@ -26,6 +26,7 @@ MODELS = [ ("Alibaba-NLP/gte-Qwen2-1.5B-instruct", 1, 1e-5), ("intfloat/e5-mistral-7b-instruct", 1, 1e-5), ("marco/mcdse-2b-v1", 1, 1e-5), + ("Qwen/Qwen3-Embedding-8B", 1, 1e-5), # Temporarily disable before this model is fixed # ("jason9693/Qwen2.5-1.5B-apeach", 1, 1e-5), ]