Support Qwen3 embedding (#6990)
This commit is contained in:
@@ -333,6 +333,8 @@ class Qwen3ForCausalLM(nn.Module):
|
|||||||
|
|
||||||
params_dict = dict(self.named_parameters())
|
params_dict = dict(self.named_parameters())
|
||||||
for name, loaded_weight in weights:
|
for name, loaded_weight in weights:
|
||||||
|
if "Embedding" in self.config.name_or_path:
|
||||||
|
name = add_prefix(name, "model")
|
||||||
layer_id = get_layer_id(name)
|
layer_id = get_layer_id(name)
|
||||||
if (
|
if (
|
||||||
layer_id is not None
|
layer_id is not None
|
||||||
|
|||||||
@@ -26,6 +26,7 @@ MODELS = [
|
|||||||
("Alibaba-NLP/gte-Qwen2-1.5B-instruct", 1, 1e-5),
|
("Alibaba-NLP/gte-Qwen2-1.5B-instruct", 1, 1e-5),
|
||||||
("intfloat/e5-mistral-7b-instruct", 1, 1e-5),
|
("intfloat/e5-mistral-7b-instruct", 1, 1e-5),
|
||||||
("marco/mcdse-2b-v1", 1, 1e-5),
|
("marco/mcdse-2b-v1", 1, 1e-5),
|
||||||
|
("Qwen/Qwen3-Embedding-8B", 1, 1e-5),
|
||||||
# Temporarily disable before this model is fixed
|
# Temporarily disable before this model is fixed
|
||||||
# ("jason9693/Qwen2.5-1.5B-apeach", 1, 1e-5),
|
# ("jason9693/Qwen2.5-1.5B-apeach", 1, 1e-5),
|
||||||
]
|
]
|
||||||
|
|||||||
Reference in New Issue
Block a user