2025-03-07 15:41:47 +08:00
|
|
|
from vllm import ModelRegistry
|
|
|
|
|
|
2025-08-14 09:33:39 +08:00
|
|
|
import vllm_ascend.envs as envs_ascend
|
2025-06-07 16:46:58 +08:00
|
|
|
|
2025-03-07 15:41:47 +08:00
|
|
|
|
|
|
|
|
def register_model():
    """Register the Ascend model implementations with vLLM's ``ModelRegistry``.

    Each registration maps an architecture name to a lazy
    ``"module.path:ClassName"`` target string. Two environment switches
    read from ``vllm_ascend.envs`` choose between alternative targets:

    * ``USE_OPTIMIZED_MODEL`` selects which Qwen2.5-VL implementation is
      registered (``qwen2_5_vl`` when truthy, otherwise
      ``qwen2_5_vl_without_padding``).
    * ``VLLM_ASCEND_ENABLE_DBO`` selects the DeepSeek V2/V3 implementation
      (the shared ``deepseek_dbo`` class when truthy, otherwise the
      dedicated ``deepseek_v2`` / ``deepseek_v3`` classes).

    The function takes no arguments and returns ``None``.
    """
    # These names are not used below; the imports run the modules eagerly.
    # NOTE(review): presumably this is to surface import errors at
    # registration time -- confirm before removing any of them.
    from .deepseek_dbo import CustomDeepseekDBOForCausalLM  # noqa: F401
    from .deepseek_mtp import CustomDeepSeekMTP  # noqa: F401
    from .deepseek_v2 import CustomDeepseekV2ForCausalLM  # noqa: F401
    from .deepseek_v3 import CustomDeepseekV3ForCausalLM  # noqa: F401
    from .qwen2_5_vl import (  # noqa: F401
        AscendQwen2_5_VLForConditionalGeneration,
    )
    from .qwen2_vl import AscendQwen2VLForConditionalGeneration  # noqa: F401
    from .qwen3 import CustomQwen3ForCausalLM  # noqa: F401

    register = ModelRegistry.register_model

    # Unconditional registrations.
    register(
        "DeepSeekMTPModel",
        "vllm_ascend.models.deepseek_mtp:CustomDeepSeekMTP",
    )
    register(
        "Qwen2VLForConditionalGeneration",
        "vllm_ascend.models.qwen2_vl:AscendQwen2VLForConditionalGeneration",
    )

    # Qwen2.5-VL: one architecture name, two candidate implementations.
    if envs_ascend.USE_OPTIMIZED_MODEL:
        qwen2_5_vl_target = "vllm_ascend.models.qwen2_5_vl:AscendQwen2_5_VLForConditionalGeneration"
    else:
        qwen2_5_vl_target = "vllm_ascend.models.qwen2_5_vl_without_padding:AscendQwen2_5_VLForConditionalGeneration_Without_Padding"
    register("Qwen2_5_VLForConditionalGeneration", qwen2_5_vl_target)

    # DeepSeek V2/V3: with DBO enabled both architectures share one class;
    # otherwise each architecture gets its own implementation.
    if envs_ascend.VLLM_ASCEND_ENABLE_DBO:
        deepseek_v2_target = "vllm_ascend.models.deepseek_dbo:CustomDeepseekDBOForCausalLM"
        deepseek_v3_target = "vllm_ascend.models.deepseek_dbo:CustomDeepseekDBOForCausalLM"
    else:
        deepseek_v2_target = "vllm_ascend.models.deepseek_v2:CustomDeepseekV2ForCausalLM"
        deepseek_v3_target = "vllm_ascend.models.deepseek_v3:CustomDeepseekV3ForCausalLM"
    register("DeepseekV2ForCausalLM", deepseek_v2_target)
    register("DeepseekV3ForCausalLM", deepseek_v3_target)

    # Remaining unconditional registrations, in their original order.
    register(
        "Qwen3MoeForCausalLM",
        "vllm_ascend.models.qwen3_moe:CustomQwen3MoeForCausalLM",
    )
    register(
        "Qwen3ForCausalLM",
        "vllm_ascend.models.qwen3:CustomQwen3ForCausalLM",
    )
    register(
        "PanguProMoEForCausalLM",
        "vllm_ascend.models.pangu_moe:PanguProMoEForCausalLM",
    )
|