Initial commit for vLLM-Kunlun Plugin
This commit is contained in:
68
vllm_kunlun/models/__init__.py
Normal file
68
vllm_kunlun/models/__init__.py
Normal file
@@ -0,0 +1,68 @@
|
||||
from vllm import ModelRegistry
|
||||
|
||||
|
||||
def register_model():
    """Register the Kunlun model implementations with vLLM's ModelRegistry.

    Every architecture name listed below is registered against a
    ``"module.path:ClassName"`` string that points into ``vllm_kunlun.models``.
    Entries are registered in the order they appear in the table.
    """
    # These modules are imported before any registration takes place. The
    # imported names are intentionally unused (hence the F401 suppressions).
    # NOTE(review): presumably kept for their import-time effects -- confirm
    # before removing.
    from .qwen2_vl import Qwen2VLForConditionalGeneration  # noqa: F401
    from .qwen2_5_vl import Qwen2_5_VLForConditionalGeneration  # noqa: F401
    from .qwen3 import Qwen3ForCausalLM  # noqa: F401
    from .qwen3_moe import Qwen3MoeForCausalLM  # noqa: F401

    # (architecture name, "module:Class" target) pairs, in registration order.
    kunlun_models = (
        (
            "Qwen2VLForConditionalGeneration",
            "vllm_kunlun.models.qwen2_vl:Qwen2VLForConditionalGeneration",
        ),
        (
            "Qwen2_5_VLForConditionalGeneration",
            "vllm_kunlun.models.qwen2_5_vl:Qwen2_5_VLForConditionalGeneration",
        ),
        (
            "Qwen3ForCausalLM",
            "vllm_kunlun.models.qwen3:Qwen3ForCausalLM",
        ),
        (
            "Qwen3MoeForCausalLM",
            "vllm_kunlun.models.qwen3_moe:Qwen3MoeForCausalLM",
        ),
        (
            "GlmForCausalLM",
            "vllm_kunlun.models.glm:GlmForCausalLM",
        ),
        (
            "GptOssForCausalLM",
            "vllm_kunlun.models.gpt_oss:GptOssForCausalLM",
        ),
        (
            "InternLM2ForCausalLM",
            "vllm_kunlun.models.internlm2:InternLM2ForCausalLM",
        ),
        (
            "Qwen2ForCausalLM",
            "vllm_kunlun.models.qwen2:Qwen2ForCausalLM",
        ),
        (
            "InternVLChatModel",
            "vllm_kunlun.models.internvl:InternVLChatModel",
        ),
        (
            "InternS1ForConditionalGeneration",
            "vllm_kunlun.models.interns1:InternS1ForConditionalGeneration",
        ),
        (
            "Glm4MoeForCausalLM",
            "vllm_kunlun.models.glm4_moe:Glm4MoeForCausalLM",
        ),
        (
            "Glm4ForCausalLM",
            "vllm_kunlun.models.glm4:Glm4ForCausalLM",
        ),
        (
            "Glm4vForConditionalGeneration",
            "vllm_kunlun.models.glm4_1v:Glm4vForConditionalGeneration",
        ),
    )

    for arch_name, class_path in kunlun_models:
        ModelRegistry.register_model(arch_name, class_path)
|
||||
|
||||
|
||||
def register_quant_method():
    """Placeholder hook for registering quantization methods.

    Not implemented yet (TODO): the function currently performs no work
    and returns ``None``.
    """
    return None
|
||||
Reference in New Issue
Block a user