# xc-llm-kunlun/vllm_kunlun/models/__init__.py

from vllm import ModelRegistry


def register_model():
    """Register the Kunlun model implementations with vLLM's ``ModelRegistry``.

    Every supported architecture name is mapped to a ``"module:ClassName"``
    string pointing into ``vllm_kunlun.models``. Registrations are issued in
    the order listed in ``registrations`` below. Two architecture names may
    share one implementation (``DeepseekV32ForCausalLM`` reuses
    ``DeepseekV3ForCausalLM``).

    Returns:
        None. The only effect is the calls to ``ModelRegistry.register_model``.
    """
    # These imports are not referenced below (hence ``noqa: F401``).
    # NOTE(review): presumably kept for import-time side effects of the model
    # modules -- confirm before removing them.
    from .qwen2_5_vl import Qwen2_5_VLForConditionalGeneration  # noqa: F401
    from .qwen2_vl import Qwen2VLForConditionalGeneration  # noqa: F401
    from .qwen3_moe import Qwen3MoeForCausalLM  # noqa: F401
    from .qwen3_omni_moe_thinker import (  # noqa: F401
        Qwen3OmniMoeThinkerForConditionalGeneration,
    )
    from .qwen3_vl import Qwen3VLForConditionalGeneration  # noqa: F401
    from .qwen3_vl_moe import Qwen3VLMoeForConditionalGeneration  # noqa: F401

    # Currently disabled imports, kept for reference:
    # from .llama4 import Llama4ForCausalLM #noqa: F401
    # from .mllama4 import Llama4ForConditionalGeneration #noqa: F401
    # from .deepseek_v2 import KunlunDeepseekV2MoE

    # (architecture name, "module:ClassName") pairs, in registration order.
    # "GptOssForCausalLM" used to be registered twice with the same target;
    # it is listed once here so the registry is not overwritten redundantly.
    registrations = (
        (
            "Qwen2VLForConditionalGeneration",
            "vllm_kunlun.models.qwen2_vl:Qwen2VLForConditionalGeneration",
        ),
        (
            "Qwen2_5_VLForConditionalGeneration",
            "vllm_kunlun.models.qwen2_5_vl:Qwen2_5_VLForConditionalGeneration",
        ),
        ("Qwen3ForCausalLM", "vllm_kunlun.models.qwen3:Qwen3ForCausalLM"),
        (
            "Qwen3MoeForCausalLM",
            "vllm_kunlun.models.qwen3_moe:Qwen3MoeForCausalLM",
        ),
        (
            "Qwen3NextForCausalLM",
            "vllm_kunlun.models.qwen3_next:Qwen3NextForCausalLM",
        ),
        ("Qwen3NextMTP", "vllm_kunlun.models.qwen3_next_mtp:Qwen3NextMTP"),
        ("GlmForCausalLM", "vllm_kunlun.models.glm:GlmForCausalLM"),
        ("GptOssForCausalLM", "vllm_kunlun.models.gpt_oss:GptOssForCausalLM"),
        (
            "InternLM2ForCausalLM",
            "vllm_kunlun.models.internlm2:InternLM2ForCausalLM",
        ),
        ("InternVLChatModel", "vllm_kunlun.models.internvl:InternVLChatModel"),
        (
            "InternS1ForConditionalGeneration",
            "vllm_kunlun.models.interns1:InternS1ForConditionalGeneration",
        ),
        (
            "Qwen3VLForConditionalGeneration",
            "vllm_kunlun.models.qwen3_vl:Qwen3VLForConditionalGeneration",
        ),
        (
            "Qwen3VLMoeForConditionalGeneration",
            "vllm_kunlun.models.qwen3_vl_moe:Qwen3VLMoeForConditionalGeneration",
        ),
        (
            "Qwen3OmniMoeForConditionalGeneration",
            "vllm_kunlun.models.qwen3_omni_moe_thinker:Qwen3OmniMoeThinkerForConditionalGeneration",
        ),
        ("SeedOssForCausalLM", "vllm_kunlun.models.seed_oss:SeedOssForCausalLM"),
        (
            "MiMoV2FlashForCausalLM",
            "vllm_kunlun.models.mimo_v2_flash:MiMoV2FlashForCausalLM",
        ),
        (
            "DeepseekV3ForCausalLM",
            "vllm_kunlun.models.deepseek_v2:DeepseekV3ForCausalLM",
        ),
        # The V3.2 architecture name maps onto the V3 implementation class.
        (
            "DeepseekV32ForCausalLM",
            "vllm_kunlun.models.deepseek_v2:DeepseekV3ForCausalLM",
        ),
        ("DeepSeekMTPModel", "vllm_kunlun.models.deepseek_mtp:DeepSeekMTP"),
        (
            "GlmMoeDsaForCausalLM",
            "vllm_kunlun.models.deepseek_v2:GlmMoeDsaForCausalLM",
        ),
    )

    for arch_name, target in registrations:
        ModelRegistry.register_model(arch_name, target)


def register_quant_method():
    """Placeholder for quantization-method registration (not implemented yet).

    The function currently performs no work and returns ``None``.
    """
    # TODO: implement the registration logic.
    return None
Initial commit for vLLM-Kunlun Plugin 2025-12-10 12:05:39 +08:00			`from vllm import ModelRegistry`


			`def register_model():`
			`# from .demo_model import DemoModel # noqa: F401`
[Feature] Merge branch 'Qwen3-Next' into main && Support Qwen-next (#222) Signed-off-by: xyDong0223 <dongxinyu03@baidu.com> Co-authored-by: xyDong0223 <dongxinyu03@baidu.com> 2026-02-28 11:15:50 +08:00			`from .qwen2_5_vl import Qwen2_5_VLForConditionalGeneration # noqa: F401`
			`from .qwen2_vl import Qwen2VLForConditionalGeneration # noqa: F401`
			`from .qwen3_moe import Qwen3MoeForCausalLM # noqa: F401`
			`from .qwen3_omni_moe_thinker import ( # noqa: F401`
			`Qwen3OmniMoeThinkerForConditionalGeneration,`
			`)`
			`from .qwen3_vl import Qwen3VLForConditionalGeneration # noqa: F401`
			`from .qwen3_vl_moe import Qwen3VLMoeForConditionalGeneration # noqa: F401`

提交vllm0.11.0开发分支 2025-12-10 17:51:24 +08:00			`# from .llama4 import Llama4ForCausalLM #noqa: F401`
			`# from .mllama4 import Llama4ForConditionalGeneration #noqa: F401`
			`# from .deepseek_v2 import KunlunDeepseekV2MoE`
Initial commit for vLLM-Kunlun Plugin 2025-12-10 12:05:39 +08:00			`# ModelRegistry.register_model(`
			`# "DemoModel",`
			`# "vllm_kunlun.model_executor.models.demo_model:DemoModel")`

			`ModelRegistry.register_model(`
			`"Qwen2VLForConditionalGeneration",`
[Feature] Merge branch 'Qwen3-Next' into main && Support Qwen-next (#222) Signed-off-by: xyDong0223 <dongxinyu03@baidu.com> Co-authored-by: xyDong0223 <dongxinyu03@baidu.com> 2026-02-28 11:15:50 +08:00			`"vllm_kunlun.models.qwen2_vl:Qwen2VLForConditionalGeneration",`
			`)`
Initial commit for vLLM-Kunlun Plugin 2025-12-10 12:05:39 +08:00
			`ModelRegistry.register_model(`
			`"Qwen2_5_VLForConditionalGeneration",`
[Feature] Merge branch 'Qwen3-Next' into main && Support Qwen-next (#222) Signed-off-by: xyDong0223 <dongxinyu03@baidu.com> Co-authored-by: xyDong0223 <dongxinyu03@baidu.com> 2026-02-28 11:15:50 +08:00			`"vllm_kunlun.models.qwen2_5_vl:Qwen2_5_VLForConditionalGeneration",`
			`)`

			`ModelRegistry.register_model(`
			`"Qwen3ForCausalLM", "vllm_kunlun.models.qwen3:Qwen3ForCausalLM"`
			`)`

			`ModelRegistry.register_model(`
			`"Qwen3MoeForCausalLM", "vllm_kunlun.models.qwen3_moe:Qwen3MoeForCausalLM"`
			`)`
Initial commit for vLLM-Kunlun Plugin 2025-12-10 12:05:39 +08:00
			`ModelRegistry.register_model(`
[Feature] Merge branch 'Qwen3-Next' into main && Support Qwen-next (#222) Signed-off-by: xyDong0223 <dongxinyu03@baidu.com> Co-authored-by: xyDong0223 <dongxinyu03@baidu.com> 2026-02-28 11:15:50 +08:00			`"Qwen3NextForCausalLM", "vllm_kunlun.models.qwen3_next:Qwen3NextForCausalLM"`
			`)`
Initial commit for vLLM-Kunlun Plugin 2025-12-10 12:05:39 +08:00
			`ModelRegistry.register_model(`
[Feature] Merge branch 'Qwen3-Next' into main && Support Qwen-next (#222) Signed-off-by: xyDong0223 <dongxinyu03@baidu.com> Co-authored-by: xyDong0223 <dongxinyu03@baidu.com> 2026-02-28 11:15:50 +08:00			`"Qwen3NextMTP", "vllm_kunlun.models.qwen3_next_mtp:Qwen3NextMTP"`
			`)`
提交vllm0.11.0开发分支 2025-12-10 17:51:24 +08:00
			`ModelRegistry.register_model(`
[Feature] Merge branch 'Qwen3-Next' into main && Support Qwen-next (#222) Signed-off-by: xyDong0223 <dongxinyu03@baidu.com> Co-authored-by: xyDong0223 <dongxinyu03@baidu.com> 2026-02-28 11:15:50 +08:00			`"GlmForCausalLM", "vllm_kunlun.models.glm:GlmForCausalLM"`
			`)`
Initial commit for vLLM-Kunlun Plugin 2025-12-10 12:05:39 +08:00
			`ModelRegistry.register_model(`
[Feature] Merge branch 'Qwen3-Next' into main && Support Qwen-next (#222) Signed-off-by: xyDong0223 <dongxinyu03@baidu.com> Co-authored-by: xyDong0223 <dongxinyu03@baidu.com> 2026-02-28 11:15:50 +08:00			`"GptOssForCausalLM", "vllm_kunlun.models.gpt_oss:GptOssForCausalLM"`
			`)`
提交vllm0.11.0开发分支 2025-12-10 17:51:24 +08:00
Initial commit for vLLM-Kunlun Plugin 2025-12-10 12:05:39 +08:00			`ModelRegistry.register_model(`
[Feature] Merge branch 'Qwen3-Next' into main && Support Qwen-next (#222) Signed-off-by: xyDong0223 <dongxinyu03@baidu.com> Co-authored-by: xyDong0223 <dongxinyu03@baidu.com> 2026-02-28 11:15:50 +08:00			`"InternLM2ForCausalLM", "vllm_kunlun.models.internlm2:InternLM2ForCausalLM"`
			`)`

Initial commit for vLLM-Kunlun Plugin 2025-12-10 12:05:39 +08:00			`ModelRegistry.register_model(`
[Feature] Merge branch 'Qwen3-Next' into main && Support Qwen-next (#222) Signed-off-by: xyDong0223 <dongxinyu03@baidu.com> Co-authored-by: xyDong0223 <dongxinyu03@baidu.com> 2026-02-28 11:15:50 +08:00			`"InternVLChatModel", "vllm_kunlun.models.internvl:InternVLChatModel"`
			`)`
Initial commit for vLLM-Kunlun Plugin 2025-12-10 12:05:39 +08:00
			`ModelRegistry.register_model(`
			`"InternS1ForConditionalGeneration",`
[Feature] Merge branch 'Qwen3-Next' into main && Support Qwen-next (#222) Signed-off-by: xyDong0223 <dongxinyu03@baidu.com> Co-authored-by: xyDong0223 <dongxinyu03@baidu.com> 2026-02-28 11:15:50 +08:00			`"vllm_kunlun.models.interns1:InternS1ForConditionalGeneration",`
			`)`

Initial commit for vLLM-Kunlun Plugin 2025-12-10 12:05:39 +08:00			`ModelRegistry.register_model(`
提交vllm0.11.0开发分支 2025-12-10 17:51:24 +08:00			`"Qwen3VLForConditionalGeneration",`
[Feature] Merge branch 'Qwen3-Next' into main && Support Qwen-next (#222) Signed-off-by: xyDong0223 <dongxinyu03@baidu.com> Co-authored-by: xyDong0223 <dongxinyu03@baidu.com> 2026-02-28 11:15:50 +08:00			`"vllm_kunlun.models.qwen3_vl:Qwen3VLForConditionalGeneration",`
			`)`

Initial commit for vLLM-Kunlun Plugin 2025-12-10 12:05:39 +08:00			`ModelRegistry.register_model(`
提交vllm0.11.0开发分支 2025-12-10 17:51:24 +08:00			`"Qwen3VLMoeForConditionalGeneration",`
[Feature] Merge branch 'Qwen3-Next' into main && Support Qwen-next (#222) Signed-off-by: xyDong0223 <dongxinyu03@baidu.com> Co-authored-by: xyDong0223 <dongxinyu03@baidu.com> 2026-02-28 11:15:50 +08:00			`"vllm_kunlun.models.qwen3_vl_moe:Qwen3VLMoeForConditionalGeneration",`
			`)`
提交vllm0.11.0开发分支 2025-12-10 17:51:24 +08:00
			`ModelRegistry.register_model(`
			`"Qwen3OmniMoeForConditionalGeneration",`
[Feature] Merge branch 'Qwen3-Next' into main && Support Qwen-next (#222) Signed-off-by: xyDong0223 <dongxinyu03@baidu.com> Co-authored-by: xyDong0223 <dongxinyu03@baidu.com> 2026-02-28 11:15:50 +08:00			`"vllm_kunlun.models.qwen3_omni_moe_thinker:Qwen3OmniMoeThinkerForConditionalGeneration",`
			`)`
Initial commit for vLLM-Kunlun Plugin 2025-12-10 12:05:39 +08:00
			`ModelRegistry.register_model(`
[Feature] Merge branch 'Qwen3-Next' into main && Support Qwen-next (#222) Signed-off-by: xyDong0223 <dongxinyu03@baidu.com> Co-authored-by: xyDong0223 <dongxinyu03@baidu.com> 2026-02-28 11:15:50 +08:00			`"SeedOssForCausalLM", "vllm_kunlun.models.seed_oss:SeedOssForCausalLM"`
			`)`
Initial commit for vLLM-Kunlun Plugin 2025-12-10 12:05:39 +08:00
[Feature] Support XiaoMi MIMO Flash V2 (#62) * [Feature] Support MIMO Flash V2 2025-12-31 10:16:33 +08:00			`ModelRegistry.register_model(`
			`"MiMoV2FlashForCausalLM",`
[Feature] Merge branch 'Qwen3-Next' into main && Support Qwen-next (#222) Signed-off-by: xyDong0223 <dongxinyu03@baidu.com> Co-authored-by: xyDong0223 <dongxinyu03@baidu.com> 2026-02-28 11:15:50 +08:00			`"vllm_kunlun.models.mimo_v2_flash:MiMoV2FlashForCausalLM",`
			`)`
[Feature] Support gpt-oss and update model list (#71) * [Docs] Update Support Models * [Feature] Support gpt-oss * [Docs] fix model support list * Fix Moe * Fix * Fix moe_ep * remove gpt oss graph support , not yet --------- Co-authored-by: hanhaowen <hanhaowen@baidu.com> 2026-01-04 21:19:49 +08:00
			`ModelRegistry.register_model(`
[Feature] Merge branch 'Qwen3-Next' into main && Support Qwen-next (#222) Signed-off-by: xyDong0223 <dongxinyu03@baidu.com> Co-authored-by: xyDong0223 <dongxinyu03@baidu.com> 2026-02-28 11:15:50 +08:00			`"GptOssForCausalLM", "vllm_kunlun.models.gpt_oss:GptOssForCausalLM"`
			`)`
[Feature] support deepseek v3/r1/v3.2 (#78) * [Feature] support deepseek v3/r1/v3.2 * fix gpt_oss * update readme * update readme --------- Co-authored-by: hanhaowen <hanhaowen@baidu.com> 2026-01-05 22:55:35 +08:00
			`ModelRegistry.register_model(`
[Feature] Merge branch 'Qwen3-Next' into main && Support Qwen-next (#222) Signed-off-by: xyDong0223 <dongxinyu03@baidu.com> Co-authored-by: xyDong0223 <dongxinyu03@baidu.com> 2026-02-28 11:15:50 +08:00			`"DeepseekV3ForCausalLM", "vllm_kunlun.models.deepseek_v2:DeepseekV3ForCausalLM"`
			`)`
[Feature] support deepseek v3/r1/v3.2 (#78) * [Feature] support deepseek v3/r1/v3.2 * fix gpt_oss * update readme * update readme --------- Co-authored-by: hanhaowen <hanhaowen@baidu.com> 2026-01-05 22:55:35 +08:00
			`ModelRegistry.register_model(`
[Feature] Merge branch 'Qwen3-Next' into main && Support Qwen-next (#222) Signed-off-by: xyDong0223 <dongxinyu03@baidu.com> Co-authored-by: xyDong0223 <dongxinyu03@baidu.com> 2026-02-28 11:15:50 +08:00			`"DeepseekV32ForCausalLM", "vllm_kunlun.models.deepseek_v2:DeepseekV3ForCausalLM"`
			`)`

[Feature] DeepSeek Support MTP 2026-01-06 21:37:21 +08:00			`ModelRegistry.register_model(`
[Feature] Merge branch 'Qwen3-Next' into main && Support Qwen-next (#222) Signed-off-by: xyDong0223 <dongxinyu03@baidu.com> Co-authored-by: xyDong0223 <dongxinyu03@baidu.com> 2026-02-28 11:15:50 +08:00			`"DeepSeekMTPModel", "vllm_kunlun.models.deepseek_mtp:DeepSeekMTP"`
			`)`
[Feature] support deepseek v3/r1/v3.2 (#78) * [Feature] support deepseek v3/r1/v3.2 * fix gpt_oss * update readme * update readme --------- Co-authored-by: hanhaowen <hanhaowen@baidu.com> 2026-01-05 22:55:35 +08:00
[Feature] Support glmx (#194) Signed-off-by: Li Wei <liwei.109@outlook.com> Co-authored-by: tangshiwen <tangshiwen@baidu.com> Co-authored-by: Xinyu Dong <dongxinyu03@baidu.com> 2026-02-12 15:40:42 +08:00			`ModelRegistry.register_model(`
[Feature] Merge branch 'Qwen3-Next' into main && Support Qwen-next (#222) Signed-off-by: xyDong0223 <dongxinyu03@baidu.com> Co-authored-by: xyDong0223 <dongxinyu03@baidu.com> 2026-02-28 11:15:50 +08:00			`"GlmMoeDsaForCausalLM", "vllm_kunlun.models.deepseek_v2:GlmMoeDsaForCausalLM"`
			`)`

[Feature] Support glmx (#194) Signed-off-by: Li Wei <liwei.109@outlook.com> Co-authored-by: tangshiwen <tangshiwen@baidu.com> Co-authored-by: Xinyu Dong <dongxinyu03@baidu.com> 2026-02-12 15:40:42 +08:00
Initial commit for vLLM-Kunlun Plugin 2025-12-10 12:05:39 +08:00			`def register_quant_method():`
[Model] registry llama.py to vLLM 2025-12-15 21:21:28 +08:00			`"""to do"""`