Remove qwen2.py and llama.py; fix llama output

This commit is contained in:
hanhaowen
2025-12-31 11:31:26 +08:00
parent b3c30a3cb9
commit b015bb76fd
11 changed files with 65 additions and 1263 deletions

View File

@@ -5,7 +5,6 @@ def register_model():
# from .demo_model import DemoModel # noqa: F401
from .qwen2_vl import Qwen2VLForConditionalGeneration #noqa: F401
from .qwen2_5_vl import Qwen2_5_VLForConditionalGeneration #noqa: F401
from .qwen3 import Qwen3ForCausalLM #noqa: F401
from .qwen3_moe import Qwen3MoeForCausalLM #noqa: F401
from .qwen3_vl import Qwen3VLForConditionalGeneration
from .qwen3_vl_moe import Qwen3VLMoeForConditionalGeneration
@@ -48,11 +47,7 @@ def register_model():
ModelRegistry.register_model(
"InternLM2ForCausalLM",
"vllm_kunlun.models.internlm2:InternLM2ForCausalLM")
ModelRegistry.register_model(
"Qwen2ForCausalLM",
"vllm_kunlun.models.qwen2:Qwen2ForCausalLM")
"vllm_kunlun.models.internlm2:InternLM2ForCausalLM")
ModelRegistry.register_model(
"InternVLChatModel",
@@ -78,10 +73,6 @@ def register_model():
"SeedOssForCausalLM",
"vllm_kunlun.models.seed_oss:SeedOssForCausalLM")
ModelRegistry.register_model(
"LlamaForCausalLM",
"vllm_kunlun.models.llama:LlamaForCausalLM")
ModelRegistry.register_model(
"MiMoV2FlashForCausalLM",
"vllm_kunlun.models.mimo_v2_flash:MiMoV2FlashForCausalLM")