Add deepseekv3 and llama4

This commit is contained in:
Chranos
2026-02-11 15:09:59 +08:00
parent 45e1fa8bb3
commit 78814aaa68

View File

@@ -21,13 +21,10 @@ def set_default_torch_dtype(dtype: torch.dtype):
 def get_model_architecture(
         model_config: ModelConfig) -> Tuple[Type[nn.Module], str]:
     architectures = getattr(model_config.hf_config, "architectures", None) or []
-    logger.warning("[DEBUG-ARCH] get_model_architecture: "
-                   "type(hf_config)=%s, architectures=%s, "
-                   "id(hf_config)=%s, has_text_config=%s",
-                   type(model_config.hf_config).__name__,
-                   getattr(model_config.hf_config, "architectures", "MISSING"),
-                   id(model_config.hf_config),
-                   hasattr(model_config.hf_config, "text_config"))
+    print(f"[DEBUG-ARCH] get_model_architecture: "
+          f"type(hf_config)={type(model_config.hf_config).__name__}, "
+          f"architectures={getattr(model_config.hf_config, 'architectures', 'MISSING')}, "
+          f"id(hf_config)={id(model_config.hf_config)}")
     # Special handling for quantized Mixtral.
     # FIXME(woosuk): This is a temporary hack.
     mixtral_supported = [