Fix DeepSeek-v3.2 default config (ValueError: not enough values to unpack (expected 4, got 3)) (#11557)

This commit is contained in:
Trevor Morris
2025-10-13 11:27:40 -07:00
committed by GitHub
parent b6fb5d7666
commit c9cff2b984

View File

@@ -804,7 +804,7 @@ class ServerArgs:
hf_config = self.get_hf_config()
model_arch = hf_config.architectures[0]
-if model_arch in ["DeepseekV3ForCausalLM"]:
+if model_arch in ["DeepseekV3ForCausalLM"] and not is_deepseek_nsa(hf_config):
if is_cuda() and is_sm100_supported():
if (
self.attention_backend is None