Revert "[XPU][CPU] Enable the native path of DeepSeek" (#4367)

This commit is contained in:
Lianmin Zheng
2025-03-12 23:45:52 -07:00
committed by GitHub
parent 71046fcd71
commit 45de89719c
16 changed files with 221 additions and 499 deletions

View File

@@ -108,25 +108,15 @@ def _get_quantization_config(
quant_config = get_quant_config(model_config, load_config)
major, minor = get_device_capability()
if not hasattr(quant_config, "get_availability"):
# Update vLLM to support get_availability
if major is not None and minor is not None:
assert 0 <= minor < 10
capability = major * 10 + minor
if capability < quant_config.get_min_capability():
raise ValueError(
f"The quantization method {model_config.quantization} "
"is not supported for the current GPU. "
f"Minimum capability: {quant_config.get_min_capability()}. "
f"Current capability: {capability}."
)
else:
if not quant_config.get_availability():
if major is not None and minor is not None:
assert 0 <= minor < 10
capability = major * 10 + minor
if capability < quant_config.get_min_capability():
raise ValueError(
f"The quantization method {model_config.quantization} "
"is not supported for the current GPU. "
f"Minimum capability: {quant_config.get_min_capability()}. "
f"Current capability: {major, minor}."
f"Current capability: {capability}."
)
supported_dtypes = quant_config.get_supported_act_dtypes()
if model_config.dtype not in supported_dtypes: