Revert "[XPU][CPU] Enable the native path of DeepSeek" (#4367)

This commit is contained in:
Lianmin Zheng
2025-03-12 23:45:52 -07:00
committed by GitHub
parent 71046fcd71
commit 45de89719c
16 changed files with 221 additions and 499 deletions

View File

@@ -1,5 +1,4 @@
import logging
import sys
from fractions import Fraction
from typing import Any, Dict, List, Optional, Union
@@ -9,7 +8,6 @@ from vllm.scalar_type import scalar_types
from sglang.srt.layers.linear import LinearBase
from sglang.srt.layers.quantization.base_config import QuantizationConfig
from sglang.srt.layers.vocab_parallel_embedding import ParallelLMHead
from sglang.srt.utils import get_device_capability
logger = logging.getLogger(__name__)
@@ -92,20 +90,7 @@ class GPTQConfig(QuantizationConfig):
@classmethod
# Need to figure it out
def get_min_capability(cls) -> int:
    """Return the minimum device capability accepted by this config.

    Returns:
        ``60`` when ``torch.cuda`` exists and reports an available device,
        ``sys.maxsize`` otherwise.
    """
    cuda_ready = hasattr(torch, "cuda") and torch.cuda.is_available()
    # Vendors can update: without CUDA the threshold is sys.maxsize.
    # NOTE(review): presumably so that no device capability can satisfy it
    # until a vendor supplies a real value -- confirm against the caller.
    return 60 if cuda_ready else sys.maxsize
@classmethod
def get_availability(cls) -> bool:
    """Report whether the current device can run this quantization method.

    Returns:
        ``True`` only when CUDA is available and the device capability,
        encoded as ``major * 10 + minor``, is at least 60; ``False``
        otherwise.
    """
    if not (hasattr(torch, "cuda") and torch.cuda.is_available()):
        # Vendors can update
        return False

    # Query the capability only once CUDA is confirmed, so non-CUDA devices
    # never depend on what get_device_capability() returns for them.
    major, minor = get_device_capability()
    # Inclusive comparison: a device sitting exactly at the minimum
    # capability (60, as reported by get_min_capability) must qualify.
    return major * 10 + minor >= 60
return 60
@classmethod
def get_config_filenames(cls) -> List[str]:
@@ -224,20 +209,7 @@ class GPTQMarlinConfig(QuantizationConfig):
@classmethod
def get_min_capability(cls) -> int:
    """Return the minimum device capability accepted by this config.

    Returns:
        ``80`` when ``torch.cuda`` exists and reports an available device,
        ``sys.maxsize`` otherwise.
    """
    has_cuda = hasattr(torch, "cuda") and torch.cuda.is_available()
    if not has_cuda:
        # Vendors can update
        # NOTE(review): sys.maxsize presumably acts as an unreachable
        # threshold for non-CUDA devices -- confirm against the caller.
        return sys.maxsize
    return 80
@classmethod
def get_availability(cls) -> bool:
    """Report whether the current device can run this quantization method.

    Returns:
        ``True`` only when CUDA is available and the device capability,
        encoded as ``major * 10 + minor``, is at least 80; ``False``
        otherwise.
    """
    if not (hasattr(torch, "cuda") and torch.cuda.is_available()):
        # Vendors can update
        return False

    # Query the capability only once CUDA is confirmed, so non-CUDA devices
    # never depend on what get_device_capability() returns for them.
    major, minor = get_device_capability()
    # Inclusive comparison: a device sitting exactly at the minimum
    # capability (80, as reported by get_min_capability) must qualify.
    return major * 10 + minor >= 80
return 80
@classmethod
def get_config_filenames(cls) -> List[str]:
@@ -399,20 +371,7 @@ class MarlinConfig(QuantizationConfig):
@classmethod
# Need to figure it out
def get_min_capability(cls) -> int:
    """Return the minimum device capability accepted by this config.

    Returns:
        ``80`` when ``torch.cuda`` exists and reports an available device,
        ``sys.maxsize`` otherwise.
    """
    # Vendors can update: the fallback applies whenever CUDA is unusable.
    # NOTE(review): sys.maxsize presumably marks "no supported device yet"
    # for other backends -- confirm against the caller.
    threshold = sys.maxsize
    if hasattr(torch, "cuda") and torch.cuda.is_available():
        threshold = 80
    return threshold
@classmethod
def get_availability(cls) -> bool:
    """Report whether the current device can run this quantization method.

    Returns:
        ``True`` only when CUDA is available and the device capability,
        encoded as ``major * 10 + minor``, is at least 80; ``False``
        otherwise.
    """
    if not (hasattr(torch, "cuda") and torch.cuda.is_available()):
        # Vendors can update
        return False

    # Query the capability only once CUDA is confirmed, so non-CUDA devices
    # never depend on what get_device_capability() returns for them.
    major, minor = get_device_capability()
    # Inclusive comparison: a device sitting exactly at the minimum
    # capability (80, as reported by get_min_capability) must qualify.
    return major * 10 + minor >= 80
return 80
@classmethod
def get_config_filenames(cls) -> List[str]: