fix compressed tensors WNA16 imports (#8142)
This commit is contained in:
Committed by GitHub
Parent: 719b29f218 · Commit: fd63b62eaa
@@ -40,7 +40,10 @@ from sglang.srt.layers.quantization.compressed_tensors.utils import (
 from sglang.srt.layers.quantization.unquant import UnquantizedLinearMethod
 
 try:
-    import vllm
+    from vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_wNa16 import (
+        WNA16_SUPPORTED_BITS,
+        CompressedTensorsWNA16,
+    )
 
     VLLM_AVAILABLE = True
 except ImportError:
Reference in New Issue
Block a user