fix compressed tensors WNA16 imports (#8142)
This commit is contained in:
committed by
GitHub
parent
719b29f218
commit
fd63b62eaa
@@ -40,7 +40,10 @@ from sglang.srt.layers.quantization.compressed_tensors.utils import (
|
||||
from sglang.srt.layers.quantization.unquant import UnquantizedLinearMethod
|
||||
|
||||
try:
|
||||
import vllm
|
||||
from vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_wNa16 import (
|
||||
WNA16_SUPPORTED_BITS,
|
||||
CompressedTensorsWNA16,
|
||||
)
|
||||
|
||||
VLLM_AVAILABLE = True
|
||||
except ImportError:
|
||||
|
||||
Reference in New Issue
Block a user