fix compressed tensors WNA16 imports (#8142)

This commit is contained in:
Enrique Shockwave
2025-07-18 19:34:14 +01:00
committed by GitHub
parent 719b29f218
commit fd63b62eaa

View File

@@ -40,7 +40,10 @@ from sglang.srt.layers.quantization.compressed_tensors.utils import (
from sglang.srt.layers.quantization.unquant import UnquantizedLinearMethod
try:
import vllm
from vllm.model_executor.layers.quantization.compressed_tensors.schemes.compressed_tensors_wNa16 import (
WNA16_SUPPORTED_BITS,
CompressedTensorsWNA16,
)
VLLM_AVAILABLE = True
except ImportError: