fix awq_dequantize import (#5669)

This commit is contained in:
Yineng Zhang
2025-04-23 01:36:26 -07:00
committed by GitHub
parent 15fabcc07f
commit fbb5f229d4

View File

@@ -3,7 +3,6 @@ import logging
from typing import Any, Dict, List, Optional
import torch
from sgl_kernel import awq_dequantize
from sglang.srt.layers.linear import (
LinearBase,
@@ -12,6 +11,11 @@ from sglang.srt.layers.linear import (
)
from sglang.srt.layers.parameter import GroupQuantScaleParameter, PackedvLLMParameter
from sglang.srt.layers.quantization.base_config import QuantizationConfig
from sglang.srt.utils import is_cuda
# Evaluate the platform check once, at import time, and keep the result in a
# module-level flag.
_is_cuda = is_cuda()

# Bind the sgl_kernel op only when the CUDA check passes, so importing this
# module no longer requires `sgl_kernel.awq_dequantize` unconditionally.
# NOTE(review): when the check is false, these lines do not bind
# `awq_dequantize` at all, so any caller must only reference it on the CUDA
# path -- confirm against the rest of the file.
if _is_cuda:
    from sgl_kernel import awq_dequantize

logger = logging.getLogger(__name__)