Support page size > 1 (#4356)
This commit is contained in:
@@ -36,7 +36,7 @@ fp8_type_ = torch.float8_e4m3fnuz if _is_hip else torch.float8_e4m3fn
|
||||
|
||||
_is_cuda = is_cuda()
|
||||
if _is_cuda:
|
||||
import deep_gemm
|
||||
import deep_gemm # `pip install "sgl-kernel>=0.0.4.post3"`
|
||||
from sgl_kernel import sgl_per_token_group_quant_fp8, sgl_per_token_quant_fp8
|
||||
|
||||
logger = logging.getLogger(__name__)
|
||||
|
||||
Reference in New Issue
Block a user