Replace sglang.srt.layers.quantization.scalar_type with sgl_kernel.scalar_type (#8951)
This commit is contained in:
@@ -4,9 +4,9 @@ from typing import Optional
|
||||
import pytest
|
||||
import torch
|
||||
from sgl_kernel import fused_marlin_moe
|
||||
from sgl_kernel.scalar_type import ScalarType, scalar_types
|
||||
|
||||
from sglang.srt.layers.activation import SiluAndMul
|
||||
from sglang.srt.layers.quantization.scalar_type import ScalarType, scalar_types
|
||||
from sglang.test.test_marlin_utils import awq_marlin_quantize, marlin_quantize
|
||||
|
||||
|
||||
|
||||
@@ -10,13 +10,13 @@ from typing import Optional
|
||||
|
||||
import numpy as np
|
||||
import torch
|
||||
from sgl_kernel.scalar_type import ScalarType
|
||||
|
||||
from sglang.srt.layers.quantization.marlin_utils import (
|
||||
GPTQ_MARLIN_TILE,
|
||||
marlin_permute_scales,
|
||||
marlin_zero_points,
|
||||
)
|
||||
from sglang.srt.layers.quantization.scalar_type import ScalarType
|
||||
from sglang.srt.layers.quantization.utils import (
|
||||
get_pack_factor,
|
||||
gptq_quantize_weights,
|
||||
|
||||
Reference in New Issue
Block a user