feat: update linear deps 1/N (#1305)

This commit is contained in:
Yineng Zhang
2024-09-19 20:53:11 +08:00
committed by GitHub
parent 2cd7e181dd
commit b4408b0d16
33 changed files with 1484 additions and 132 deletions

View File

@@ -31,8 +31,9 @@ from vllm.distributed import (
get_tensor_model_parallel_world_size,
)
from vllm.model_executor.custom_op import CustomOp
-from vllm.model_executor.layers.quantization import QuantizationConfig
-from vllm.model_executor.utils import set_weight_attrs
+from sglang.srt.layers.quantization.base_config import QuantizationConfig
+from sglang.srt.utils import set_weight_attrs
logger = logging.getLogger(__name__)