[dev] support AWQ/GPTQ quantization for dense models
This commit is contained in:
@@ -16,4 +16,6 @@
|
||||
#
|
||||
|
||||
import vllm_kunlun.ops.rotary_embedding
|
||||
import vllm_kunlun.ops.layernorm
|
||||
import vllm_kunlun.ops.layernorm
|
||||
import vllm_kunlun.ops.quantization.awq
|
||||
import vllm_kunlun.ops.quantization.gptq
|
||||
Reference in New Issue
Block a user