[dev] support AWQ/GPTQ quantization for dense models

This commit is contained in:
Li Wei
2025-12-24 13:45:55 +08:00
parent 75d0bdae2f
commit 6546323c71
5 changed files with 412 additions and 2 deletions

View File

@@ -16,4 +16,6 @@
#
import vllm_kunlun.ops.rotary_embedding
import vllm_kunlun.ops.layernorm
import vllm_kunlun.ops.layernorm
import vllm_kunlun.ops.quantization.awq
import vllm_kunlun.ops.quantization.gptq