Update for Transformers AWQ support

This commit is contained in:
Tom Jobbins
2023-11-09 18:20:20 +00:00
committed by huggingface-web
parent 6ac73a5842
commit 9be86ac7e8

View File

@@ -20,5 +20,12 @@
"transformers_version": "4.30.2", "transformers_version": "4.30.2",
"use_cache": true, "use_cache": true,
"vocab_size": 32000, "vocab_size": 32000,
"pretraining_tp": 1 "pretraining_tp": 1,
"quantization_config": {
"quant_method": "awq",
"zero_point": true,
"group_size": 128,
"bits": 4,
"version": "gemm"
}
} }