Update for Transformers AWQ support
This commit is contained in:
committed by
huggingface-web
parent
6ac73a5842
commit
9be86ac7e8
@@ -20,5 +20,12 @@
|
|||||||
"transformers_version": "4.30.2",
|
"transformers_version": "4.30.2",
|
||||||
"use_cache": true,
|
"use_cache": true,
|
||||||
"vocab_size": 32000,
|
"vocab_size": 32000,
|
||||||
"pretraining_tp": 1
|
"pretraining_tp": 1,
|
||||||
|
"quantization_config": {
|
||||||
|
"quant_method": "awq",
|
||||||
|
"zero_point": true,
|
||||||
|
"group_size": 128,
|
||||||
|
"bits": 4,
|
||||||
|
"version": "gemm"
|
||||||
|
}
|
||||||
}
|
}
|
||||||
Reference in New Issue
Block a user