From 92a9d27fb65d2d56f7554bb9909bc90a29096eb5 Mon Sep 17 00:00:00 2001 From: Ubuntu Date: Thu, 18 Apr 2024 17:29:56 +0000 Subject: [PATCH] adding quant config --- quant_config.json | 6 ++++++ 1 file changed, 6 insertions(+) create mode 100644 quant_config.json diff --git a/quant_config.json b/quant_config.json new file mode 100644 index 0000000..4002036 --- /dev/null +++ b/quant_config.json @@ -0,0 +1,6 @@ +{ + "zero_point": true, + "q_group_size": 128, + "w_bit": 4, + "version": "GEMM" +} \ No newline at end of file