From 1182609f828467311ee255b224a209aad8aa974c Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Tue, 21 Apr 2026 21:27:36 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mradermacher/AceInstruct-1.5B-i1-GGUF Source: Original Platform --- .gitattributes | 60 +++++++++++++++++++++++ AceInstruct-1.5B.i1-IQ1_M.gguf | 3 ++ AceInstruct-1.5B.i1-IQ1_S.gguf | 3 ++ AceInstruct-1.5B.i1-IQ2_M.gguf | 3 ++ AceInstruct-1.5B.i1-IQ2_S.gguf | 3 ++ AceInstruct-1.5B.i1-IQ2_XS.gguf | 3 ++ AceInstruct-1.5B.i1-IQ2_XXS.gguf | 3 ++ AceInstruct-1.5B.i1-IQ3_M.gguf | 3 ++ AceInstruct-1.5B.i1-IQ3_S.gguf | 3 ++ AceInstruct-1.5B.i1-IQ3_XS.gguf | 3 ++ AceInstruct-1.5B.i1-IQ3_XXS.gguf | 3 ++ AceInstruct-1.5B.i1-IQ4_NL.gguf | 3 ++ AceInstruct-1.5B.i1-IQ4_XS.gguf | 3 ++ AceInstruct-1.5B.i1-Q2_K.gguf | 3 ++ AceInstruct-1.5B.i1-Q2_K_S.gguf | 3 ++ AceInstruct-1.5B.i1-Q3_K_L.gguf | 3 ++ AceInstruct-1.5B.i1-Q3_K_M.gguf | 3 ++ AceInstruct-1.5B.i1-Q3_K_S.gguf | 3 ++ AceInstruct-1.5B.i1-Q4_0.gguf | 3 ++ AceInstruct-1.5B.i1-Q4_1.gguf | 3 ++ AceInstruct-1.5B.i1-Q4_K_M.gguf | 3 ++ AceInstruct-1.5B.i1-Q4_K_S.gguf | 3 ++ AceInstruct-1.5B.i1-Q5_K_M.gguf | 3 ++ AceInstruct-1.5B.i1-Q5_K_S.gguf | 3 ++ AceInstruct-1.5B.i1-Q6_K.gguf | 3 ++ README.md | 84 ++++++++++++++++++++++++++++++++ imatrix.dat | 3 ++ 27 files changed, 219 insertions(+) create mode 100644 .gitattributes create mode 100644 AceInstruct-1.5B.i1-IQ1_M.gguf create mode 100644 AceInstruct-1.5B.i1-IQ1_S.gguf create mode 100644 AceInstruct-1.5B.i1-IQ2_M.gguf create mode 100644 AceInstruct-1.5B.i1-IQ2_S.gguf create mode 100644 AceInstruct-1.5B.i1-IQ2_XS.gguf create mode 100644 AceInstruct-1.5B.i1-IQ2_XXS.gguf create mode 100644 AceInstruct-1.5B.i1-IQ3_M.gguf create mode 100644 AceInstruct-1.5B.i1-IQ3_S.gguf create mode 100644 AceInstruct-1.5B.i1-IQ3_XS.gguf create mode 100644 AceInstruct-1.5B.i1-IQ3_XXS.gguf create mode 100644 AceInstruct-1.5B.i1-IQ4_NL.gguf create mode 100644 AceInstruct-1.5B.i1-IQ4_XS.gguf create mode 100644 AceInstruct-1.5B.i1-Q2_K.gguf create mode 100644 AceInstruct-1.5B.i1-Q2_K_S.gguf create mode 100644 AceInstruct-1.5B.i1-Q3_K_L.gguf create mode 100644 AceInstruct-1.5B.i1-Q3_K_M.gguf create mode 100644 AceInstruct-1.5B.i1-Q3_K_S.gguf create mode 100644 AceInstruct-1.5B.i1-Q4_0.gguf create mode 100644 AceInstruct-1.5B.i1-Q4_1.gguf create mode 100644 AceInstruct-1.5B.i1-Q4_K_M.gguf create mode 100644 AceInstruct-1.5B.i1-Q4_K_S.gguf create mode 100644 AceInstruct-1.5B.i1-Q5_K_M.gguf create mode 100644 AceInstruct-1.5B.i1-Q5_K_S.gguf create mode 100644 AceInstruct-1.5B.i1-Q6_K.gguf create mode 100644 README.md create mode 100644 imatrix.dat diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..9ecfff4 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +AceInstruct-1.5B.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +AceInstruct-1.5B.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +AceInstruct-1.5B.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +AceInstruct-1.5B.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +AceInstruct-1.5B.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +AceInstruct-1.5B.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +AceInstruct-1.5B.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +AceInstruct-1.5B.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text +AceInstruct-1.5B.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +AceInstruct-1.5B.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +AceInstruct-1.5B.i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +AceInstruct-1.5B.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +AceInstruct-1.5B.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +AceInstruct-1.5B.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +AceInstruct-1.5B.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +AceInstruct-1.5B.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +AceInstruct-1.5B.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +AceInstruct-1.5B.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +AceInstruct-1.5B.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +AceInstruct-1.5B.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +AceInstruct-1.5B.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +AceInstruct-1.5B.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +AceInstruct-1.5B.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +AceInstruct-1.5B.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/AceInstruct-1.5B.i1-IQ1_M.gguf b/AceInstruct-1.5B.i1-IQ1_M.gguf new file mode 100644 index 0000000..4b50539 --- /dev/null +++ b/AceInstruct-1.5B.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8913b0c3d5ba5a7dca5f72cfeabdba080c96a4dca7af190bbd3ea270ad8cb3b6 +size 541035200 diff --git a/AceInstruct-1.5B.i1-IQ1_S.gguf b/AceInstruct-1.5B.i1-IQ1_S.gguf new file mode 100644 index 0000000..64f0891 --- /dev/null +++ b/AceInstruct-1.5B.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:480c30de7ae858a8b0ace62e5cc3cc54091d6eeafb0bdfd417ece5bbe5af6d04 +size 513101504 diff --git a/AceInstruct-1.5B.i1-IQ2_M.gguf b/AceInstruct-1.5B.i1-IQ2_M.gguf new file mode 100644 index 0000000..1d9d77b --- /dev/null +++ b/AceInstruct-1.5B.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cad8804d949011868e853ec053f67bde0475f00974709a0ea5e6a4edf2cef29 +size 701330624 diff --git a/AceInstruct-1.5B.i1-IQ2_S.gguf b/AceInstruct-1.5B.i1-IQ2_S.gguf new file mode 100644 index 0000000..aca92e4 --- /dev/null +++ b/AceInstruct-1.5B.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4a88780d6b82f21532c4d0f677ed796618fb0d318dd18b8031ce574e8a8fa91 +size 664085696 diff --git a/AceInstruct-1.5B.i1-IQ2_XS.gguf b/AceInstruct-1.5B.i1-IQ2_XS.gguf new file mode 100644 index 0000000..56e04da --- /dev/null +++ b/AceInstruct-1.5B.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d77e0813706af4585b0ee41686cfb6b2b69e5cf9d93afb24f412af452d582f0 +size 626900672 diff --git a/AceInstruct-1.5B.i1-IQ2_XXS.gguf b/AceInstruct-1.5B.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..a673357 --- /dev/null +++ b/AceInstruct-1.5B.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d8581cae080175a91c9246b6e7638e6fa0331c420ccfddc723ac02e259e6c56 +size 587591360 diff --git a/AceInstruct-1.5B.i1-IQ3_M.gguf b/AceInstruct-1.5B.i1-IQ3_M.gguf new file mode 100644 index 0000000..a633ae8 --- /dev/null +++ b/AceInstruct-1.5B.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e860de7fac5b43c12d6ea130d427fa8002e1e573d9a4328f08cb9ae195016ad3 +size 876939968 diff --git a/AceInstruct-1.5B.i1-IQ3_S.gguf b/AceInstruct-1.5B.i1-IQ3_S.gguf new file mode 100644 index 0000000..088ca70 --- /dev/null +++ b/AceInstruct-1.5B.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09e546d2e02ca75821ee4ea1c4b6ea33eeddb17f9b5f38c661afce23d94be665 +size 862682816 diff --git a/AceInstruct-1.5B.i1-IQ3_XS.gguf b/AceInstruct-1.5B.i1-IQ3_XS.gguf new file mode 100644 index 0000000..c05d322 --- /dev/null +++ b/AceInstruct-1.5B.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0d4742f6aa9e8f8d9984dfda4b5c62f45bc05d3bc2860c8541bedbb3a4db1b6 +size 831975104 diff --git a/AceInstruct-1.5B.i1-IQ3_XXS.gguf b/AceInstruct-1.5B.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..aa18829 --- /dev/null +++ b/AceInstruct-1.5B.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4bcf56e09a8d25c3db4e3ca34b4b1fff241903ebb66fd6d3e6eb277f5108284 +size 769068224 diff --git a/AceInstruct-1.5B.i1-IQ4_NL.gguf b/AceInstruct-1.5B.i1-IQ4_NL.gguf new file mode 100644 index 0000000..40e122e --- /dev/null +++ b/AceInstruct-1.5B.i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cd15cef31ab9298e00e6cb103b412e296249a5c5bb3e5c64bc0d6c6510eb565 +size 1067602112 diff --git a/AceInstruct-1.5B.i1-IQ4_XS.gguf b/AceInstruct-1.5B.i1-IQ4_XS.gguf new file mode 100644 index 0000000..ab43778 --- /dev/null +++ b/AceInstruct-1.5B.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08c1588c362d6d0a3d1dcb2c072dd81d7ae0bdb25d515c0384fe8aa1b99c6fc3 +size 1019709632 diff --git a/AceInstruct-1.5B.i1-Q2_K.gguf b/AceInstruct-1.5B.i1-Q2_K.gguf new file mode 100644 index 0000000..7b0a57e --- /dev/null +++ b/AceInstruct-1.5B.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d2c1e8cc599c07bc8d07fde0bf80709130c8a6c018e177a9341ae14f064d954 +size 752878784 diff --git a/AceInstruct-1.5B.i1-Q2_K_S.gguf b/AceInstruct-1.5B.i1-Q2_K_S.gguf new file mode 100644 index 0000000..cfa7bef --- /dev/null +++ b/AceInstruct-1.5B.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7faad702bb124fbc1787aa7cae461044be32a49192b781b400eed68d33600cc3 +size 716709056 diff --git a/AceInstruct-1.5B.i1-Q3_K_L.gguf b/AceInstruct-1.5B.i1-Q3_K_L.gguf new file mode 100644 index 0000000..9a039b0 --- /dev/null +++ b/AceInstruct-1.5B.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:394c995dba1e68cc7fad0aef2d768d871aef10f08d7757f1dea019970b3a4735 +size 980438720 diff --git a/AceInstruct-1.5B.i1-Q3_K_M.gguf b/AceInstruct-1.5B.i1-Q3_K_M.gguf new file mode 100644 index 0000000..561ab8f --- /dev/null +++ b/AceInstruct-1.5B.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc85fcd31b6890ac371bf3aeaaa9a6261b05aa217696502b99703e695d86f632 +size 924454592 diff --git a/AceInstruct-1.5B.i1-Q3_K_S.gguf b/AceInstruct-1.5B.i1-Q3_K_S.gguf new file mode 100644 index 0000000..16cb8c3 --- /dev/null +++ b/AceInstruct-1.5B.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:787f87be6a336cf7535abf16ddfa310c7ff7ec642cd137921dc136d0709e185f +size 861220544 diff --git a/AceInstruct-1.5B.i1-Q4_0.gguf b/AceInstruct-1.5B.i1-Q4_0.gguf new file mode 100644 index 0000000..79120a9 --- /dev/null +++ b/AceInstruct-1.5B.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e18939c49ea98891f526bc2532d21106d36a8b5280a543f2b58199033828dc2 +size 1068806336 diff --git a/AceInstruct-1.5B.i1-Q4_1.gguf b/AceInstruct-1.5B.i1-Q4_1.gguf new file mode 100644 index 0000000..6e90519 --- /dev/null +++ b/AceInstruct-1.5B.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d0b91306b2ff98252c2dbac9d5a37cb121106a045331d506b7168d374a1a6ba +size 1162698944 diff --git a/AceInstruct-1.5B.i1-Q4_K_M.gguf b/AceInstruct-1.5B.i1-Q4_K_M.gguf new file mode 100644 index 0000000..04e5eaa --- /dev/null +++ b/AceInstruct-1.5B.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00606f7635ca2dc948826d2678a0f318c44a91bad3d9db589a0206bc0efc60c3 +size 1117319360 diff --git a/AceInstruct-1.5B.i1-Q4_K_S.gguf b/AceInstruct-1.5B.i1-Q4_K_S.gguf new file mode 100644 index 0000000..89f811b --- /dev/null +++ b/AceInstruct-1.5B.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44050e5bf1f1e91f0d9def6a94efa1579a9e0befb39c966e7f5d64e1b09ed109 +size 1071583424 diff --git a/AceInstruct-1.5B.i1-Q5_K_M.gguf b/AceInstruct-1.5B.i1-Q5_K_M.gguf new file mode 100644 index 0000000..21ede06 --- /dev/null +++ b/AceInstruct-1.5B.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5dd34e68329979d2800668065ce4fc4b3610f112d739b0743b63721a3737461 +size 1285492928 diff --git a/AceInstruct-1.5B.i1-Q5_K_S.gguf b/AceInstruct-1.5B.i1-Q5_K_S.gguf new file mode 100644 index 0000000..a3ef40c --- /dev/null +++ b/AceInstruct-1.5B.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c8e333992250175ac693a72a6acf619630d18f43a365daf76dc6c0a325283b4 +size 1259172032 diff --git a/AceInstruct-1.5B.i1-Q6_K.gguf b/AceInstruct-1.5B.i1-Q6_K.gguf new file mode 100644 index 0000000..0ad0857 --- /dev/null +++ b/AceInstruct-1.5B.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9d8a3fb38b51a4355587dcba9281ce354b4c4340051c25c3d808c513d01a558 +size 1464177344 diff --git a/README.md b/README.md new file mode 100644 index 0000000..ad9c2f6 --- /dev/null +++ b/README.md @@ -0,0 +1,84 @@ +--- +base_model: nvidia/AceInstruct-1.5B +language: +- en +library_name: transformers +license: cc-by-nc-4.0 +quantized_by: mradermacher +tags: +- nvidia +- AceInstruct +- code +- math +- general_domain +- instruct_model +- pytorch +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/nvidia/AceInstruct-1.5B + + +static quants are available at https://huggingface.co/mradermacher/AceInstruct-1.5B-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/AceInstruct-1.5B-i1-GGUF/resolve/main/AceInstruct-1.5B.i1-IQ1_S.gguf) | i1-IQ1_S | 0.6 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/AceInstruct-1.5B-i1-GGUF/resolve/main/AceInstruct-1.5B.i1-IQ1_M.gguf) | i1-IQ1_M | 0.6 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/AceInstruct-1.5B-i1-GGUF/resolve/main/AceInstruct-1.5B.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 0.7 | | +| [GGUF](https://huggingface.co/mradermacher/AceInstruct-1.5B-i1-GGUF/resolve/main/AceInstruct-1.5B.i1-IQ2_XS.gguf) | i1-IQ2_XS | 0.7 | | +| [GGUF](https://huggingface.co/mradermacher/AceInstruct-1.5B-i1-GGUF/resolve/main/AceInstruct-1.5B.i1-IQ2_S.gguf) | i1-IQ2_S | 0.8 | | +| [GGUF](https://huggingface.co/mradermacher/AceInstruct-1.5B-i1-GGUF/resolve/main/AceInstruct-1.5B.i1-IQ2_M.gguf) | i1-IQ2_M | 0.8 | | +| [GGUF](https://huggingface.co/mradermacher/AceInstruct-1.5B-i1-GGUF/resolve/main/AceInstruct-1.5B.i1-Q2_K_S.gguf) | i1-Q2_K_S | 0.8 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/AceInstruct-1.5B-i1-GGUF/resolve/main/AceInstruct-1.5B.i1-Q2_K.gguf) | i1-Q2_K | 0.9 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/AceInstruct-1.5B-i1-GGUF/resolve/main/AceInstruct-1.5B.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 0.9 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/AceInstruct-1.5B-i1-GGUF/resolve/main/AceInstruct-1.5B.i1-IQ3_XS.gguf) | i1-IQ3_XS | 0.9 | | +| [GGUF](https://huggingface.co/mradermacher/AceInstruct-1.5B-i1-GGUF/resolve/main/AceInstruct-1.5B.i1-Q3_K_S.gguf) | i1-Q3_K_S | 1.0 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/AceInstruct-1.5B-i1-GGUF/resolve/main/AceInstruct-1.5B.i1-IQ3_S.gguf) | i1-IQ3_S | 1.0 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/AceInstruct-1.5B-i1-GGUF/resolve/main/AceInstruct-1.5B.i1-IQ3_M.gguf) | i1-IQ3_M | 1.0 | | +| [GGUF](https://huggingface.co/mradermacher/AceInstruct-1.5B-i1-GGUF/resolve/main/AceInstruct-1.5B.i1-Q3_K_M.gguf) | i1-Q3_K_M | 1.0 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/AceInstruct-1.5B-i1-GGUF/resolve/main/AceInstruct-1.5B.i1-Q3_K_L.gguf) | i1-Q3_K_L | 1.1 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/AceInstruct-1.5B-i1-GGUF/resolve/main/AceInstruct-1.5B.i1-IQ4_XS.gguf) | i1-IQ4_XS | 1.1 | | +| [GGUF](https://huggingface.co/mradermacher/AceInstruct-1.5B-i1-GGUF/resolve/main/AceInstruct-1.5B.i1-IQ4_NL.gguf) | i1-IQ4_NL | 1.2 | prefer IQ4_XS | +| [GGUF](https://huggingface.co/mradermacher/AceInstruct-1.5B-i1-GGUF/resolve/main/AceInstruct-1.5B.i1-Q4_0.gguf) | i1-Q4_0 | 1.2 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/AceInstruct-1.5B-i1-GGUF/resolve/main/AceInstruct-1.5B.i1-Q4_K_S.gguf) | i1-Q4_K_S | 1.2 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/AceInstruct-1.5B-i1-GGUF/resolve/main/AceInstruct-1.5B.i1-Q4_K_M.gguf) | i1-Q4_K_M | 1.2 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/AceInstruct-1.5B-i1-GGUF/resolve/main/AceInstruct-1.5B.i1-Q4_1.gguf) | i1-Q4_1 | 1.3 | | +| [GGUF](https://huggingface.co/mradermacher/AceInstruct-1.5B-i1-GGUF/resolve/main/AceInstruct-1.5B.i1-Q5_K_S.gguf) | i1-Q5_K_S | 1.4 | | +| [GGUF](https://huggingface.co/mradermacher/AceInstruct-1.5B-i1-GGUF/resolve/main/AceInstruct-1.5B.i1-Q5_K_M.gguf) | i1-Q5_K_M | 1.4 | | +| [GGUF](https://huggingface.co/mradermacher/AceInstruct-1.5B-i1-GGUF/resolve/main/AceInstruct-1.5B.i1-Q6_K.gguf) | i1-Q6_K | 1.6 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..c7925dd --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e92441957098b8d422265c54055eced906fca1e99972cdb02fd453e50d195fbb +size 2042201