From a3241eb7843422b41578fe5b09de38e2a688d0d8 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Sat, 6 Jun 2026 09:31:16 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mradermacher/Hembot-7B-v1-i1-GGUF Source: Original Platform --- .gitattributes | 60 ++++++++++++++++++++++++ Hembot-7B-v1.i1-IQ1_M.gguf | 3 ++ Hembot-7B-v1.i1-IQ1_S.gguf | 3 ++ Hembot-7B-v1.i1-IQ2_M.gguf | 3 ++ Hembot-7B-v1.i1-IQ2_S.gguf | 3 ++ Hembot-7B-v1.i1-IQ2_XS.gguf | 3 ++ Hembot-7B-v1.i1-IQ2_XXS.gguf | 3 ++ Hembot-7B-v1.i1-IQ3_M.gguf | 3 ++ Hembot-7B-v1.i1-IQ3_S.gguf | 3 ++ Hembot-7B-v1.i1-IQ3_XS.gguf | 3 ++ Hembot-7B-v1.i1-IQ3_XXS.gguf | 3 ++ Hembot-7B-v1.i1-IQ4_NL.gguf | 3 ++ Hembot-7B-v1.i1-IQ4_XS.gguf | 3 ++ Hembot-7B-v1.i1-Q2_K.gguf | 3 ++ Hembot-7B-v1.i1-Q2_K_S.gguf | 3 ++ Hembot-7B-v1.i1-Q3_K_L.gguf | 3 ++ Hembot-7B-v1.i1-Q3_K_M.gguf | 3 ++ Hembot-7B-v1.i1-Q3_K_S.gguf | 3 ++ Hembot-7B-v1.i1-Q4_0.gguf | 3 ++ Hembot-7B-v1.i1-Q4_1.gguf | 3 ++ Hembot-7B-v1.i1-Q4_K_M.gguf | 3 ++ Hembot-7B-v1.i1-Q4_K_S.gguf | 3 ++ Hembot-7B-v1.i1-Q5_K_M.gguf | 3 ++ Hembot-7B-v1.i1-Q5_K_S.gguf | 3 ++ Hembot-7B-v1.i1-Q6_K.gguf | 3 ++ Hembot-7B-v1.imatrix.gguf | 3 ++ README.md | 91 ++++++++++++++++++++++++++++++++++++ 27 files changed, 226 insertions(+) create mode 100644 .gitattributes create mode 100644 Hembot-7B-v1.i1-IQ1_M.gguf create mode 100644 Hembot-7B-v1.i1-IQ1_S.gguf create mode 100644 Hembot-7B-v1.i1-IQ2_M.gguf create mode 100644 Hembot-7B-v1.i1-IQ2_S.gguf create mode 100644 Hembot-7B-v1.i1-IQ2_XS.gguf create mode 100644 Hembot-7B-v1.i1-IQ2_XXS.gguf create mode 100644 Hembot-7B-v1.i1-IQ3_M.gguf create mode 100644 Hembot-7B-v1.i1-IQ3_S.gguf create mode 100644 Hembot-7B-v1.i1-IQ3_XS.gguf create mode 100644 Hembot-7B-v1.i1-IQ3_XXS.gguf create mode 100644 
Hembot-7B-v1.i1-IQ4_NL.gguf create mode 100644 Hembot-7B-v1.i1-IQ4_XS.gguf create mode 100644 Hembot-7B-v1.i1-Q2_K.gguf create mode 100644 Hembot-7B-v1.i1-Q2_K_S.gguf create mode 100644 Hembot-7B-v1.i1-Q3_K_L.gguf create mode 100644 Hembot-7B-v1.i1-Q3_K_M.gguf create mode 100644 Hembot-7B-v1.i1-Q3_K_S.gguf create mode 100644 Hembot-7B-v1.i1-Q4_0.gguf create mode 100644 Hembot-7B-v1.i1-Q4_1.gguf create mode 100644 Hembot-7B-v1.i1-Q4_K_M.gguf create mode 100644 Hembot-7B-v1.i1-Q4_K_S.gguf create mode 100644 Hembot-7B-v1.i1-Q5_K_M.gguf create mode 100644 Hembot-7B-v1.i1-Q5_K_S.gguf create mode 100644 Hembot-7B-v1.i1-Q6_K.gguf create mode 100644 Hembot-7B-v1.imatrix.gguf create mode 100644 README.md diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..97e8e70 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs 
-text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +Hembot-7B-v1.imatrix.gguf filter=lfs diff=lfs merge=lfs -text +Hembot-7B-v1.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +Hembot-7B-v1.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +Hembot-7B-v1.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Hembot-7B-v1.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Hembot-7B-v1.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Hembot-7B-v1.i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +Hembot-7B-v1.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Hembot-7B-v1.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +Hembot-7B-v1.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +Hembot-7B-v1.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +Hembot-7B-v1.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Hembot-7B-v1.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +Hembot-7B-v1.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Hembot-7B-v1.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Hembot-7B-v1.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Hembot-7B-v1.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +Hembot-7B-v1.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Hembot-7B-v1.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +Hembot-7B-v1.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +Hembot-7B-v1.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Hembot-7B-v1.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +Hembot-7B-v1.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +Hembot-7B-v1.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +Hembot-7B-v1.i1-IQ3_S.gguf filter=lfs diff=lfs 
merge=lfs -text diff --git a/Hembot-7B-v1.i1-IQ1_M.gguf b/Hembot-7B-v1.i1-IQ1_M.gguf new file mode 100644 index 0000000..6d3dfa2 --- /dev/null +++ b/Hembot-7B-v1.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a80a4958f86d386944e11c36b5f35f280e482107695833cf2ceac7bce53002be +size 2042197248 diff --git a/Hembot-7B-v1.i1-IQ1_S.gguf b/Hembot-7B-v1.i1-IQ1_S.gguf new file mode 100644 index 0000000..6e2cd5c --- /dev/null +++ b/Hembot-7B-v1.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70360d76c955b885be8e1bbb1737152053b93d4cdf329dbe7a810b6e70d9754f +size 1903668480 diff --git a/Hembot-7B-v1.i1-IQ2_M.gguf b/Hembot-7B-v1.i1-IQ2_M.gguf new file mode 100644 index 0000000..eeb067b --- /dev/null +++ b/Hembot-7B-v1.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50e260e7b901b07b6f99709a2de319ed2a06b0978cb41bafb5ccb4e8e5e81da1 +size 2780343552 diff --git a/Hembot-7B-v1.i1-IQ2_S.gguf b/Hembot-7B-v1.i1-IQ2_S.gguf new file mode 100644 index 0000000..5ac5073 --- /dev/null +++ b/Hembot-7B-v1.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b611c4525f372cf07362f2c2a4bc03ca459579c1cbdd2252ac5cb731c4d8684 +size 2595638528 diff --git a/Hembot-7B-v1.i1-IQ2_XS.gguf b/Hembot-7B-v1.i1-IQ2_XS.gguf new file mode 100644 index 0000000..9922135 --- /dev/null +++ b/Hembot-7B-v1.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6a6793b2fda8e5aa57fee55a6cb56006f15d11dfd77d902b27a373495c7b621 +size 2469022976 diff --git a/Hembot-7B-v1.i1-IQ2_XXS.gguf b/Hembot-7B-v1.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..a4fa8e2 --- /dev/null +++ b/Hembot-7B-v1.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a51b4ff49d6908b05cda4bcb0e3a42031faf64f35dd2ecf90a777f9d73a8e2f +size 2273078528 diff --git a/Hembot-7B-v1.i1-IQ3_M.gguf b/Hembot-7B-v1.i1-IQ3_M.gguf new file mode 100644 
index 0000000..0b30546 --- /dev/null +++ b/Hembot-7B-v1.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf2751fe68d8c0f0d803f4718ef20300c20b99c98aaa85eec5c3e0517b7e5b3b +size 3574013184 diff --git a/Hembot-7B-v1.i1-IQ3_S.gguf b/Hembot-7B-v1.i1-IQ3_S.gguf new file mode 100644 index 0000000..ba38ddb --- /dev/null +++ b/Hembot-7B-v1.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61be4354079fb469f24c7ad81e424de1d4d09e878804d2ec2fb2cf679d893f39 +size 3499193600 diff --git a/Hembot-7B-v1.i1-IQ3_XS.gguf b/Hembot-7B-v1.i1-IQ3_XS.gguf new file mode 100644 index 0000000..3986f78 --- /dev/null +++ b/Hembot-7B-v1.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46c34e8d18df7fdb9429c11283c95fbc31e824ac571167d63c966859404b0ba6 +size 3346257152 diff --git a/Hembot-7B-v1.i1-IQ3_XXS.gguf b/Hembot-7B-v1.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..2ce23d2 --- /dev/null +++ b/Hembot-7B-v1.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac3810ba626a03a7cf651873d12a97308f65269a16c138c99650ddddb1ab04c0 +size 3114515712 diff --git a/Hembot-7B-v1.i1-IQ4_NL.gguf b/Hembot-7B-v1.i1-IQ4_NL.gguf new file mode 100644 index 0000000..683862f --- /dev/null +++ b/Hembot-7B-v1.i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21b851193a7dee6706b3a1804af0ebfc38e82e2a46b1fed5b0f49f156cb11a95 +size 4437814528 diff --git a/Hembot-7B-v1.i1-IQ4_XS.gguf b/Hembot-7B-v1.i1-IQ4_XS.gguf new file mode 100644 index 0000000..8d88684 --- /dev/null +++ b/Hembot-7B-v1.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36b9db4afa445092b8d83b8fad6e2ae2f56904987ebd1b90daa3db2d7f61b683 +size 4218473728 diff --git a/Hembot-7B-v1.i1-Q2_K.gguf b/Hembot-7B-v1.i1-Q2_K.gguf new file mode 100644 index 0000000..726867d --- /dev/null +++ b/Hembot-7B-v1.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:aaab1f60b344865bb3badf73e9a645eb24ed3e6566e1d7ca521b07ea0df9c868 +size 3015941376 diff --git a/Hembot-7B-v1.i1-Q2_K_S.gguf b/Hembot-7B-v1.i1-Q2_K_S.gguf new file mode 100644 index 0000000..9e5c879 --- /dev/null +++ b/Hembot-7B-v1.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bfb27f8d838e1e8e5d30287d6e5c54dca784662ac35eaa5516dcd3f90d3b8b8 +size 2834074880 diff --git a/Hembot-7B-v1.i1-Q3_K_L.gguf b/Hembot-7B-v1.i1-Q3_K_L.gguf new file mode 100644 index 0000000..5c6703e --- /dev/null +++ b/Hembot-7B-v1.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a26b62883b29f2db803a320c8e2776a51d13fabaef0f115db443dc0a6c9519c9 +size 4088460544 diff --git a/Hembot-7B-v1.i1-Q3_K_M.gguf b/Hembot-7B-v1.i1-Q3_K_M.gguf new file mode 100644 index 0000000..043e246 --- /dev/null +++ b/Hembot-7B-v1.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3807ebedebfa8e394f1bb1ac519dfe67dcbebc64229b5c34405056dcc274718e +size 3808392448 diff --git a/Hembot-7B-v1.i1-Q3_K_S.gguf b/Hembot-7B-v1.i1-Q3_K_S.gguf new file mode 100644 index 0000000..c370279 --- /dev/null +++ b/Hembot-7B-v1.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb3c3de6d45cd697e39afba3d94b742012fede1cfdb56a5e1aca188a5cc0d3ad +size 3492369664 diff --git a/Hembot-7B-v1.i1-Q4_0.gguf b/Hembot-7B-v1.i1-Q4_0.gguf new file mode 100644 index 0000000..92f76cc --- /dev/null +++ b/Hembot-7B-v1.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38f8a19303bbab9b4ed3b55fde4d3046deb5af57100d668558ebd672aa205d35 +size 4444122368 diff --git a/Hembot-7B-v1.i1-Q4_1.gguf b/Hembot-7B-v1.i1-Q4_1.gguf new file mode 100644 index 0000000..2a86bc7 --- /dev/null +++ b/Hembot-7B-v1.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:7ecec4fc6dc54a471b45760b8bab3f2b0c27b643f6dc86cd77075d5302437c60 +size 4873284864 diff --git a/Hembot-7B-v1.i1-Q4_K_M.gguf b/Hembot-7B-v1.i1-Q4_K_M.gguf new file mode 100644 index 0000000..752cba6 --- /dev/null +++ b/Hembot-7B-v1.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16ac1e2e45fef62249ce8906449f287399a1f4ed5e4eaa60603c54ef1e40b898 +size 4683074816 diff --git a/Hembot-7B-v1.i1-Q4_K_S.gguf b/Hembot-7B-v1.i1-Q4_K_S.gguf new file mode 100644 index 0000000..07a095a --- /dev/null +++ b/Hembot-7B-v1.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c446d4c8ea8a238ef994c8b81b55b56524dd91b010c018133066ccabfd0d4dce +size 4457770240 diff --git a/Hembot-7B-v1.i1-Q5_K_M.gguf b/Hembot-7B-v1.i1-Q5_K_M.gguf new file mode 100644 index 0000000..6cec655 --- /dev/null +++ b/Hembot-7B-v1.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcc3172d7da05d62ed7e0f6ac836e0d6e1d10827dd78d19710e96720039cfb3d +size 5444832512 diff --git a/Hembot-7B-v1.i1-Q5_K_S.gguf b/Hembot-7B-v1.i1-Q5_K_S.gguf new file mode 100644 index 0000000..1c795c0 --- /dev/null +++ b/Hembot-7B-v1.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c6ba9c17d026d35b93b3e1b19a6968cab5f62971b603f0508e089d07029bd05 +size 5315177728 diff --git a/Hembot-7B-v1.i1-Q6_K.gguf b/Hembot-7B-v1.i1-Q6_K.gguf new file mode 100644 index 0000000..8d9fa47 --- /dev/null +++ b/Hembot-7B-v1.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d24f4230dac605b87375e3adb50a8bbedc32bf724392e1cbce7b22a13b304d45 +size 6254200064 diff --git a/Hembot-7B-v1.imatrix.gguf b/Hembot-7B-v1.imatrix.gguf new file mode 100644 index 0000000..8462eb4 --- /dev/null +++ b/Hembot-7B-v1.imatrix.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e88adc752d40b32b46d66f8d505fbc5625db8f71b5c93cf833aa09b8fae4dd8a +size 4560352 diff --git a/README.md 
b/README.md new file mode 100644 index 0000000..f224639 --- /dev/null +++ b/README.md @@ -0,0 +1,91 @@ +--- +base_model: hemlang/Hembot-7B-v1 +datasets: +- hemlang/Hembot-DPO +language: +- en +library_name: transformers +mradermacher: + readme_rev: 1 +quantized_by: mradermacher +tags: +- merlina +- grimoire +- text-generation +- orpo +--- +## About + + + + + + + + + +weighted/imatrix quants of https://huggingface.co/hemlang/Hembot-7B-v1 + + + +***For a convenient overview and download list, visit our [model page for this model](https://hf.tst.eu/model#Hembot-7B-v1-i1-GGUF).*** + +static quants are available at https://huggingface.co/mradermacher/Hembot-7B-v1-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/Hembot-7B-v1-i1-GGUF/resolve/main/Hembot-7B-v1.imatrix.gguf) | imatrix | 0.1 | imatrix file (for creating your own quants) | +| [GGUF](https://huggingface.co/mradermacher/Hembot-7B-v1-i1-GGUF/resolve/main/Hembot-7B-v1.i1-IQ1_S.gguf) | i1-IQ1_S | 2.0 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/Hembot-7B-v1-i1-GGUF/resolve/main/Hembot-7B-v1.i1-IQ1_M.gguf) | i1-IQ1_M | 2.1 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/Hembot-7B-v1-i1-GGUF/resolve/main/Hembot-7B-v1.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 2.4 | | +| [GGUF](https://huggingface.co/mradermacher/Hembot-7B-v1-i1-GGUF/resolve/main/Hembot-7B-v1.i1-IQ2_XS.gguf) | i1-IQ2_XS | 2.6 | | +| [GGUF](https://huggingface.co/mradermacher/Hembot-7B-v1-i1-GGUF/resolve/main/Hembot-7B-v1.i1-IQ2_S.gguf) | i1-IQ2_S | 2.7 | | +| 
[GGUF](https://huggingface.co/mradermacher/Hembot-7B-v1-i1-GGUF/resolve/main/Hembot-7B-v1.i1-IQ2_M.gguf) | i1-IQ2_M | 2.9 | | +| [GGUF](https://huggingface.co/mradermacher/Hembot-7B-v1-i1-GGUF/resolve/main/Hembot-7B-v1.i1-Q2_K_S.gguf) | i1-Q2_K_S | 2.9 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/Hembot-7B-v1-i1-GGUF/resolve/main/Hembot-7B-v1.i1-Q2_K.gguf) | i1-Q2_K | 3.1 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/Hembot-7B-v1-i1-GGUF/resolve/main/Hembot-7B-v1.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 3.2 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/Hembot-7B-v1-i1-GGUF/resolve/main/Hembot-7B-v1.i1-IQ3_XS.gguf) | i1-IQ3_XS | 3.4 | | +| [GGUF](https://huggingface.co/mradermacher/Hembot-7B-v1-i1-GGUF/resolve/main/Hembot-7B-v1.i1-Q3_K_S.gguf) | i1-Q3_K_S | 3.6 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/Hembot-7B-v1-i1-GGUF/resolve/main/Hembot-7B-v1.i1-IQ3_S.gguf) | i1-IQ3_S | 3.6 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/Hembot-7B-v1-i1-GGUF/resolve/main/Hembot-7B-v1.i1-IQ3_M.gguf) | i1-IQ3_M | 3.7 | | +| [GGUF](https://huggingface.co/mradermacher/Hembot-7B-v1-i1-GGUF/resolve/main/Hembot-7B-v1.i1-Q3_K_M.gguf) | i1-Q3_K_M | 3.9 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/Hembot-7B-v1-i1-GGUF/resolve/main/Hembot-7B-v1.i1-Q3_K_L.gguf) | i1-Q3_K_L | 4.2 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/Hembot-7B-v1-i1-GGUF/resolve/main/Hembot-7B-v1.i1-IQ4_XS.gguf) | i1-IQ4_XS | 4.3 | | +| [GGUF](https://huggingface.co/mradermacher/Hembot-7B-v1-i1-GGUF/resolve/main/Hembot-7B-v1.i1-IQ4_NL.gguf) | i1-IQ4_NL | 4.5 | prefer IQ4_XS | +| [GGUF](https://huggingface.co/mradermacher/Hembot-7B-v1-i1-GGUF/resolve/main/Hembot-7B-v1.i1-Q4_0.gguf) | i1-Q4_0 | 4.5 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/Hembot-7B-v1-i1-GGUF/resolve/main/Hembot-7B-v1.i1-Q4_K_S.gguf) | i1-Q4_K_S | 4.6 | optimal 
size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/Hembot-7B-v1-i1-GGUF/resolve/main/Hembot-7B-v1.i1-Q4_K_M.gguf) | i1-Q4_K_M | 4.8 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/Hembot-7B-v1-i1-GGUF/resolve/main/Hembot-7B-v1.i1-Q4_1.gguf) | i1-Q4_1 | 5.0 | | +| [GGUF](https://huggingface.co/mradermacher/Hembot-7B-v1-i1-GGUF/resolve/main/Hembot-7B-v1.i1-Q5_K_S.gguf) | i1-Q5_K_S | 5.4 | | +| [GGUF](https://huggingface.co/mradermacher/Hembot-7B-v1-i1-GGUF/resolve/main/Hembot-7B-v1.i1-Q5_K_M.gguf) | i1-Q5_K_M | 5.5 | | +| [GGUF](https://huggingface.co/mradermacher/Hembot-7B-v1-i1-GGUF/resolve/main/Hembot-7B-v1.i1-Q6_K.gguf) | i1-Q6_K | 6.4 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for answers to +questions you might have, or to request that another model be quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + +