From b9ec4cbb3dea91637de0404e0aba3cd0681e9d8f Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Sun, 7 Jun 2026 04:08:24 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mradermacher/MN-Violet-Lotus-12B-i1-GGUF Source: Original Platform --- .gitattributes | 60 +++++++++++++++++++ MN-Violet-Lotus-12B.i1-IQ1_M.gguf | 3 + MN-Violet-Lotus-12B.i1-IQ1_S.gguf | 3 + MN-Violet-Lotus-12B.i1-IQ2_M.gguf | 3 + MN-Violet-Lotus-12B.i1-IQ2_S.gguf | 3 + MN-Violet-Lotus-12B.i1-IQ2_XS.gguf | 3 + MN-Violet-Lotus-12B.i1-IQ2_XXS.gguf | 3 + MN-Violet-Lotus-12B.i1-IQ3_M.gguf | 3 + MN-Violet-Lotus-12B.i1-IQ3_S.gguf | 3 + MN-Violet-Lotus-12B.i1-IQ3_XS.gguf | 3 + MN-Violet-Lotus-12B.i1-IQ3_XXS.gguf | 3 + MN-Violet-Lotus-12B.i1-IQ4_XS.gguf | 3 + MN-Violet-Lotus-12B.i1-Q2_K.gguf | 3 + MN-Violet-Lotus-12B.i1-Q3_K_L.gguf | 3 + MN-Violet-Lotus-12B.i1-Q3_K_M.gguf | 3 + MN-Violet-Lotus-12B.i1-Q3_K_S.gguf | 3 + MN-Violet-Lotus-12B.i1-Q4_0.gguf | 3 + MN-Violet-Lotus-12B.i1-Q4_0_4_4.gguf | 3 + MN-Violet-Lotus-12B.i1-Q4_0_4_8.gguf | 3 + MN-Violet-Lotus-12B.i1-Q4_0_8_8.gguf | 3 + MN-Violet-Lotus-12B.i1-Q4_K_M.gguf | 3 + MN-Violet-Lotus-12B.i1-Q4_K_S.gguf | 3 + MN-Violet-Lotus-12B.i1-Q5_K_M.gguf | 3 + MN-Violet-Lotus-12B.i1-Q5_K_S.gguf | 3 + MN-Violet-Lotus-12B.i1-Q6_K.gguf | 3 + README.md | 87 ++++++++++++++++++++++++++++ imatrix.dat | 3 + 27 files changed, 222 insertions(+) create mode 100644 .gitattributes create mode 100644 MN-Violet-Lotus-12B.i1-IQ1_M.gguf create mode 100644 MN-Violet-Lotus-12B.i1-IQ1_S.gguf create mode 100644 MN-Violet-Lotus-12B.i1-IQ2_M.gguf create mode 100644 MN-Violet-Lotus-12B.i1-IQ2_S.gguf create mode 100644 MN-Violet-Lotus-12B.i1-IQ2_XS.gguf create mode 100644 MN-Violet-Lotus-12B.i1-IQ2_XXS.gguf create mode 100644 
MN-Violet-Lotus-12B.i1-IQ3_M.gguf create mode 100644 MN-Violet-Lotus-12B.i1-IQ3_S.gguf create mode 100644 MN-Violet-Lotus-12B.i1-IQ3_XS.gguf create mode 100644 MN-Violet-Lotus-12B.i1-IQ3_XXS.gguf create mode 100644 MN-Violet-Lotus-12B.i1-IQ4_XS.gguf create mode 100644 MN-Violet-Lotus-12B.i1-Q2_K.gguf create mode 100644 MN-Violet-Lotus-12B.i1-Q3_K_L.gguf create mode 100644 MN-Violet-Lotus-12B.i1-Q3_K_M.gguf create mode 100644 MN-Violet-Lotus-12B.i1-Q3_K_S.gguf create mode 100644 MN-Violet-Lotus-12B.i1-Q4_0.gguf create mode 100644 MN-Violet-Lotus-12B.i1-Q4_0_4_4.gguf create mode 100644 MN-Violet-Lotus-12B.i1-Q4_0_4_8.gguf create mode 100644 MN-Violet-Lotus-12B.i1-Q4_0_8_8.gguf create mode 100644 MN-Violet-Lotus-12B.i1-Q4_K_M.gguf create mode 100644 MN-Violet-Lotus-12B.i1-Q4_K_S.gguf create mode 100644 MN-Violet-Lotus-12B.i1-Q5_K_M.gguf create mode 100644 MN-Violet-Lotus-12B.i1-Q5_K_S.gguf create mode 100644 MN-Violet-Lotus-12B.i1-Q6_K.gguf create mode 100644 README.md create mode 100644 imatrix.dat diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..8484bad --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle 
filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +MN-Violet-Lotus-12B.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +MN-Violet-Lotus-12B.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +MN-Violet-Lotus-12B.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +MN-Violet-Lotus-12B.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +MN-Violet-Lotus-12B.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +MN-Violet-Lotus-12B.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +MN-Violet-Lotus-12B.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +MN-Violet-Lotus-12B.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +MN-Violet-Lotus-12B.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +MN-Violet-Lotus-12B.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +MN-Violet-Lotus-12B.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +MN-Violet-Lotus-12B.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +MN-Violet-Lotus-12B.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +MN-Violet-Lotus-12B.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +MN-Violet-Lotus-12B.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +MN-Violet-Lotus-12B.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +MN-Violet-Lotus-12B.i1-Q4_0_4_4.gguf filter=lfs diff=lfs merge=lfs -text 
+MN-Violet-Lotus-12B.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +MN-Violet-Lotus-12B.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +MN-Violet-Lotus-12B.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +MN-Violet-Lotus-12B.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +MN-Violet-Lotus-12B.i1-Q4_0_4_8.gguf filter=lfs diff=lfs merge=lfs -text +MN-Violet-Lotus-12B.i1-Q4_0_8_8.gguf filter=lfs diff=lfs merge=lfs -text +MN-Violet-Lotus-12B.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/MN-Violet-Lotus-12B.i1-IQ1_M.gguf b/MN-Violet-Lotus-12B.i1-IQ1_M.gguf new file mode 100644 index 0000000..750997b --- /dev/null +++ b/MN-Violet-Lotus-12B.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43737b64baaff4f79f5b9bcbb63730619338324f084a97543a867b4a9ae04909 +size 3221629504 diff --git a/MN-Violet-Lotus-12B.i1-IQ1_S.gguf b/MN-Violet-Lotus-12B.i1-IQ1_S.gguf new file mode 100644 index 0000000..54e61f0 --- /dev/null +++ b/MN-Violet-Lotus-12B.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab37abcbbd8d4ccccdf52287f30a5a1f23452972ac1d842b5f7b8b5b58bc9f7a +size 2999216704 diff --git a/MN-Violet-Lotus-12B.i1-IQ2_M.gguf b/MN-Violet-Lotus-12B.i1-IQ2_M.gguf new file mode 100644 index 0000000..09473fa --- /dev/null +++ b/MN-Violet-Lotus-12B.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03b664b71334d718446d549aa3eb4a0de165aef6428555545808ac1606f0d11d +size 4435028544 diff --git a/MN-Violet-Lotus-12B.i1-IQ2_S.gguf b/MN-Violet-Lotus-12B.i1-IQ2_S.gguf new file mode 100644 index 0000000..4daaf38 --- /dev/null +++ b/MN-Violet-Lotus-12B.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db11e90b3587ecfad5a9e91495aed1cde98fc973db6214356e95494411428b86 +size 4138478144 diff --git a/MN-Violet-Lotus-12B.i1-IQ2_XS.gguf b/MN-Violet-Lotus-12B.i1-IQ2_XS.gguf new file mode 100644 index 0000000..cee049e --- /dev/null +++ 
b/MN-Violet-Lotus-12B.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:363ccf47acda75b495ff5af6b69fc78fb4fced6ab17c7ccc9c8fb6b3fe66e24a +size 3915082304 diff --git a/MN-Violet-Lotus-12B.i1-IQ2_XXS.gguf b/MN-Violet-Lotus-12B.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..ab3e4ff --- /dev/null +++ b/MN-Violet-Lotus-12B.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e7ae5475e4f159fd4761c904bffe4cd6b8a84a8f68d2c608c416ca2741ad7c4 +size 3592317504 diff --git a/MN-Violet-Lotus-12B.i1-IQ3_M.gguf b/MN-Violet-Lotus-12B.i1-IQ3_M.gguf new file mode 100644 index 0000000..9c1828a --- /dev/null +++ b/MN-Violet-Lotus-12B.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:703cbf8ab3e4639bb4c987c613aba8137f78cb3b8cd67a2fe7564422876b7679 +size 5722237504 diff --git a/MN-Violet-Lotus-12B.i1-IQ3_S.gguf b/MN-Violet-Lotus-12B.i1-IQ3_S.gguf new file mode 100644 index 0000000..a69fc7b --- /dev/null +++ b/MN-Violet-Lotus-12B.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a10c12f8991679cadc861a67147de776e224b596d3c10d20d623a67e16f86cbb +size 5562083904 diff --git a/MN-Violet-Lotus-12B.i1-IQ3_XS.gguf b/MN-Violet-Lotus-12B.i1-IQ3_XS.gguf new file mode 100644 index 0000000..e490dd6 --- /dev/null +++ b/MN-Violet-Lotus-12B.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d923b83741946d031ac6b5222dc86b6f75bcf60587204cbf2baf780f7694601 +size 5306493504 diff --git a/MN-Violet-Lotus-12B.i1-IQ3_XXS.gguf b/MN-Violet-Lotus-12B.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..c2e33ab --- /dev/null +++ b/MN-Violet-Lotus-12B.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a7365d246090119ca12c1a229296621acd1dfe25bcfaf64709d9bf94d8a8cb8 +size 4945390144 diff --git a/MN-Violet-Lotus-12B.i1-IQ4_XS.gguf b/MN-Violet-Lotus-12B.i1-IQ4_XS.gguf new file mode 100644 index 
0000000..24196ce --- /dev/null +++ b/MN-Violet-Lotus-12B.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:effd929bdc5200e4b42c46b8d73d61c6d63fe8a9f2ad6af0cd4cb1d79a279767 +size 6742714944 diff --git a/MN-Violet-Lotus-12B.i1-Q2_K.gguf b/MN-Violet-Lotus-12B.i1-Q2_K.gguf new file mode 100644 index 0000000..abab257 --- /dev/null +++ b/MN-Violet-Lotus-12B.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63d78fb61862eb061cc81f4d2782abc54d8ff0212a4ecce09d8e3d9513b3c124 +size 4791052864 diff --git a/MN-Violet-Lotus-12B.i1-Q3_K_L.gguf b/MN-Violet-Lotus-12B.i1-Q3_K_L.gguf new file mode 100644 index 0000000..d13b9db --- /dev/null +++ b/MN-Violet-Lotus-12B.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:991a95060c9a2b78a2ac9dc535f496baaf9e04f95ce562f388a83164bd1da6aa +size 6561507904 diff --git a/MN-Violet-Lotus-12B.i1-Q3_K_M.gguf b/MN-Violet-Lotus-12B.i1-Q3_K_M.gguf new file mode 100644 index 0000000..764575f --- /dev/null +++ b/MN-Violet-Lotus-12B.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aa02bc539050ba26f95e2be32b079fd685769fcdfcd9e6c83e9058894f27727 +size 6083095104 diff --git a/MN-Violet-Lotus-12B.i1-Q3_K_S.gguf b/MN-Violet-Lotus-12B.i1-Q3_K_S.gguf new file mode 100644 index 0000000..12c458d --- /dev/null +++ b/MN-Violet-Lotus-12B.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37c6d5a44b4e370b21de357228588e569ed712efa49faa62ee860459f3e75784 +size 5534231104 diff --git a/MN-Violet-Lotus-12B.i1-Q4_0.gguf b/MN-Violet-Lotus-12B.i1-Q4_0.gguf new file mode 100644 index 0000000..c189340 --- /dev/null +++ b/MN-Violet-Lotus-12B.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48ff432e95b084ccb320963f5426ac18ba184fb904c3f1843dac2e875ce347b6 +size 7094643264 diff --git a/MN-Violet-Lotus-12B.i1-Q4_0_4_4.gguf b/MN-Violet-Lotus-12B.i1-Q4_0_4_4.gguf new 
file mode 100644 index 0000000..6d3e6f2 --- /dev/null +++ b/MN-Violet-Lotus-12B.i1-Q4_0_4_4.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b2f84db101199d64690f9279ad2b4f456fdd7f0f2bfc98fcf67c7ff6b23273c +size 7071705664 diff --git a/MN-Violet-Lotus-12B.i1-Q4_0_4_8.gguf b/MN-Violet-Lotus-12B.i1-Q4_0_4_8.gguf new file mode 100644 index 0000000..8745f98 --- /dev/null +++ b/MN-Violet-Lotus-12B.i1-Q4_0_4_8.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7616ebf8c3a5c21f2ec927fbe883c0f3e47977e0a7fdafaa219c7d4172a2bfc +size 7071705664 diff --git a/MN-Violet-Lotus-12B.i1-Q4_0_8_8.gguf b/MN-Violet-Lotus-12B.i1-Q4_0_8_8.gguf new file mode 100644 index 0000000..d0975b9 --- /dev/null +++ b/MN-Violet-Lotus-12B.i1-Q4_0_8_8.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf85e30f7ec58781068e42b631ca5190572540459ac42845474eaa9c358f3b59 +size 7071705664 diff --git a/MN-Violet-Lotus-12B.i1-Q4_K_M.gguf b/MN-Violet-Lotus-12B.i1-Q4_K_M.gguf new file mode 100644 index 0000000..e76f8b1 --- /dev/null +++ b/MN-Violet-Lotus-12B.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e75817fdcb32cec47f7845a907090b268e24a4a0ab3f607135a6c0f042241c3e +size 7477209664 diff --git a/MN-Violet-Lotus-12B.i1-Q4_K_S.gguf b/MN-Violet-Lotus-12B.i1-Q4_K_S.gguf new file mode 100644 index 0000000..126c3d1 --- /dev/null +++ b/MN-Violet-Lotus-12B.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf7e644620a171b33743111f6cdb34817f6945de001632a57fd6caf9fa7d767e +size 7120202304 diff --git a/MN-Violet-Lotus-12B.i1-Q5_K_M.gguf b/MN-Violet-Lotus-12B.i1-Q5_K_M.gguf new file mode 100644 index 0000000..ea7a584 --- /dev/null +++ b/MN-Violet-Lotus-12B.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abc93e2413d8f5841fd8335ceb44c01c51c05c9b59ecfad9590567d50829d8ee +size 8727636544 diff --git 
a/MN-Violet-Lotus-12B.i1-Q5_K_S.gguf b/MN-Violet-Lotus-12B.i1-Q5_K_S.gguf new file mode 100644 index 0000000..83b151a --- /dev/null +++ b/MN-Violet-Lotus-12B.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5843564d672ff675769acf1f95aef17ff1c85e517653ed03b18cea9a23759ad +size 8518740544 diff --git a/MN-Violet-Lotus-12B.i1-Q6_K.gguf b/MN-Violet-Lotus-12B.i1-Q6_K.gguf new file mode 100644 index 0000000..91e868b --- /dev/null +++ b/MN-Violet-Lotus-12B.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5abbd259c3039f2ab37030f49f9dad995007e2ecb1aa9f01d3241ef9b7124227 +size 10056215104 diff --git a/README.md b/README.md new file mode 100644 index 0000000..97b212f --- /dev/null +++ b/README.md @@ -0,0 +1,87 @@ +--- +base_model: FallenMerick/MN-Violet-Lotus-12B +language: +- en +library_name: transformers +license: cc-by-4.0 +quantized_by: mradermacher +tags: +- storywriting +- text adventure +- creative +- story +- writing +- fiction +- roleplaying +- rp +- mergekit +- merge +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/FallenMerick/MN-Violet-Lotus-12B + + +static quants are available at https://huggingface.co/mradermacher/MN-Violet-Lotus-12B-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. 
IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/MN-Violet-Lotus-12B-i1-GGUF/resolve/main/MN-Violet-Lotus-12B.i1-IQ1_S.gguf) | i1-IQ1_S | 3.1 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/MN-Violet-Lotus-12B-i1-GGUF/resolve/main/MN-Violet-Lotus-12B.i1-IQ1_M.gguf) | i1-IQ1_M | 3.3 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/MN-Violet-Lotus-12B-i1-GGUF/resolve/main/MN-Violet-Lotus-12B.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 3.7 | | +| [GGUF](https://huggingface.co/mradermacher/MN-Violet-Lotus-12B-i1-GGUF/resolve/main/MN-Violet-Lotus-12B.i1-IQ2_XS.gguf) | i1-IQ2_XS | 4.0 | | +| [GGUF](https://huggingface.co/mradermacher/MN-Violet-Lotus-12B-i1-GGUF/resolve/main/MN-Violet-Lotus-12B.i1-IQ2_S.gguf) | i1-IQ2_S | 4.2 | | +| [GGUF](https://huggingface.co/mradermacher/MN-Violet-Lotus-12B-i1-GGUF/resolve/main/MN-Violet-Lotus-12B.i1-IQ2_M.gguf) | i1-IQ2_M | 4.5 | | +| [GGUF](https://huggingface.co/mradermacher/MN-Violet-Lotus-12B-i1-GGUF/resolve/main/MN-Violet-Lotus-12B.i1-Q2_K.gguf) | i1-Q2_K | 4.9 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/MN-Violet-Lotus-12B-i1-GGUF/resolve/main/MN-Violet-Lotus-12B.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 5.0 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/MN-Violet-Lotus-12B-i1-GGUF/resolve/main/MN-Violet-Lotus-12B.i1-IQ3_XS.gguf) | i1-IQ3_XS | 5.4 | | +| [GGUF](https://huggingface.co/mradermacher/MN-Violet-Lotus-12B-i1-GGUF/resolve/main/MN-Violet-Lotus-12B.i1-Q3_K_S.gguf) | i1-Q3_K_S | 5.6 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/MN-Violet-Lotus-12B-i1-GGUF/resolve/main/MN-Violet-Lotus-12B.i1-IQ3_S.gguf) | i1-IQ3_S | 5.7 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/MN-Violet-Lotus-12B-i1-GGUF/resolve/main/MN-Violet-Lotus-12B.i1-IQ3_M.gguf) | i1-IQ3_M | 5.8 | | +| 
[GGUF](https://huggingface.co/mradermacher/MN-Violet-Lotus-12B-i1-GGUF/resolve/main/MN-Violet-Lotus-12B.i1-Q3_K_M.gguf) | i1-Q3_K_M | 6.2 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/MN-Violet-Lotus-12B-i1-GGUF/resolve/main/MN-Violet-Lotus-12B.i1-Q3_K_L.gguf) | i1-Q3_K_L | 6.7 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/MN-Violet-Lotus-12B-i1-GGUF/resolve/main/MN-Violet-Lotus-12B.i1-IQ4_XS.gguf) | i1-IQ4_XS | 6.8 | | +| [GGUF](https://huggingface.co/mradermacher/MN-Violet-Lotus-12B-i1-GGUF/resolve/main/MN-Violet-Lotus-12B.i1-Q4_0_4_4.gguf) | i1-Q4_0_4_4 | 7.2 | fast on arm, low quality | +| [GGUF](https://huggingface.co/mradermacher/MN-Violet-Lotus-12B-i1-GGUF/resolve/main/MN-Violet-Lotus-12B.i1-Q4_0_4_8.gguf) | i1-Q4_0_4_8 | 7.2 | fast on arm+i8mm, low quality | +| [GGUF](https://huggingface.co/mradermacher/MN-Violet-Lotus-12B-i1-GGUF/resolve/main/MN-Violet-Lotus-12B.i1-Q4_0_8_8.gguf) | i1-Q4_0_8_8 | 7.2 | fast on arm+sve, low quality | +| [GGUF](https://huggingface.co/mradermacher/MN-Violet-Lotus-12B-i1-GGUF/resolve/main/MN-Violet-Lotus-12B.i1-Q4_0.gguf) | i1-Q4_0 | 7.2 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/MN-Violet-Lotus-12B-i1-GGUF/resolve/main/MN-Violet-Lotus-12B.i1-Q4_K_S.gguf) | i1-Q4_K_S | 7.2 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/MN-Violet-Lotus-12B-i1-GGUF/resolve/main/MN-Violet-Lotus-12B.i1-Q4_K_M.gguf) | i1-Q4_K_M | 7.6 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/MN-Violet-Lotus-12B-i1-GGUF/resolve/main/MN-Violet-Lotus-12B.i1-Q5_K_S.gguf) | i1-Q5_K_S | 8.6 | | +| [GGUF](https://huggingface.co/mradermacher/MN-Violet-Lotus-12B-i1-GGUF/resolve/main/MN-Violet-Lotus-12B.i1-Q5_K_M.gguf) | i1-Q5_K_M | 8.8 | | +| [GGUF](https://huggingface.co/mradermacher/MN-Violet-Lotus-12B-i1-GGUF/resolve/main/MN-Violet-Lotus-12B.i1-Q6_K.gguf) | i1-Q6_K | 10.2 | practically like static Q6_K | + +Here is a handy graph by ikawrakow 
comparing some lower-quality quant +types (lower is better): + +![Graph comparing lower-quality quant types](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for answers to +questions you might have, or to request that another model be quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..29780c1 --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:526fe0dc1a4795602a3b9889c35fca042dd008020e1ea803207c53489cdefe6f +size 7054405