From 6b600b67518fa7bb0296da772ba9ad70c2eb868b Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Thu, 23 Apr 2026 01:08:50 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mradermacher/MXLewd-L2-20B-i1-GGUF Source: Original Platform --- .gitattributes | 58 ++++++++++++++++++++++++++++++ MXLewd-L2-20B.i1-IQ1_M.gguf | 3 ++ MXLewd-L2-20B.i1-IQ1_S.gguf | 3 ++ MXLewd-L2-20B.i1-IQ2_M.gguf | 3 ++ MXLewd-L2-20B.i1-IQ2_S.gguf | 3 ++ MXLewd-L2-20B.i1-IQ2_XS.gguf | 3 ++ MXLewd-L2-20B.i1-IQ2_XXS.gguf | 3 ++ MXLewd-L2-20B.i1-IQ3_M.gguf | 3 ++ MXLewd-L2-20B.i1-IQ3_S.gguf | 3 ++ MXLewd-L2-20B.i1-IQ3_XS.gguf | 3 ++ MXLewd-L2-20B.i1-IQ3_XXS.gguf | 3 ++ MXLewd-L2-20B.i1-IQ4_NL.gguf | 3 ++ MXLewd-L2-20B.i1-IQ4_XS.gguf | 3 ++ MXLewd-L2-20B.i1-Q2_K.gguf | 3 ++ MXLewd-L2-20B.i1-Q3_K_L.gguf | 3 ++ MXLewd-L2-20B.i1-Q3_K_M.gguf | 3 ++ MXLewd-L2-20B.i1-Q3_K_S.gguf | 3 ++ MXLewd-L2-20B.i1-Q4_0.gguf | 3 ++ MXLewd-L2-20B.i1-Q4_K_M.gguf | 3 ++ MXLewd-L2-20B.i1-Q4_K_S.gguf | 3 ++ MXLewd-L2-20B.i1-Q5_K_M.gguf | 3 ++ MXLewd-L2-20B.i1-Q5_K_S.gguf | 3 ++ MXLewd-L2-20B.i1-Q6_K.gguf | 3 ++ README.md | 68 +++++++++++++++++++++++++++++++++++ imatrix.dat | 3 ++ 25 files changed, 195 insertions(+) create mode 100644 .gitattributes create mode 100644 MXLewd-L2-20B.i1-IQ1_M.gguf create mode 100644 MXLewd-L2-20B.i1-IQ1_S.gguf create mode 100644 MXLewd-L2-20B.i1-IQ2_M.gguf create mode 100644 MXLewd-L2-20B.i1-IQ2_S.gguf create mode 100644 MXLewd-L2-20B.i1-IQ2_XS.gguf create mode 100644 MXLewd-L2-20B.i1-IQ2_XXS.gguf create mode 100644 MXLewd-L2-20B.i1-IQ3_M.gguf create mode 100644 MXLewd-L2-20B.i1-IQ3_S.gguf create mode 100644 MXLewd-L2-20B.i1-IQ3_XS.gguf create mode 100644 MXLewd-L2-20B.i1-IQ3_XXS.gguf create mode 100644 MXLewd-L2-20B.i1-IQ4_NL.gguf create mode 100644 MXLewd-L2-20B.i1-IQ4_XS.gguf create mode 100644 MXLewd-L2-20B.i1-Q2_K.gguf create mode 100644 MXLewd-L2-20B.i1-Q3_K_L.gguf create mode 100644 MXLewd-L2-20B.i1-Q3_K_M.gguf create mode 100644 MXLewd-L2-20B.i1-Q3_K_S.gguf create mode 100644 MXLewd-L2-20B.i1-Q4_0.gguf create mode 100644 MXLewd-L2-20B.i1-Q4_K_M.gguf create mode 100644 MXLewd-L2-20B.i1-Q4_K_S.gguf create mode 100644 MXLewd-L2-20B.i1-Q5_K_M.gguf create mode 100644 MXLewd-L2-20B.i1-Q5_K_S.gguf create mode 100644 MXLewd-L2-20B.i1-Q6_K.gguf create mode 100644 README.md create mode 100644 imatrix.dat diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..580da38 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,58 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +MXLewd-L2-20B.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +MXLewd-L2-20B.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +MXLewd-L2-20B.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +MXLewd-L2-20B.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +MXLewd-L2-20B.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +MXLewd-L2-20B.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +MXLewd-L2-20B.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +MXLewd-L2-20B.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +MXLewd-L2-20B.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +MXLewd-L2-20B.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +MXLewd-L2-20B.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +MXLewd-L2-20B.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +MXLewd-L2-20B.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +MXLewd-L2-20B.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +MXLewd-L2-20B.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text +MXLewd-L2-20B.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +MXLewd-L2-20B.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +MXLewd-L2-20B.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +MXLewd-L2-20B.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +MXLewd-L2-20B.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +MXLewd-L2-20B.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +MXLewd-L2-20B.i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/MXLewd-L2-20B.i1-IQ1_M.gguf b/MXLewd-L2-20B.i1-IQ1_M.gguf new file mode 100644 index 0000000..615be59 --- /dev/null +++ b/MXLewd-L2-20B.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb4191d8953bdb955972d6c45be2553d38c00a5ff7674dd0786109582ee86674 +size 4982148576 diff --git a/MXLewd-L2-20B.i1-IQ1_S.gguf b/MXLewd-L2-20B.i1-IQ1_S.gguf new file mode 100644 index 0000000..99366d7 --- /dev/null +++ b/MXLewd-L2-20B.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d7807e0b795b23f650490e59d3890cc0361546745cb8d30bacb63e9c84dd7b1 +size 4609023456 diff --git a/MXLewd-L2-20B.i1-IQ2_M.gguf b/MXLewd-L2-20B.i1-IQ2_M.gguf new file mode 100644 index 0000000..91e03d8 --- /dev/null +++ b/MXLewd-L2-20B.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a5fc7d99e57d7a35ea6c6c00da115261fc867a6bc70dcd8c8192e381cf616dc +size 7110399456 diff --git a/MXLewd-L2-20B.i1-IQ2_S.gguf b/MXLewd-L2-20B.i1-IQ2_S.gguf new file mode 100644 index 0000000..2294e78 --- /dev/null +++ b/MXLewd-L2-20B.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a6823bdd34105ac82fec92e817f280cfb9561a392c37d00565e47eb0e415390 +size 6612899296 diff --git a/MXLewd-L2-20B.i1-IQ2_XS.gguf b/MXLewd-L2-20B.i1-IQ2_XS.gguf new file mode 100644 index 0000000..acbe741 --- /dev/null +++ b/MXLewd-L2-20B.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e990b01e7e3c69c6326a4def466679606988bdd779e6682baf7d6c3a854222b +size 6152314336 diff --git a/MXLewd-L2-20B.i1-IQ2_XXS.gguf b/MXLewd-L2-20B.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..02f6213 --- /dev/null +++ b/MXLewd-L2-20B.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b08fdd693ee30d619c25af40b4c5db9f691f6948aca72d42e337bd5178f2da9 +size 5604023776 diff --git a/MXLewd-L2-20B.i1-IQ3_M.gguf b/MXLewd-L2-20B.i1-IQ3_M.gguf new file mode 100644 index 0000000..bcf4563 --- /dev/null +++ b/MXLewd-L2-20B.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:915b4dfd5dada8bffff53ae5f814d404cfb56a396f644b9845d689f2f35f85e6 +size 9349170656 diff --git a/MXLewd-L2-20B.i1-IQ3_S.gguf b/MXLewd-L2-20B.i1-IQ3_S.gguf new file mode 100644 index 0000000..416b00a --- /dev/null +++ b/MXLewd-L2-20B.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b770415c1f76ce36f377fc50d1979c25a6cd9d4a4bdd3aa199880f7bb6a74d7d +size 8851650016 diff --git a/MXLewd-L2-20B.i1-IQ3_XS.gguf b/MXLewd-L2-20B.i1-IQ3_XS.gguf new file mode 100644 index 0000000..ebb2996 --- /dev/null +++ b/MXLewd-L2-20B.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1657fd74ab141f7bb552c4d5b67ffd5dae3b1dec61d0dea2d4f683fd70f8e73 +size 8387409376 diff --git a/MXLewd-L2-20B.i1-IQ3_XXS.gguf b/MXLewd-L2-20B.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..8462e5d --- /dev/null +++ b/MXLewd-L2-20B.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5174166fae91c273a8976eded9a0bb72c39c7da2d82d7b4bd2a27440d91b4878 +size 7802828256 diff --git a/MXLewd-L2-20B.i1-IQ4_NL.gguf b/MXLewd-L2-20B.i1-IQ4_NL.gguf new file mode 100644 index 0000000..bb438e7 --- /dev/null +++ b/MXLewd-L2-20B.i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:045b7618905c00fdc7b8afa1e4a20cf61a819280cafee2669ffe928f9e2003ed +size 11485306336 diff --git a/MXLewd-L2-20B.i1-IQ4_XS.gguf b/MXLewd-L2-20B.i1-IQ4_XS.gguf new file mode 100644 index 0000000..b3356fa --- /dev/null +++ b/MXLewd-L2-20B.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a87b8885c2d6ab684b806d1346402e1a559246538c17103e85620a3ad0f2b83 +size 10865622496 diff --git a/MXLewd-L2-20B.i1-Q2_K.gguf b/MXLewd-L2-20B.i1-Q2_K.gguf new file mode 100644 index 0000000..da8b4bf --- /dev/null +++ b/MXLewd-L2-20B.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b68244399859cbccc2945955b986fd005dc929548595c7bd22b79e5a6d186b6c +size 7613500896 diff --git a/MXLewd-L2-20B.i1-Q3_K_L.gguf b/MXLewd-L2-20B.i1-Q3_K_L.gguf new file mode 100644 index 0000000..be866da --- /dev/null +++ b/MXLewd-L2-20B.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fc62cef8e50a7d31eafbc95c8d22c1821de90c8e4838ba2049b32b4b70c07a1 +size 10821047776 diff --git a/MXLewd-L2-20B.i1-Q3_K_M.gguf b/MXLewd-L2-20B.i1-Q3_K_M.gguf new file mode 100644 index 0000000..c95929d --- /dev/null +++ b/MXLewd-L2-20B.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc5cb87736907175cfe7a700ccbbfb06263f6b7632b01c31e4e5a7ddf970f8fe +size 9899283936 diff --git a/MXLewd-L2-20B.i1-Q3_K_S.gguf b/MXLewd-L2-20B.i1-Q3_K_S.gguf new file mode 100644 index 0000000..070a724 --- /dev/null +++ b/MXLewd-L2-20B.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29eb48412f92ef6a5d3225f7b9f60de7412524553a63757d82124ed9c9ee33da +size 8851650016 diff --git a/MXLewd-L2-20B.i1-Q4_0.gguf b/MXLewd-L2-20B.i1-Q4_0.gguf new file mode 100644 index 0000000..0d6d40a --- /dev/null +++ b/MXLewd-L2-20B.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f0c7e571974592ae6acf6fc5d20cc2dd71828b344fddfc17b95be273d2ca16a +size 11516272096 diff --git a/MXLewd-L2-20B.i1-Q4_K_M.gguf b/MXLewd-L2-20B.i1-Q4_K_M.gguf new file mode 100644 index 0000000..c17d12e --- /dev/null +++ b/MXLewd-L2-20B.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:927dac273107038ecbc565981ea3fff7ead5ff770f6036e032034046c108f962 +size 12235488736 diff --git a/MXLewd-L2-20B.i1-Q4_K_S.gguf b/MXLewd-L2-20B.i1-Q4_K_S.gguf new file mode 100644 index 0000000..a29096d --- /dev/null +++ b/MXLewd-L2-20B.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:978ad559bd796b5c51982cb311dd6a7f043848646375a23679ab9bc37b2e5c1a +size 11560345056 diff --git a/MXLewd-L2-20B.i1-Q5_K_M.gguf b/MXLewd-L2-20B.i1-Q5_K_M.gguf new file mode 100644 index 0000000..5c69f75 --- /dev/null +++ b/MXLewd-L2-20B.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de66ac6c005cb3b7cdc95ac331e15563c70c9f313400317b557287a8bc508dbf +size 14350499296 diff --git a/MXLewd-L2-20B.i1-Q5_K_S.gguf b/MXLewd-L2-20B.i1-Q5_K_S.gguf new file mode 100644 index 0000000..9bb6906 --- /dev/null +++ b/MXLewd-L2-20B.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b124b2e9e4c370534356e78454f0dede673f145a7ceb42181d48ff5cd6969317 +size 13964041696 diff --git a/MXLewd-L2-20B.i1-Q6_K.gguf b/MXLewd-L2-20B.i1-Q6_K.gguf new file mode 100644 index 0000000..66c3b8d --- /dev/null +++ b/MXLewd-L2-20B.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:241559700b3acb8394662a03d03421d04c32ce49e96625832a55ab794a81fd19 +size 16597698016 diff --git a/README.md b/README.md new file mode 100644 index 0000000..09ff56b --- /dev/null +++ b/README.md @@ -0,0 +1,68 @@ +--- +base_model: Undi95/MXLewd-L2-20B +language: +- en +library_name: transformers +license: cc-by-nc-4.0 +quantized_by: mradermacher +--- +## About + +weighted/imatrix quants of https://huggingface.co/Undi95/MXLewd-L2-20B + + +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/MXLewd-L2-20B-i1-GGUF/resolve/main/MXLewd-L2-20B.i1-IQ1_S.gguf) | i1-IQ1_S | 4.7 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/MXLewd-L2-20B-i1-GGUF/resolve/main/MXLewd-L2-20B.i1-IQ1_M.gguf) | i1-IQ1_M | 5.1 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/MXLewd-L2-20B-i1-GGUF/resolve/main/MXLewd-L2-20B.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 5.7 | | +| [GGUF](https://huggingface.co/mradermacher/MXLewd-L2-20B-i1-GGUF/resolve/main/MXLewd-L2-20B.i1-IQ2_XS.gguf) | i1-IQ2_XS | 6.3 | | +| [GGUF](https://huggingface.co/mradermacher/MXLewd-L2-20B-i1-GGUF/resolve/main/MXLewd-L2-20B.i1-IQ2_S.gguf) | i1-IQ2_S | 6.7 | | +| [GGUF](https://huggingface.co/mradermacher/MXLewd-L2-20B-i1-GGUF/resolve/main/MXLewd-L2-20B.i1-IQ2_M.gguf) | i1-IQ2_M | 7.2 | | +| [GGUF](https://huggingface.co/mradermacher/MXLewd-L2-20B-i1-GGUF/resolve/main/MXLewd-L2-20B.i1-Q2_K.gguf) | i1-Q2_K | 7.7 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/MXLewd-L2-20B-i1-GGUF/resolve/main/MXLewd-L2-20B.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 7.9 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/MXLewd-L2-20B-i1-GGUF/resolve/main/MXLewd-L2-20B.i1-IQ3_XS.gguf) | i1-IQ3_XS | 8.5 | | +| [GGUF](https://huggingface.co/mradermacher/MXLewd-L2-20B-i1-GGUF/resolve/main/MXLewd-L2-20B.i1-IQ3_S.gguf) | i1-IQ3_S | 9.0 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/MXLewd-L2-20B-i1-GGUF/resolve/main/MXLewd-L2-20B.i1-Q3_K_S.gguf) | i1-Q3_K_S | 9.0 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/MXLewd-L2-20B-i1-GGUF/resolve/main/MXLewd-L2-20B.i1-IQ3_M.gguf) | i1-IQ3_M | 9.4 | | +| [GGUF](https://huggingface.co/mradermacher/MXLewd-L2-20B-i1-GGUF/resolve/main/MXLewd-L2-20B.i1-Q3_K_M.gguf) | i1-Q3_K_M | 10.0 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/MXLewd-L2-20B-i1-GGUF/resolve/main/MXLewd-L2-20B.i1-Q3_K_L.gguf) | i1-Q3_K_L | 10.9 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/MXLewd-L2-20B-i1-GGUF/resolve/main/MXLewd-L2-20B.i1-IQ4_XS.gguf) | i1-IQ4_XS | 11.0 | | +| [GGUF](https://huggingface.co/mradermacher/MXLewd-L2-20B-i1-GGUF/resolve/main/MXLewd-L2-20B.i1-IQ4_NL.gguf) | i1-IQ4_NL | 11.6 | prefer IQ4_XS | +| [GGUF](https://huggingface.co/mradermacher/MXLewd-L2-20B-i1-GGUF/resolve/main/MXLewd-L2-20B.i1-Q4_0.gguf) | i1-Q4_0 | 11.6 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/MXLewd-L2-20B-i1-GGUF/resolve/main/MXLewd-L2-20B.i1-Q4_K_S.gguf) | i1-Q4_K_S | 11.7 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/MXLewd-L2-20B-i1-GGUF/resolve/main/MXLewd-L2-20B.i1-Q4_K_M.gguf) | i1-Q4_K_M | 12.3 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/MXLewd-L2-20B-i1-GGUF/resolve/main/MXLewd-L2-20B.i1-Q5_K_S.gguf) | i1-Q5_K_S | 14.1 | | +| [GGUF](https://huggingface.co/mradermacher/MXLewd-L2-20B-i1-GGUF/resolve/main/MXLewd-L2-20B.i1-Q5_K_M.gguf) | i1-Q5_K_M | 14.5 | | +| [GGUF](https://huggingface.co/mradermacher/MXLewd-L2-20B-i1-GGUF/resolve/main/MXLewd-L2-20B.i1-Q6_K.gguf) | i1-Q6_K | 16.7 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..dd128c8 --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3608fda7e2eaeb1678d2d50bc40abc262b30a601955d5beb478b8aa1d80520b7 +size 11061292