From 56d9b82b6e3f9b8b75d67dca356cdcafd98d1e8b Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Wed, 20 May 2026 06:51:11 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mradermacher/Luna-i1-GGUF Source: Original Platform --- .gitattributes | 60 +++++++++++++++++++++++++++ Luna.i1-IQ1_M.gguf | 3 ++ Luna.i1-IQ1_S.gguf | 3 ++ Luna.i1-IQ2_M.gguf | 3 ++ Luna.i1-IQ2_S.gguf | 3 ++ Luna.i1-IQ2_XS.gguf | 3 ++ Luna.i1-IQ2_XXS.gguf | 3 ++ Luna.i1-IQ3_M.gguf | 3 ++ Luna.i1-IQ3_S.gguf | 3 ++ Luna.i1-IQ3_XS.gguf | 3 ++ Luna.i1-IQ3_XXS.gguf | 3 ++ Luna.i1-IQ4_NL.gguf | 3 ++ Luna.i1-IQ4_XS.gguf | 3 ++ Luna.i1-Q2_K.gguf | 3 ++ Luna.i1-Q2_K_S.gguf | 3 ++ Luna.i1-Q3_K_L.gguf | 3 ++ Luna.i1-Q3_K_M.gguf | 3 ++ Luna.i1-Q3_K_S.gguf | 3 ++ Luna.i1-Q4_0.gguf | 3 ++ Luna.i1-Q4_1.gguf | 3 ++ Luna.i1-Q4_K_M.gguf | 3 ++ Luna.i1-Q4_K_S.gguf | 3 ++ Luna.i1-Q5_K_M.gguf | 3 ++ Luna.i1-Q5_K_S.gguf | 3 ++ Luna.i1-Q6_K.gguf | 3 ++ Luna.imatrix.gguf | 3 ++ README.md | 98 ++++++++++++++++++++++++++++++++++++++++++++ 27 files changed, 233 insertions(+) create mode 100644 .gitattributes create mode 100644 Luna.i1-IQ1_M.gguf create mode 100644 Luna.i1-IQ1_S.gguf create mode 100644 Luna.i1-IQ2_M.gguf create mode 100644 Luna.i1-IQ2_S.gguf create mode 100644 Luna.i1-IQ2_XS.gguf create mode 100644 Luna.i1-IQ2_XXS.gguf create mode 100644 Luna.i1-IQ3_M.gguf create mode 100644 Luna.i1-IQ3_S.gguf create mode 100644 Luna.i1-IQ3_XS.gguf create mode 100644 Luna.i1-IQ3_XXS.gguf create mode 100644 Luna.i1-IQ4_NL.gguf create mode 100644 Luna.i1-IQ4_XS.gguf create mode 100644 Luna.i1-Q2_K.gguf create mode 100644 Luna.i1-Q2_K_S.gguf create mode 100644 Luna.i1-Q3_K_L.gguf create mode 100644 Luna.i1-Q3_K_M.gguf create mode 100644 Luna.i1-Q3_K_S.gguf create mode 100644 Luna.i1-Q4_0.gguf 
create mode 100644 Luna.i1-Q4_1.gguf create mode 100644 Luna.i1-Q4_K_M.gguf create mode 100644 Luna.i1-Q4_K_S.gguf create mode 100644 Luna.i1-Q5_K_M.gguf create mode 100644 Luna.i1-Q5_K_S.gguf create mode 100644 Luna.i1-Q6_K.gguf create mode 100644 Luna.imatrix.gguf create mode 100644 README.md diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..aa14a8b --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text 
+Luna.imatrix.gguf filter=lfs diff=lfs merge=lfs -text +Luna.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +Luna.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +Luna.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +Luna.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +Luna.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +Luna.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Luna.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +Luna.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text +Luna.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +Luna.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Luna.i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +Luna.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +Luna.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +Luna.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Luna.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Luna.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Luna.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Luna.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +Luna.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +Luna.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Luna.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Luna.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Luna.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Luna.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/Luna.i1-IQ1_M.gguf b/Luna.i1-IQ1_M.gguf new file mode 100644 index 0000000..01a147a --- /dev/null +++ b/Luna.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ac03bc48d55182d9013c5e5fc12d8187bb386184572be8a23b60cc00e2a04fe +size 1127018016 diff --git a/Luna.i1-IQ1_S.gguf b/Luna.i1-IQ1_S.gguf new file mode 100644 index 0000000..58eb071 --- /dev/null +++ b/Luna.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21b2f3da0d394a0f2807d611f2d3a1178281ba2e0fb7094e6f986e17e70e523d +size 1055256096 diff 
--git a/Luna.i1-IQ2_M.gguf b/Luna.i1-IQ2_M.gguf new file mode 100644 index 0000000..29da7fc --- /dev/null +++ b/Luna.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64ab49c908a9d53ad2e0d76208190f4c38d564f5c6e6c67b8081fe8a40ca0f8e +size 1512984096 diff --git a/Luna.i1-IQ2_S.gguf b/Luna.i1-IQ2_S.gguf new file mode 100644 index 0000000..f21b7e7 --- /dev/null +++ b/Luna.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e0d6f56222007f153f264a7d531e216e3b203d4b8f1a8d32c9ddba736f5c690 +size 1417301536 diff --git a/Luna.i1-IQ2_XS.gguf b/Luna.i1-IQ2_XS.gguf new file mode 100644 index 0000000..902ed34 --- /dev/null +++ b/Luna.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0415d1f4addd88b52bed52f9a6bcebf41c85e14f35f54110802955cee3c20be +size 1354100256 diff --git a/Luna.i1-IQ2_XXS.gguf b/Luna.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..09d0a04 --- /dev/null +++ b/Luna.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:434c1a57b3e814fad866f20e6b0fe2344610c2852e73a1dc03b1173bb346621d +size 1246621216 diff --git a/Luna.i1-IQ3_M.gguf b/Luna.i1-IQ3_M.gguf new file mode 100644 index 0000000..4ec4e3e --- /dev/null +++ b/Luna.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc07aa1a1a061f852e79a9570234fec5e9ba19764b8f9b1f65e13bf0a389bab2 +size 1962896416 diff --git a/Luna.i1-IQ3_S.gguf b/Luna.i1-IQ3_S.gguf new file mode 100644 index 0000000..1905c12 --- /dev/null +++ b/Luna.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4750255355ad05829c795274085951228d2764bdfb1d6572144102880e37e8a +size 1899531296 diff --git a/Luna.i1-IQ3_XS.gguf b/Luna.i1-IQ3_XS.gguf new file mode 100644 index 0000000..58e8036 --- /dev/null +++ b/Luna.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:e28e99fc138e514cef1bd0b6e02ddfb6f90ed54df4fb8cf033ab1d2de54ab5e2 +size 1814375456 diff --git a/Luna.i1-IQ3_XXS.gguf b/Luna.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..5a63673 --- /dev/null +++ b/Luna.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3c8ff1b450a7e8f2c6d09f4dc9355d63a5584bb06bf1dd60723dd675e757d84 +size 1670188576 diff --git a/Luna.i1-IQ4_NL.gguf b/Luna.i1-IQ4_NL.gguf new file mode 100644 index 0000000..0b63b3d --- /dev/null +++ b/Luna.i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbbc0d2b247bc5ca1625c698fb418de0ad871381461bd4a3cb45a03acdb51fbe +size 2381343776 diff --git a/Luna.i1-IQ4_XS.gguf b/Luna.i1-IQ4_XS.gguf new file mode 100644 index 0000000..7c79e09 --- /dev/null +++ b/Luna.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ffbdd9993e4f052f568749fb79c7cff94832fc4be913f6b42432eba7004c6bb +size 2270751776 diff --git a/Luna.i1-Q2_K.gguf b/Luna.i1-Q2_K.gguf new file mode 100644 index 0000000..1e6cfb3 --- /dev/null +++ b/Luna.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e8284d8cf22f9e12a4688abed90dca38134a5a657023940245a49b78211e85b +size 1669499936 diff --git a/Luna.i1-Q2_K_S.gguf b/Luna.i1-Q2_K_S.gguf new file mode 100644 index 0000000..6735a32 --- /dev/null +++ b/Luna.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b195bdefb5a751cd10318da2061f357848b6611ac930d8dfb22f9b89a26c922 +size 1563454496 diff --git a/Luna.i1-Q3_K_L.gguf b/Luna.i1-Q3_K_L.gguf new file mode 100644 index 0000000..96d6343 --- /dev/null +++ b/Luna.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2be391c818abc54d12e03646e0fbdf903a1cb42388154e69ec045370b49bdfef +size 2239786016 diff --git a/Luna.i1-Q3_K_M.gguf b/Luna.i1-Q3_K_M.gguf new file mode 100644 index 0000000..44d99ed --- /dev/null +++ b/Luna.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ 
+version https://git-lfs.github.com/spec/v1 +oid sha256:fe6be6fc84a36bbb7bd0de7bec1784813891061cb1bdc0a4e0405f1ce811e40d +size 2075618336 diff --git a/Luna.i1-Q3_K_S.gguf b/Luna.i1-Q3_K_S.gguf new file mode 100644 index 0000000..b238000 --- /dev/null +++ b/Luna.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0af58c7e0d8c1f0f689768ed4175cc5584bcaa385aa352398784aa9552ac8bd5 +size 1886997536 diff --git a/Luna.i1-Q4_0.gguf b/Luna.i1-Q4_0.gguf new file mode 100644 index 0000000..e8411d1 --- /dev/null +++ b/Luna.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34bc89476d33583b5ec01309da7b63981125392f780942b2f96f930edd2315c1 +size 2375773216 diff --git a/Luna.i1-Q4_1.gguf b/Luna.i1-Q4_1.gguf new file mode 100644 index 0000000..7b25601 --- /dev/null +++ b/Luna.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1820eda48ec8c0435aa16d1165113c440bd5844f8e81e292d08839bafd43b77 +size 2596629536 diff --git a/Luna.i1-Q4_K_M.gguf b/Luna.i1-Q4_K_M.gguf new file mode 100644 index 0000000..a24d661 --- /dev/null +++ b/Luna.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0911199dcd027b9fe1ea43e044dfb12fc20a870dc2e2e90b333e4bb6ff5e8802 +size 2497281056 diff --git a/Luna.i1-Q4_K_S.gguf b/Luna.i1-Q4_K_S.gguf new file mode 100644 index 0000000..b0abf57 --- /dev/null +++ b/Luna.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2d63b40f40b50c4db1afe38e5e8276f51dc26d4f6c2c32018c5ca5da6c66152 +size 2383309856 diff --git a/Luna.i1-Q5_K_M.gguf b/Luna.i1-Q5_K_M.gguf new file mode 100644 index 0000000..dab8f28 --- /dev/null +++ b/Luna.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35b46162ebd26c0704b92726bc2dbb2aa060e876ecb9723bd6c1c18e28318912 +size 2889514016 diff --git a/Luna.i1-Q5_K_S.gguf b/Luna.i1-Q5_K_S.gguf new file mode 100644 index 0000000..c25255b --- /dev/null 
+++ b/Luna.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68966312a189699010cc988f760105406dbbc75669c2ddd1faa4b8ad34054298 +size 2823711776 diff --git a/Luna.i1-Q6_K.gguf b/Luna.i1-Q6_K.gguf new file mode 100644 index 0000000..fed0361 --- /dev/null +++ b/Luna.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0ac19da3df2bb3791cccf1eec3514e34f92764c44aa03a8092b38b9fadfd318 +size 3306261536 diff --git a/Luna.imatrix.gguf b/Luna.imatrix.gguf new file mode 100644 index 0000000..68955b8 --- /dev/null +++ b/Luna.imatrix.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:061f9cd4430c251fb6727108dc559edab369d4b06918d962e471d43e87e8006c +size 3872640 diff --git a/README.md b/README.md new file mode 100644 index 0000000..52ebbe3 --- /dev/null +++ b/README.md @@ -0,0 +1,98 @@ +--- +base_model: beyoru/Luna +language: +- en +- zh +- vi +library_name: transformers +license: mit +mradermacher: + readme_rev: 1 +quantized_by: mradermacher +tags: +- roleplay +- chat +- rp +- character +- waifu +- character +- natural converation +- creative writing +- storytelling +- sfw +--- +## About + + + + + + + + + +weighted/imatrix quants of https://huggingface.co/beyoru/Luna + + + +***For a convenient overview and download list, visit our [model page for this model](https://hf.tst.eu/model#Luna-i1-GGUF).*** + +static quants are available at https://huggingface.co/mradermacher/Luna-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. 
IQ-quants are often preferable over similarly sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/Luna-i1-GGUF/resolve/main/Luna.imatrix.gguf) | imatrix | 0.1 | imatrix file (for creating your own quants) | +| [GGUF](https://huggingface.co/mradermacher/Luna-i1-GGUF/resolve/main/Luna.i1-IQ1_S.gguf) | i1-IQ1_S | 1.2 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/Luna-i1-GGUF/resolve/main/Luna.i1-IQ1_M.gguf) | i1-IQ1_M | 1.2 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/Luna-i1-GGUF/resolve/main/Luna.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 1.3 | | +| [GGUF](https://huggingface.co/mradermacher/Luna-i1-GGUF/resolve/main/Luna.i1-IQ2_XS.gguf) | i1-IQ2_XS | 1.5 | | +| [GGUF](https://huggingface.co/mradermacher/Luna-i1-GGUF/resolve/main/Luna.i1-IQ2_S.gguf) | i1-IQ2_S | 1.5 | | +| [GGUF](https://huggingface.co/mradermacher/Luna-i1-GGUF/resolve/main/Luna.i1-IQ2_M.gguf) | i1-IQ2_M | 1.6 | | +| [GGUF](https://huggingface.co/mradermacher/Luna-i1-GGUF/resolve/main/Luna.i1-Q2_K_S.gguf) | i1-Q2_K_S | 1.7 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/Luna-i1-GGUF/resolve/main/Luna.i1-Q2_K.gguf) | i1-Q2_K | 1.8 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/Luna-i1-GGUF/resolve/main/Luna.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 1.8 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/Luna-i1-GGUF/resolve/main/Luna.i1-IQ3_XS.gguf) | i1-IQ3_XS | 1.9 | | +| [GGUF](https://huggingface.co/mradermacher/Luna-i1-GGUF/resolve/main/Luna.i1-Q3_K_S.gguf) | i1-Q3_K_S | 2.0 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/Luna-i1-GGUF/resolve/main/Luna.i1-IQ3_S.gguf) | i1-IQ3_S | 2.0 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/Luna-i1-GGUF/resolve/main/Luna.i1-IQ3_M.gguf) | i1-IQ3_M | 2.1 | | +| [GGUF](https://huggingface.co/mradermacher/Luna-i1-GGUF/resolve/main/Luna.i1-Q3_K_M.gguf) | 
i1-Q3_K_M | 2.2 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/Luna-i1-GGUF/resolve/main/Luna.i1-Q3_K_L.gguf) | i1-Q3_K_L | 2.3 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/Luna-i1-GGUF/resolve/main/Luna.i1-IQ4_XS.gguf) | i1-IQ4_XS | 2.4 | | +| [GGUF](https://huggingface.co/mradermacher/Luna-i1-GGUF/resolve/main/Luna.i1-Q4_0.gguf) | i1-Q4_0 | 2.5 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/Luna-i1-GGUF/resolve/main/Luna.i1-IQ4_NL.gguf) | i1-IQ4_NL | 2.5 | prefer IQ4_XS | +| [GGUF](https://huggingface.co/mradermacher/Luna-i1-GGUF/resolve/main/Luna.i1-Q4_K_S.gguf) | i1-Q4_K_S | 2.5 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/Luna-i1-GGUF/resolve/main/Luna.i1-Q4_K_M.gguf) | i1-Q4_K_M | 2.6 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/Luna-i1-GGUF/resolve/main/Luna.i1-Q4_1.gguf) | i1-Q4_1 | 2.7 | | +| [GGUF](https://huggingface.co/mradermacher/Luna-i1-GGUF/resolve/main/Luna.i1-Q5_K_S.gguf) | i1-Q5_K_S | 2.9 | | +| [GGUF](https://huggingface.co/mradermacher/Luna-i1-GGUF/resolve/main/Luna.i1-Q5_K_M.gguf) | i1-Q5_K_M | 3.0 | | +| [GGUF](https://huggingface.co/mradermacher/Luna-i1-GGUF/resolve/main/Luna.i1-Q6_K.gguf) | i1-Q6_K | 3.4 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. 
Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + +