commit 837594af51ce1d73c47a9502930f28a579f147f7 Author: ModelHub XC Date: Fri Jun 5 12:54:20 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/Midnight-Bloom-12B-i1-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..77b4d77 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +Midnight-Bloom-12B.i1-Q2_K.gguf filter=lfs diff=lfs 
merge=lfs -text +Midnight-Bloom-12B.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +Midnight-Bloom-12B.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Midnight-Bloom-12B.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Midnight-Bloom-12B.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Midnight-Bloom-12B.i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +Midnight-Bloom-12B.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Midnight-Bloom-12B.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +Midnight-Bloom-12B.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +Midnight-Bloom-12B.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +Midnight-Bloom-12B.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Midnight-Bloom-12B.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +Midnight-Bloom-12B.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Midnight-Bloom-12B.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Midnight-Bloom-12B.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Midnight-Bloom-12B.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +Midnight-Bloom-12B.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Midnight-Bloom-12B.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +Midnight-Bloom-12B.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +Midnight-Bloom-12B.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Midnight-Bloom-12B.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +Midnight-Bloom-12B.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +Midnight-Bloom-12B.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +Midnight-Bloom-12B.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/Midnight-Bloom-12B.i1-IQ1_M.gguf b/Midnight-Bloom-12B.i1-IQ1_M.gguf new file mode 100644 index 0000000..ff6daf7 --- /dev/null +++ b/Midnight-Bloom-12B.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0d80f45c8f6e32be41e8558ca312493af01e94bcd9e811dfad20827ca91a44e +size 3164728608 diff --git 
a/Midnight-Bloom-12B.i1-IQ1_S.gguf b/Midnight-Bloom-12B.i1-IQ1_S.gguf new file mode 100644 index 0000000..0ef78d1 --- /dev/null +++ b/Midnight-Bloom-12B.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37b8c367f7ce77698f6fbec590fd94e5d29850a5b4fc148acf76a9f7ef560fe5 +size 2947415328 diff --git a/Midnight-Bloom-12B.i1-IQ2_M.gguf b/Midnight-Bloom-12B.i1-IQ2_M.gguf new file mode 100644 index 0000000..f6b807a --- /dev/null +++ b/Midnight-Bloom-12B.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5532fa7202f6906a120ce299044b1f5a855e975939034ab0212b929589dcb6de +size 4310461728 diff --git a/Midnight-Bloom-12B.i1-IQ2_S.gguf b/Midnight-Bloom-12B.i1-IQ2_S.gguf new file mode 100644 index 0000000..62bcb1c --- /dev/null +++ b/Midnight-Bloom-12B.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cda073b295aab2ae1d1be1f317b6c7fe60cb09258a63d24c923f3156a0d1920c +size 4020710688 diff --git a/Midnight-Bloom-12B.i1-IQ2_XS.gguf b/Midnight-Bloom-12B.i1-IQ2_XS.gguf new file mode 100644 index 0000000..3d6c787 --- /dev/null +++ b/Midnight-Bloom-12B.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dac2226d9d60b16070c4b57e1439f98dae7e4426e9c7374abc3fd947fb2dbeb7 +size 3840261408 diff --git a/Midnight-Bloom-12B.i1-IQ2_XXS.gguf b/Midnight-Bloom-12B.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..acb4eb3 --- /dev/null +++ b/Midnight-Bloom-12B.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d30acd406684879ed56082a3d7e8a3472ed6a95a1a61eb6e80b89e884795c089 +size 3526917408 diff --git a/Midnight-Bloom-12B.i1-IQ3_M.gguf b/Midnight-Bloom-12B.i1-IQ3_M.gguf new file mode 100644 index 0000000..b53ab87 --- /dev/null +++ b/Midnight-Bloom-12B.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77bd96d08833f48eb92278918fe52cef9bb95ed2de5e7981bf212eafebfeead5 +size 5655723168 diff 
--git a/Midnight-Bloom-12B.i1-IQ3_S.gguf b/Midnight-Bloom-12B.i1-IQ3_S.gguf new file mode 100644 index 0000000..9a51cfb --- /dev/null +++ b/Midnight-Bloom-12B.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d56683a19e100966cbd6d74b8cb80aa0cfefc466138dc1807640437f42e6d74f +size 5458316448 diff --git a/Midnight-Bloom-12B.i1-IQ3_XS.gguf b/Midnight-Bloom-12B.i1-IQ3_XS.gguf new file mode 100644 index 0000000..377a35d --- /dev/null +++ b/Midnight-Bloom-12B.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d00ba8bf848c885a2abf3ac1fcab7a3024746c5568e219d6166bb2625e3eef24 +size 5206166688 diff --git a/Midnight-Bloom-12B.i1-IQ3_XXS.gguf b/Midnight-Bloom-12B.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..e25a941 --- /dev/null +++ b/Midnight-Bloom-12B.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bde6c385a74c7671a6aa422cda7f54d145f8dc0da6f35cb31c7b832c1fd57f64 +size 4784901408 diff --git a/Midnight-Bloom-12B.i1-IQ4_NL.gguf b/Midnight-Bloom-12B.i1-IQ4_NL.gguf new file mode 100644 index 0000000..e1c51cc --- /dev/null +++ b/Midnight-Bloom-12B.i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:211247636b92fad48849fd50a476c65bf5b0d2d1ab079147cccc27d2d3c5ca7e +size 6887165088 diff --git a/Midnight-Bloom-12B.i1-IQ4_XS.gguf b/Midnight-Bloom-12B.i1-IQ4_XS.gguf new file mode 100644 index 0000000..cbce7a8 --- /dev/null +++ b/Midnight-Bloom-12B.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6311305b58d9477c1ddaec69143606cdb8f3c756fc4799d926683c916a9a9d64 +size 6550965408 diff --git a/Midnight-Bloom-12B.i1-Q2_K.gguf b/Midnight-Bloom-12B.i1-Q2_K.gguf new file mode 100644 index 0000000..092e197 --- /dev/null +++ b/Midnight-Bloom-12B.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97daa93d8d0ac4f960b5d9c504d49e24ae47fbbdeaba4e8fbc567417ab85c765 +size 4768222368 
diff --git a/Midnight-Bloom-12B.i1-Q2_K_S.gguf b/Midnight-Bloom-12B.i1-Q2_K_S.gguf new file mode 100644 index 0000000..0bbaf22 --- /dev/null +++ b/Midnight-Bloom-12B.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96854c93af428c0ee2d3cf23cde151f9668345b9ca6edd68f661bb05a8f365c4 +size 4448611488 diff --git a/Midnight-Bloom-12B.i1-Q3_K_L.gguf b/Midnight-Bloom-12B.i1-Q3_K_L.gguf new file mode 100644 index 0000000..535826d --- /dev/null +++ b/Midnight-Bloom-12B.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae1ef4b1440ecf56f9539e9211434c3a1ba67680dbc946f9d869b9df97255331 +size 6480186528 diff --git a/Midnight-Bloom-12B.i1-Q3_K_M.gguf b/Midnight-Bloom-12B.i1-Q3_K_M.gguf new file mode 100644 index 0000000..8c33936 --- /dev/null +++ b/Midnight-Bloom-12B.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb34dc28f6104e7e00efae3bd922ff1d575063f4c89f09ddda4eea4bf4714bf0 +size 6008818848 diff --git a/Midnight-Bloom-12B.i1-Q3_K_S.gguf b/Midnight-Bloom-12B.i1-Q3_K_S.gguf new file mode 100644 index 0000000..c719c52 --- /dev/null +++ b/Midnight-Bloom-12B.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fad23b795f69aae571bea77df8145e31fcf75168176c5b43f684f783d9bc5ae6 +size 5458316448 diff --git a/Midnight-Bloom-12B.i1-Q4_0.gguf b/Midnight-Bloom-12B.i1-Q4_0.gguf new file mode 100644 index 0000000..81418f9 --- /dev/null +++ b/Midnight-Bloom-12B.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc9c19018e63044dcac2f0de8aab63936543e6edb92b12a5181ded954597d825 +size 6909283488 diff --git a/Midnight-Bloom-12B.i1-Q4_1.gguf b/Midnight-Bloom-12B.i1-Q4_1.gguf new file mode 100644 index 0000000..d671f50 --- /dev/null +++ b/Midnight-Bloom-12B.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:028acb82436e9cb9846a6bf219549f8a7e590c675d922873d208600f291cda55 +size 7559564448 
diff --git a/Midnight-Bloom-12B.i1-Q4_K_M.gguf b/Midnight-Bloom-12B.i1-Q4_K_M.gguf new file mode 100644 index 0000000..30d4e43 --- /dev/null +++ b/Midnight-Bloom-12B.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d94bbdcd9dd292b998d214d1c7cf43de4dcfcd0a9c723e0f9b5a6d0b43d1c65 +size 7300779168 diff --git a/Midnight-Bloom-12B.i1-Q4_K_S.gguf b/Midnight-Bloom-12B.i1-Q4_K_S.gguf new file mode 100644 index 0000000..69eece7 --- /dev/null +++ b/Midnight-Bloom-12B.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:030967eab2372c548f79d509429bc494e24bf968623755898acb4a1106ac66b8 +size 6935334048 diff --git a/Midnight-Bloom-12B.i1-Q5_K_M.gguf b/Midnight-Bloom-12B.i1-Q5_K_M.gguf new file mode 100644 index 0000000..1e16633 --- /dev/null +++ b/Midnight-Bloom-12B.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1787b1841a6be41ffdf87d3879c08e2d5a39334499f6553ac12f1d152850a6f +size 8445037728 diff --git a/Midnight-Bloom-12B.i1-Q5_K_S.gguf b/Midnight-Bloom-12B.i1-Q5_K_S.gguf new file mode 100644 index 0000000..687acb7 --- /dev/null +++ b/Midnight-Bloom-12B.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c9415e51f5e6ac8d9aeb7007f2d954fe08af00df09a6e29b2e7ace62e19eea8 +size 8231963808 diff --git a/Midnight-Bloom-12B.i1-Q6_K.gguf b/Midnight-Bloom-12B.i1-Q6_K.gguf new file mode 100644 index 0000000..ad7e465 --- /dev/null +++ b/Midnight-Bloom-12B.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab4bba068c5d00ee97c6c5afdc5b05e65c36a99395c601e62c613cb25bd23c20 +size 9660812448 diff --git a/README.md b/README.md new file mode 100644 index 0000000..806a266 --- /dev/null +++ b/README.md @@ -0,0 +1,83 @@ +--- +base_model: soob3123/Veiled-Rose-12B +language: +- en +library_name: transformers +license: apache-2.0 +quantized_by: mradermacher +tags: +- text-generation-inference +- transformers +- gemma3 +- 
analytical-tasks +- bias-neutralization +- uncensored +--- +## About + + + + + + +Weighted/imatrix quants of https://huggingface.co/soob3123/Veiled-Rose-12B + + +Static quants are available at https://huggingface.co/mradermacher/Midnight-Bloom-12B-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily by quality; IQ-quants are often preferable to similarly sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/Midnight-Bloom-12B-i1-GGUF/resolve/main/Midnight-Bloom-12B.i1-IQ1_S.gguf) | i1-IQ1_S | 3.0 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/Midnight-Bloom-12B-i1-GGUF/resolve/main/Midnight-Bloom-12B.i1-IQ1_M.gguf) | i1-IQ1_M | 3.3 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/Midnight-Bloom-12B-i1-GGUF/resolve/main/Midnight-Bloom-12B.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 3.6 | | +| [GGUF](https://huggingface.co/mradermacher/Midnight-Bloom-12B-i1-GGUF/resolve/main/Midnight-Bloom-12B.i1-IQ2_XS.gguf) | i1-IQ2_XS | 3.9 | | +| [GGUF](https://huggingface.co/mradermacher/Midnight-Bloom-12B-i1-GGUF/resolve/main/Midnight-Bloom-12B.i1-IQ2_S.gguf) | i1-IQ2_S | 4.1 | | +| [GGUF](https://huggingface.co/mradermacher/Midnight-Bloom-12B-i1-GGUF/resolve/main/Midnight-Bloom-12B.i1-IQ2_M.gguf) | i1-IQ2_M | 4.4 | | +| [GGUF](https://huggingface.co/mradermacher/Midnight-Bloom-12B-i1-GGUF/resolve/main/Midnight-Bloom-12B.i1-Q2_K_S.gguf) | i1-Q2_K_S | 4.5 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/Midnight-Bloom-12B-i1-GGUF/resolve/main/Midnight-Bloom-12B.i1-Q2_K.gguf) | i1-Q2_K | 4.9 | IQ3_XXS probably better | +| 
[GGUF](https://huggingface.co/mradermacher/Midnight-Bloom-12B-i1-GGUF/resolve/main/Midnight-Bloom-12B.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 4.9 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/Midnight-Bloom-12B-i1-GGUF/resolve/main/Midnight-Bloom-12B.i1-IQ3_XS.gguf) | i1-IQ3_XS | 5.3 | | +| [GGUF](https://huggingface.co/mradermacher/Midnight-Bloom-12B-i1-GGUF/resolve/main/Midnight-Bloom-12B.i1-IQ3_S.gguf) | i1-IQ3_S | 5.6 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/Midnight-Bloom-12B-i1-GGUF/resolve/main/Midnight-Bloom-12B.i1-Q3_K_S.gguf) | i1-Q3_K_S | 5.6 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/Midnight-Bloom-12B-i1-GGUF/resolve/main/Midnight-Bloom-12B.i1-IQ3_M.gguf) | i1-IQ3_M | 5.8 | | +| [GGUF](https://huggingface.co/mradermacher/Midnight-Bloom-12B-i1-GGUF/resolve/main/Midnight-Bloom-12B.i1-Q3_K_M.gguf) | i1-Q3_K_M | 6.1 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/Midnight-Bloom-12B-i1-GGUF/resolve/main/Midnight-Bloom-12B.i1-Q3_K_L.gguf) | i1-Q3_K_L | 6.6 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/Midnight-Bloom-12B-i1-GGUF/resolve/main/Midnight-Bloom-12B.i1-IQ4_XS.gguf) | i1-IQ4_XS | 6.7 | | +| [GGUF](https://huggingface.co/mradermacher/Midnight-Bloom-12B-i1-GGUF/resolve/main/Midnight-Bloom-12B.i1-IQ4_NL.gguf) | i1-IQ4_NL | 7.0 | prefer IQ4_XS | +| [GGUF](https://huggingface.co/mradermacher/Midnight-Bloom-12B-i1-GGUF/resolve/main/Midnight-Bloom-12B.i1-Q4_0.gguf) | i1-Q4_0 | 7.0 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/Midnight-Bloom-12B-i1-GGUF/resolve/main/Midnight-Bloom-12B.i1-Q4_K_S.gguf) | i1-Q4_K_S | 7.0 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/Midnight-Bloom-12B-i1-GGUF/resolve/main/Midnight-Bloom-12B.i1-Q4_K_M.gguf) | i1-Q4_K_M | 7.4 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/Midnight-Bloom-12B-i1-GGUF/resolve/main/Midnight-Bloom-12B.i1-Q4_1.gguf) | 
i1-Q4_1 | 7.7 | | +| [GGUF](https://huggingface.co/mradermacher/Midnight-Bloom-12B-i1-GGUF/resolve/main/Midnight-Bloom-12B.i1-Q5_K_S.gguf) | i1-Q5_K_S | 8.3 | | +| [GGUF](https://huggingface.co/mradermacher/Midnight-Bloom-12B-i1-GGUF/resolve/main/Midnight-Bloom-12B.i1-Q5_K_M.gguf) | i1-Q5_K_M | 8.5 | | +| [GGUF](https://huggingface.co/mradermacher/Midnight-Bloom-12B-i1-GGUF/resolve/main/Midnight-Bloom-12B.i1-Q6_K.gguf) | i1-Q6_K | 9.8 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for answers to +questions you might have, or to request that another model be quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and for providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..5fb5b0d --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3050f8c1d29e41f7021ab97f40ef5cb7da7888132a593bf6095faa70f8e43c81 +size 7433101