commit fe9474fbb6ed5fe58f2687988b8d9d31d192c1ae Author: ModelHub XC Date: Fri Apr 10 20:23:54 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/Lacaille-MoT-4B-Supreme2-i1-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..4cd5dd1 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +Lacaille-MoT-4B-Supreme2.i1-IQ1_M.gguf 
filter=lfs diff=lfs merge=lfs -text +Lacaille-MoT-4B-Supreme2.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +Lacaille-MoT-4B-Supreme2.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +Lacaille-MoT-4B-Supreme2.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +Lacaille-MoT-4B-Supreme2.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +Lacaille-MoT-4B-Supreme2.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Lacaille-MoT-4B-Supreme2.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +Lacaille-MoT-4B-Supreme2.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text +Lacaille-MoT-4B-Supreme2.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +Lacaille-MoT-4B-Supreme2.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Lacaille-MoT-4B-Supreme2.i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +Lacaille-MoT-4B-Supreme2.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +Lacaille-MoT-4B-Supreme2.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +Lacaille-MoT-4B-Supreme2.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Lacaille-MoT-4B-Supreme2.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Lacaille-MoT-4B-Supreme2.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Lacaille-MoT-4B-Supreme2.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Lacaille-MoT-4B-Supreme2.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +Lacaille-MoT-4B-Supreme2.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +Lacaille-MoT-4B-Supreme2.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Lacaille-MoT-4B-Supreme2.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Lacaille-MoT-4B-Supreme2.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Lacaille-MoT-4B-Supreme2.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Lacaille-MoT-4B-Supreme2.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/Lacaille-MoT-4B-Supreme2.i1-IQ1_M.gguf b/Lacaille-MoT-4B-Supreme2.i1-IQ1_M.gguf new file mode 100644 index 0000000..d547aea --- /dev/null +++ b/Lacaille-MoT-4B-Supreme2.i1-IQ1_M.gguf @@ -0,0 
+1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eded6fb37fd40190ee919cff9bcb981d552b2e2bb829c169d1f81ee82b443eca +size 1127019424 diff --git a/Lacaille-MoT-4B-Supreme2.i1-IQ1_S.gguf b/Lacaille-MoT-4B-Supreme2.i1-IQ1_S.gguf new file mode 100644 index 0000000..c87a021 --- /dev/null +++ b/Lacaille-MoT-4B-Supreme2.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8f6884955ff242c4a02012213c2a7418116d23a7375a7e510fa46f180eed7fb +size 1055257504 diff --git a/Lacaille-MoT-4B-Supreme2.i1-IQ2_M.gguf b/Lacaille-MoT-4B-Supreme2.i1-IQ2_M.gguf new file mode 100644 index 0000000..ae69f90 --- /dev/null +++ b/Lacaille-MoT-4B-Supreme2.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22970646f171fd93ef7df9f62035f713fbd79893425bb29bb09a269983d65cce +size 1512985504 diff --git a/Lacaille-MoT-4B-Supreme2.i1-IQ2_S.gguf b/Lacaille-MoT-4B-Supreme2.i1-IQ2_S.gguf new file mode 100644 index 0000000..4d2764f --- /dev/null +++ b/Lacaille-MoT-4B-Supreme2.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecf2ef220b93f49ad520a6b0710c102f909084da48c03a10f52a72a911f29778 +size 1417302944 diff --git a/Lacaille-MoT-4B-Supreme2.i1-IQ2_XS.gguf b/Lacaille-MoT-4B-Supreme2.i1-IQ2_XS.gguf new file mode 100644 index 0000000..21486fa --- /dev/null +++ b/Lacaille-MoT-4B-Supreme2.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63181d4d0616c72a8bd6e1abeee6ca4159ccf1236b6190566514c93f0870e80a +size 1354101664 diff --git a/Lacaille-MoT-4B-Supreme2.i1-IQ2_XXS.gguf b/Lacaille-MoT-4B-Supreme2.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..4d53766 --- /dev/null +++ b/Lacaille-MoT-4B-Supreme2.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b67f7dff52785a1e6a7d7f102dd3e67058b51bc6e3d267837f1eb07f996101e4 +size 1246622624 diff --git a/Lacaille-MoT-4B-Supreme2.i1-IQ3_M.gguf b/Lacaille-MoT-4B-Supreme2.i1-IQ3_M.gguf 
new file mode 100644 index 0000000..b907c10 --- /dev/null +++ b/Lacaille-MoT-4B-Supreme2.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6483820668a1f905f2127df8913f4e01a46a2714d0524f7beab08cdf98c14f8e +size 1962897824 diff --git a/Lacaille-MoT-4B-Supreme2.i1-IQ3_S.gguf b/Lacaille-MoT-4B-Supreme2.i1-IQ3_S.gguf new file mode 100644 index 0000000..558d1de --- /dev/null +++ b/Lacaille-MoT-4B-Supreme2.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ee88aee9a627104581484d0780ed4278778d4a7aef287c6687fd4b2e9564252 +size 1899532704 diff --git a/Lacaille-MoT-4B-Supreme2.i1-IQ3_XS.gguf b/Lacaille-MoT-4B-Supreme2.i1-IQ3_XS.gguf new file mode 100644 index 0000000..75aa36e --- /dev/null +++ b/Lacaille-MoT-4B-Supreme2.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5df8b3d49c4d0a3fd935e2d43fb1c3bb09c8ea2f808c662fdeb5f6ebf056e37c +size 1814376864 diff --git a/Lacaille-MoT-4B-Supreme2.i1-IQ3_XXS.gguf b/Lacaille-MoT-4B-Supreme2.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..b93b458 --- /dev/null +++ b/Lacaille-MoT-4B-Supreme2.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5f34e7acb21ae53b092d2e633a0311c9dd41cec618542a3a186e9c98ec94255 +size 1670189984 diff --git a/Lacaille-MoT-4B-Supreme2.i1-IQ4_NL.gguf b/Lacaille-MoT-4B-Supreme2.i1-IQ4_NL.gguf new file mode 100644 index 0000000..daf3096 --- /dev/null +++ b/Lacaille-MoT-4B-Supreme2.i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64e5f18ed8db6b6ca033dd32c3df0da02f48d587568435e53d3f69eb75641f82 +size 2381345184 diff --git a/Lacaille-MoT-4B-Supreme2.i1-IQ4_XS.gguf b/Lacaille-MoT-4B-Supreme2.i1-IQ4_XS.gguf new file mode 100644 index 0000000..e2cd5ff --- /dev/null +++ b/Lacaille-MoT-4B-Supreme2.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:2e22a368aa2e4c3460cb9d7ffc47afc29d43996c6a818a752c02498dc32eee1f +size 2270753184 diff --git a/Lacaille-MoT-4B-Supreme2.i1-Q2_K.gguf b/Lacaille-MoT-4B-Supreme2.i1-Q2_K.gguf new file mode 100644 index 0000000..745cfe7 --- /dev/null +++ b/Lacaille-MoT-4B-Supreme2.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3aa96473d0a5eccf96bf5491e839b759ee0d20310e369376b8e5ea40b77ff92 +size 1669501344 diff --git a/Lacaille-MoT-4B-Supreme2.i1-Q2_K_S.gguf b/Lacaille-MoT-4B-Supreme2.i1-Q2_K_S.gguf new file mode 100644 index 0000000..91b73e9 --- /dev/null +++ b/Lacaille-MoT-4B-Supreme2.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:017f8ed8dbaf3e49b555d2ce1f5e9a7814b621eadfa3c352460c0f1df8dd24e1 +size 1563455904 diff --git a/Lacaille-MoT-4B-Supreme2.i1-Q3_K_L.gguf b/Lacaille-MoT-4B-Supreme2.i1-Q3_K_L.gguf new file mode 100644 index 0000000..f6e3e7b --- /dev/null +++ b/Lacaille-MoT-4B-Supreme2.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a1c208f0778804b2b64e4f0231a3290d7a6676d3dc646361f9d44a3cb0ca427 +size 2239787424 diff --git a/Lacaille-MoT-4B-Supreme2.i1-Q3_K_M.gguf b/Lacaille-MoT-4B-Supreme2.i1-Q3_K_M.gguf new file mode 100644 index 0000000..68a2d6f --- /dev/null +++ b/Lacaille-MoT-4B-Supreme2.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65d35113090ba4cae5a0b77179eb0f0b65ff0558f354af875fadd334705104f2 +size 2075619744 diff --git a/Lacaille-MoT-4B-Supreme2.i1-Q3_K_S.gguf b/Lacaille-MoT-4B-Supreme2.i1-Q3_K_S.gguf new file mode 100644 index 0000000..9261cfe --- /dev/null +++ b/Lacaille-MoT-4B-Supreme2.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d1ca58bbc73fb9ae26d7f2b7cbb822aad4b032e2faf570e67d76f9514a22346 +size 1886998944 diff --git a/Lacaille-MoT-4B-Supreme2.i1-Q4_0.gguf b/Lacaille-MoT-4B-Supreme2.i1-Q4_0.gguf new file mode 100644 index 0000000..64dfe7a --- /dev/null 
+++ b/Lacaille-MoT-4B-Supreme2.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf898739ac43730d9e7118c9f21615fc9ed70be2f336489c530e55fef48e37f2 +size 2375774624 diff --git a/Lacaille-MoT-4B-Supreme2.i1-Q4_1.gguf b/Lacaille-MoT-4B-Supreme2.i1-Q4_1.gguf new file mode 100644 index 0000000..5d7596b --- /dev/null +++ b/Lacaille-MoT-4B-Supreme2.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22eb356e1f91db8c91ac14d67fcda4f7e1dd11d292e1ae3b2979c33201575ce4 +size 2596630944 diff --git a/Lacaille-MoT-4B-Supreme2.i1-Q4_K_M.gguf b/Lacaille-MoT-4B-Supreme2.i1-Q4_K_M.gguf new file mode 100644 index 0000000..ed35f5c --- /dev/null +++ b/Lacaille-MoT-4B-Supreme2.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5723d2be03f6a65ce75b9b5a63bd169542700d0be04073c5494fdfbd54c46bda +size 2497282464 diff --git a/Lacaille-MoT-4B-Supreme2.i1-Q4_K_S.gguf b/Lacaille-MoT-4B-Supreme2.i1-Q4_K_S.gguf new file mode 100644 index 0000000..292c7f0 --- /dev/null +++ b/Lacaille-MoT-4B-Supreme2.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7299d6bc71fc21bda2f93ce26d22cccddb16fbbd97fda66b6c32f43c8310635f +size 2383311264 diff --git a/Lacaille-MoT-4B-Supreme2.i1-Q5_K_M.gguf b/Lacaille-MoT-4B-Supreme2.i1-Q5_K_M.gguf new file mode 100644 index 0000000..94e564b --- /dev/null +++ b/Lacaille-MoT-4B-Supreme2.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d14506832422073707c15d05f7225bc4b3b36185fddf34beae2741bbba6d1483 +size 2889515424 diff --git a/Lacaille-MoT-4B-Supreme2.i1-Q5_K_S.gguf b/Lacaille-MoT-4B-Supreme2.i1-Q5_K_S.gguf new file mode 100644 index 0000000..9a2459d --- /dev/null +++ b/Lacaille-MoT-4B-Supreme2.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57a39b627532b696515ea31eb4b3b1cff4d54b52a65683a5247047984ce4c310 +size 2823713184 diff --git 
a/Lacaille-MoT-4B-Supreme2.i1-Q6_K.gguf b/Lacaille-MoT-4B-Supreme2.i1-Q6_K.gguf new file mode 100644 index 0000000..87beabd --- /dev/null +++ b/Lacaille-MoT-4B-Supreme2.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a975c431fa2f9982e8b01df94150b5ff4f0d7cb4a9a3f832b655ae122cf25acc +size 3306262944 diff --git a/README.md b/README.md new file mode 100644 index 0000000..afa5fac --- /dev/null +++ b/README.md @@ -0,0 +1,93 @@ +--- +base_model: prithivMLmods/Lacaille-MoT-4B-Supreme2 +datasets: +- open-r1/Mixture-of-Thoughts +- nvidia/OpenCodeReasoning +language: +- en +library_name: transformers +license: apache-2.0 +mradermacher: + readme_rev: 1 +quantized_by: mradermacher +tags: +- trl +- mot +- code +- science +- math +- mixture-of-thoughts +- text-generation-inference +- reasoning +--- +## About + + + + + + +Weighted/imatrix quants of https://huggingface.co/prithivMLmods/Lacaille-MoT-4B-Supreme2 + + + +***For a convenient overview and download list, visit our [model page for this model](https://hf.tst.eu/model#Lacaille-MoT-4B-Supreme2-i1-GGUF).*** + +Static quants are available at https://huggingface.co/mradermacher/Lacaille-MoT-4B-Supreme2-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. 
IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/Lacaille-MoT-4B-Supreme2-i1-GGUF/resolve/main/Lacaille-MoT-4B-Supreme2.i1-IQ1_S.gguf) | i1-IQ1_S | 1.2 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/Lacaille-MoT-4B-Supreme2-i1-GGUF/resolve/main/Lacaille-MoT-4B-Supreme2.i1-IQ1_M.gguf) | i1-IQ1_M | 1.2 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/Lacaille-MoT-4B-Supreme2-i1-GGUF/resolve/main/Lacaille-MoT-4B-Supreme2.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 1.3 | | +| [GGUF](https://huggingface.co/mradermacher/Lacaille-MoT-4B-Supreme2-i1-GGUF/resolve/main/Lacaille-MoT-4B-Supreme2.i1-IQ2_XS.gguf) | i1-IQ2_XS | 1.5 | | +| [GGUF](https://huggingface.co/mradermacher/Lacaille-MoT-4B-Supreme2-i1-GGUF/resolve/main/Lacaille-MoT-4B-Supreme2.i1-IQ2_S.gguf) | i1-IQ2_S | 1.5 | | +| [GGUF](https://huggingface.co/mradermacher/Lacaille-MoT-4B-Supreme2-i1-GGUF/resolve/main/Lacaille-MoT-4B-Supreme2.i1-IQ2_M.gguf) | i1-IQ2_M | 1.6 | | +| [GGUF](https://huggingface.co/mradermacher/Lacaille-MoT-4B-Supreme2-i1-GGUF/resolve/main/Lacaille-MoT-4B-Supreme2.i1-Q2_K_S.gguf) | i1-Q2_K_S | 1.7 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/Lacaille-MoT-4B-Supreme2-i1-GGUF/resolve/main/Lacaille-MoT-4B-Supreme2.i1-Q2_K.gguf) | i1-Q2_K | 1.8 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/Lacaille-MoT-4B-Supreme2-i1-GGUF/resolve/main/Lacaille-MoT-4B-Supreme2.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 1.8 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/Lacaille-MoT-4B-Supreme2-i1-GGUF/resolve/main/Lacaille-MoT-4B-Supreme2.i1-IQ3_XS.gguf) | i1-IQ3_XS | 1.9 | | +| [GGUF](https://huggingface.co/mradermacher/Lacaille-MoT-4B-Supreme2-i1-GGUF/resolve/main/Lacaille-MoT-4B-Supreme2.i1-Q3_K_S.gguf) | i1-Q3_K_S | 2.0 | IQ3_XS probably better | +| 
[GGUF](https://huggingface.co/mradermacher/Lacaille-MoT-4B-Supreme2-i1-GGUF/resolve/main/Lacaille-MoT-4B-Supreme2.i1-IQ3_S.gguf) | i1-IQ3_S | 2.0 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/Lacaille-MoT-4B-Supreme2-i1-GGUF/resolve/main/Lacaille-MoT-4B-Supreme2.i1-IQ3_M.gguf) | i1-IQ3_M | 2.1 | | +| [GGUF](https://huggingface.co/mradermacher/Lacaille-MoT-4B-Supreme2-i1-GGUF/resolve/main/Lacaille-MoT-4B-Supreme2.i1-Q3_K_M.gguf) | i1-Q3_K_M | 2.2 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/Lacaille-MoT-4B-Supreme2-i1-GGUF/resolve/main/Lacaille-MoT-4B-Supreme2.i1-Q3_K_L.gguf) | i1-Q3_K_L | 2.3 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/Lacaille-MoT-4B-Supreme2-i1-GGUF/resolve/main/Lacaille-MoT-4B-Supreme2.i1-IQ4_XS.gguf) | i1-IQ4_XS | 2.4 | | +| [GGUF](https://huggingface.co/mradermacher/Lacaille-MoT-4B-Supreme2-i1-GGUF/resolve/main/Lacaille-MoT-4B-Supreme2.i1-Q4_0.gguf) | i1-Q4_0 | 2.5 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/Lacaille-MoT-4B-Supreme2-i1-GGUF/resolve/main/Lacaille-MoT-4B-Supreme2.i1-IQ4_NL.gguf) | i1-IQ4_NL | 2.5 | prefer IQ4_XS | +| [GGUF](https://huggingface.co/mradermacher/Lacaille-MoT-4B-Supreme2-i1-GGUF/resolve/main/Lacaille-MoT-4B-Supreme2.i1-Q4_K_S.gguf) | i1-Q4_K_S | 2.5 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/Lacaille-MoT-4B-Supreme2-i1-GGUF/resolve/main/Lacaille-MoT-4B-Supreme2.i1-Q4_K_M.gguf) | i1-Q4_K_M | 2.6 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/Lacaille-MoT-4B-Supreme2-i1-GGUF/resolve/main/Lacaille-MoT-4B-Supreme2.i1-Q4_1.gguf) | i1-Q4_1 | 2.7 | | +| [GGUF](https://huggingface.co/mradermacher/Lacaille-MoT-4B-Supreme2-i1-GGUF/resolve/main/Lacaille-MoT-4B-Supreme2.i1-Q5_K_S.gguf) | i1-Q5_K_S | 2.9 | | +| [GGUF](https://huggingface.co/mradermacher/Lacaille-MoT-4B-Supreme2-i1-GGUF/resolve/main/Lacaille-MoT-4B-Supreme2.i1-Q5_K_M.gguf) | i1-Q5_K_M | 3.0 | | +| 
[GGUF](https://huggingface.co/mradermacher/Lacaille-MoT-4B-Supreme2-i1-GGUF/resolve/main/Lacaille-MoT-4B-Supreme2.i1-Q6_K.gguf) | i1-Q6_K | 3.4 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for answers to +questions you might have, or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..b421084 --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e42b6b6def41ef3802eb1cf465dd6a04b3aad026ded16e90092ec16df312c9c7 +size 3842209