From 1a1ede98c57df615474ec6498a93ca73d8b163b9 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Tue, 21 Apr 2026 23:20:09 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mradermacher/Mamba-3B-slimpj-i1-GGUF Source: Original Platform --- .gitattributes | 58 +++++++++++++++++++++++++ Mamba-3B-slimpj.i1-IQ1_M.gguf | 3 ++ Mamba-3B-slimpj.i1-IQ1_S.gguf | 3 ++ Mamba-3B-slimpj.i1-IQ2_M.gguf | 3 ++ Mamba-3B-slimpj.i1-IQ2_S.gguf | 3 ++ Mamba-3B-slimpj.i1-IQ2_XS.gguf | 3 ++ Mamba-3B-slimpj.i1-IQ2_XXS.gguf | 3 ++ Mamba-3B-slimpj.i1-IQ3_M.gguf | 3 ++ Mamba-3B-slimpj.i1-IQ3_S.gguf | 3 ++ Mamba-3B-slimpj.i1-IQ3_XS.gguf | 3 ++ Mamba-3B-slimpj.i1-IQ3_XXS.gguf | 3 ++ Mamba-3B-slimpj.i1-IQ4_XS.gguf | 3 ++ Mamba-3B-slimpj.i1-Q2_K.gguf | 3 ++ Mamba-3B-slimpj.i1-Q2_K_S.gguf | 3 ++ Mamba-3B-slimpj.i1-Q3_K_L.gguf | 3 ++ Mamba-3B-slimpj.i1-Q3_K_M.gguf | 3 ++ Mamba-3B-slimpj.i1-Q3_K_S.gguf | 3 ++ Mamba-3B-slimpj.i1-Q4_0.gguf | 3 ++ Mamba-3B-slimpj.i1-Q4_K_M.gguf | 3 ++ Mamba-3B-slimpj.i1-Q4_K_S.gguf | 3 ++ Mamba-3B-slimpj.i1-Q5_K_M.gguf | 3 ++ Mamba-3B-slimpj.i1-Q5_K_S.gguf | 3 ++ Mamba-3B-slimpj.i1-Q6_K.gguf | 3 ++ README.md | 76 +++++++++++++++++++++++++++++++++ imatrix.dat | 3 ++ 25 files changed, 203 insertions(+) create mode 100644 .gitattributes create mode 100644 Mamba-3B-slimpj.i1-IQ1_M.gguf create mode 100644 Mamba-3B-slimpj.i1-IQ1_S.gguf create mode 100644 Mamba-3B-slimpj.i1-IQ2_M.gguf create mode 100644 Mamba-3B-slimpj.i1-IQ2_S.gguf create mode 100644 Mamba-3B-slimpj.i1-IQ2_XS.gguf create mode 100644 Mamba-3B-slimpj.i1-IQ2_XXS.gguf create mode 100644 Mamba-3B-slimpj.i1-IQ3_M.gguf create mode 100644 Mamba-3B-slimpj.i1-IQ3_S.gguf create mode 100644 Mamba-3B-slimpj.i1-IQ3_XS.gguf create mode 100644 Mamba-3B-slimpj.i1-IQ3_XXS.gguf create mode 100644 Mamba-3B-slimpj.i1-IQ4_XS.gguf create mode 100644 Mamba-3B-slimpj.i1-Q2_K.gguf create mode 100644 Mamba-3B-slimpj.i1-Q2_K_S.gguf create mode 100644 Mamba-3B-slimpj.i1-Q3_K_L.gguf create mode 100644 Mamba-3B-slimpj.i1-Q3_K_M.gguf create mode 100644 Mamba-3B-slimpj.i1-Q3_K_S.gguf create mode 100644 Mamba-3B-slimpj.i1-Q4_0.gguf create mode 100644 Mamba-3B-slimpj.i1-Q4_K_M.gguf create mode 100644 Mamba-3B-slimpj.i1-Q4_K_S.gguf create mode 100644 Mamba-3B-slimpj.i1-Q5_K_M.gguf create mode 100644 Mamba-3B-slimpj.i1-Q5_K_S.gguf create mode 100644 Mamba-3B-slimpj.i1-Q6_K.gguf create mode 100644 README.md create mode 100644 imatrix.dat diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..43cd963 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,58 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +Mamba-3B-slimpj.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +Mamba-3B-slimpj.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +Mamba-3B-slimpj.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +Mamba-3B-slimpj.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +Mamba-3B-slimpj.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +Mamba-3B-slimpj.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Mamba-3B-slimpj.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +Mamba-3B-slimpj.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text +Mamba-3B-slimpj.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +Mamba-3B-slimpj.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Mamba-3B-slimpj.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +Mamba-3B-slimpj.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +Mamba-3B-slimpj.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Mamba-3B-slimpj.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Mamba-3B-slimpj.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Mamba-3B-slimpj.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Mamba-3B-slimpj.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +Mamba-3B-slimpj.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Mamba-3B-slimpj.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Mamba-3B-slimpj.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Mamba-3B-slimpj.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Mamba-3B-slimpj.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/Mamba-3B-slimpj.i1-IQ1_M.gguf b/Mamba-3B-slimpj.i1-IQ1_M.gguf new file mode 100644 index 0000000..980fbaf --- /dev/null +++ b/Mamba-3B-slimpj.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c72913923fc7ca44d694cbd971d6e8e848d8e5ae6ad4c8d52a0ace92ca6b73c +size 714866208 diff --git a/Mamba-3B-slimpj.i1-IQ1_S.gguf b/Mamba-3B-slimpj.i1-IQ1_S.gguf new file mode 100644 index 0000000..37d8b3d --- /dev/null +++ b/Mamba-3B-slimpj.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bc55aeade6c3d4a7111fb28f24c4f0b037966863a344b5523449390d91bc34e +size 654409248 diff --git a/Mamba-3B-slimpj.i1-IQ2_M.gguf b/Mamba-3B-slimpj.i1-IQ2_M.gguf new file mode 100644 index 0000000..3b3fb40 --- /dev/null +++ b/Mamba-3B-slimpj.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bbca8e4ffd5c49854ec3fb231a519b3cdc2513a2da8bd9a73862d6823356422 +size 976846368 diff --git a/Mamba-3B-slimpj.i1-IQ2_S.gguf b/Mamba-3B-slimpj.i1-IQ2_S.gguf new file mode 100644 index 0000000..2a2bd7c --- /dev/null +++ b/Mamba-3B-slimpj.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcfa24708fac9d2d17da29aa722af98aba1088abc8a14b9049d2963507e3f360 +size 896237088 diff --git a/Mamba-3B-slimpj.i1-IQ2_XS.gguf b/Mamba-3B-slimpj.i1-IQ2_XS.gguf new file mode 100644 index 0000000..7b55340 --- /dev/null +++ b/Mamba-3B-slimpj.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e45bcd36212dff7d393f3659c7029ea393885b7707fb5513e230e581a1147f4 +size 896237088 diff --git a/Mamba-3B-slimpj.i1-IQ2_XXS.gguf b/Mamba-3B-slimpj.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..66a9d64 --- /dev/null +++ b/Mamba-3B-slimpj.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:917564cf538fb4ae0790b629db420cd549215596b438aca285d49da22fc92d3a +size 815627808 diff --git a/Mamba-3B-slimpj.i1-IQ3_M.gguf b/Mamba-3B-slimpj.i1-IQ3_M.gguf new file mode 100644 index 0000000..5468d2b --- /dev/null +++ b/Mamba-3B-slimpj.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dded6e5b9f7137742f33dac84b80ca4d4056379e0a8f3d12aeace3f7af086ae9 +size 1276074048 diff --git a/Mamba-3B-slimpj.i1-IQ3_S.gguf b/Mamba-3B-slimpj.i1-IQ3_S.gguf new file mode 100644 index 0000000..cc9dca1 --- /dev/null +++ b/Mamba-3B-slimpj.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8603ccd2ecf95ae858de97191df6daa11e9554ba2746246b558eb935b11538f +size 1276074048 diff --git a/Mamba-3B-slimpj.i1-IQ3_XS.gguf b/Mamba-3B-slimpj.i1-IQ3_XS.gguf new file mode 100644 index 0000000..a96db6e --- /dev/null +++ b/Mamba-3B-slimpj.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc96e579d36e960a482b5ef9bcb54fdb8284ea670b4e1d010d5c48484fd937ce +size 1276074048 diff --git a/Mamba-3B-slimpj.i1-IQ3_XXS.gguf b/Mamba-3B-slimpj.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..22d1167 --- /dev/null +++ b/Mamba-3B-slimpj.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4507253d531622c6510c43d2057f74c0474b69f38df4f401eeaf385c25d7755 +size 1138064928 diff --git a/Mamba-3B-slimpj.i1-IQ4_XS.gguf b/Mamba-3B-slimpj.i1-IQ4_XS.gguf new file mode 100644 index 0000000..a1cfa63 --- /dev/null +++ b/Mamba-3B-slimpj.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1ef4aaffda46016b5444837397378d2bbd9918fa14a89259de9456b7bb393f3 +size 1538054208 diff --git a/Mamba-3B-slimpj.i1-Q2_K.gguf b/Mamba-3B-slimpj.i1-Q2_K.gguf new file mode 100644 index 0000000..0542bec --- /dev/null +++ b/Mamba-3B-slimpj.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a5429df07ac16491da466051040827dd899f4425c0e6591c61ae47245dda82b +size 1014093888 diff --git a/Mamba-3B-slimpj.i1-Q2_K_S.gguf b/Mamba-3B-slimpj.i1-Q2_K_S.gguf new file mode 100644 index 0000000..7247097 --- /dev/null +++ b/Mamba-3B-slimpj.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89cc4f206097de8a020f1404f9554d0add1693b8fcd7a2781cb83e43ce20ae8d +size 1014093888 diff --git a/Mamba-3B-slimpj.i1-Q3_K_L.gguf b/Mamba-3B-slimpj.i1-Q3_K_L.gguf new file mode 100644 index 0000000..905f512 --- /dev/null +++ b/Mamba-3B-slimpj.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e27505b74d109bfa4b094a4cea4c810b1afb18d85d962de5f100ddaaea18be2c +size 1276074048 diff --git a/Mamba-3B-slimpj.i1-Q3_K_M.gguf b/Mamba-3B-slimpj.i1-Q3_K_M.gguf new file mode 100644 index 0000000..9366ab6 --- /dev/null +++ b/Mamba-3B-slimpj.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b985d02b8ff7d6345e3cec6b9d5cb5a340310419651f332a5f54f91085ae752 +size 1276074048 diff --git a/Mamba-3B-slimpj.i1-Q3_K_S.gguf b/Mamba-3B-slimpj.i1-Q3_K_S.gguf new file mode 100644 index 0000000..4128424 --- /dev/null +++ b/Mamba-3B-slimpj.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbea3dfa13cb940cc9d42cc06273eefc132e492d05c052dc1454a4f0ab372345 +size 1276074048 diff --git a/Mamba-3B-slimpj.i1-Q4_0.gguf b/Mamba-3B-slimpj.i1-Q4_0.gguf new file mode 100644 index 0000000..64cfae4 --- /dev/null +++ b/Mamba-3B-slimpj.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cf1536405223602f50837fe1d938b61d19df57bfe5433f9fa6c7e4a12121c00 +size 1618663488 diff --git a/Mamba-3B-slimpj.i1-Q4_K_M.gguf b/Mamba-3B-slimpj.i1-Q4_K_M.gguf new file mode 100644 index 0000000..fcfcf40 --- /dev/null +++ b/Mamba-3B-slimpj.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64f1858da21ba16db6fa7d06a873b2f6f315feb96d23255a512a8325011d9919 +size 1625217088 diff --git a/Mamba-3B-slimpj.i1-Q4_K_S.gguf b/Mamba-3B-slimpj.i1-Q4_K_S.gguf new file mode 100644 index 0000000..cc5930b --- /dev/null +++ b/Mamba-3B-slimpj.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fea02ec5dff57f381df61089820128c7f0fca1a006944654345747dd6316f627 +size 1625217088 diff --git a/Mamba-3B-slimpj.i1-Q5_K_M.gguf b/Mamba-3B-slimpj.i1-Q5_K_M.gguf new file mode 100644 index 0000000..eb51072 --- /dev/null +++ b/Mamba-3B-slimpj.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68687e7c0fdd6b61fd8fa2ea57abd0090ddd482177688eb8337ebd7902edb97e +size 1950931008 diff --git a/Mamba-3B-slimpj.i1-Q5_K_S.gguf b/Mamba-3B-slimpj.i1-Q5_K_S.gguf new file mode 100644 index 0000000..2c54071 --- /dev/null +++ b/Mamba-3B-slimpj.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b81bbe295ef3441005cc4bf7fd9da1b0b73f154586e3ac4bc42ec3ca1470c7c +size 1950931008 diff --git a/Mamba-3B-slimpj.i1-Q6_K.gguf b/Mamba-3B-slimpj.i1-Q6_K.gguf new file mode 100644 index 0000000..b118b1f --- /dev/null +++ b/Mamba-3B-slimpj.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:517b90c80530706880d20262507dc4b763a5905d0e60d5452e2dce825878f770 +size 2309904448 diff --git a/README.md b/README.md new file mode 100644 index 0000000..5060a77 --- /dev/null +++ b/README.md @@ -0,0 +1,76 @@ +--- +base_model: Q-bert/Mamba-3B-slimpj +language: +- en +library_name: transformers +license: apache-2.0 +quantized_by: mradermacher +tags: +- mamba-hf +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/Q-bert/Mamba-3B-slimpj + + +static quants are available at https://huggingface.co/mradermacher/Mamba-3B-slimpj-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/Mamba-3B-slimpj-i1-GGUF/resolve/main/Mamba-3B-slimpj.i1-IQ1_S.gguf) | i1-IQ1_S | 0.8 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/Mamba-3B-slimpj-i1-GGUF/resolve/main/Mamba-3B-slimpj.i1-IQ1_M.gguf) | i1-IQ1_M | 0.8 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/Mamba-3B-slimpj-i1-GGUF/resolve/main/Mamba-3B-slimpj.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 0.9 | | +| [GGUF](https://huggingface.co/mradermacher/Mamba-3B-slimpj-i1-GGUF/resolve/main/Mamba-3B-slimpj.i1-IQ2_S.gguf) | i1-IQ2_S | 1.0 | | +| [GGUF](https://huggingface.co/mradermacher/Mamba-3B-slimpj-i1-GGUF/resolve/main/Mamba-3B-slimpj.i1-IQ2_XS.gguf) | i1-IQ2_XS | 1.0 | | +| [GGUF](https://huggingface.co/mradermacher/Mamba-3B-slimpj-i1-GGUF/resolve/main/Mamba-3B-slimpj.i1-IQ2_M.gguf) | i1-IQ2_M | 1.1 | | +| [GGUF](https://huggingface.co/mradermacher/Mamba-3B-slimpj-i1-GGUF/resolve/main/Mamba-3B-slimpj.i1-Q2_K.gguf) | i1-Q2_K | 1.1 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/Mamba-3B-slimpj-i1-GGUF/resolve/main/Mamba-3B-slimpj.i1-Q2_K_S.gguf) | i1-Q2_K_S | 1.1 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/Mamba-3B-slimpj-i1-GGUF/resolve/main/Mamba-3B-slimpj.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 1.2 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/Mamba-3B-slimpj-i1-GGUF/resolve/main/Mamba-3B-slimpj.i1-IQ3_M.gguf) | i1-IQ3_M | 1.4 | | +| [GGUF](https://huggingface.co/mradermacher/Mamba-3B-slimpj-i1-GGUF/resolve/main/Mamba-3B-slimpj.i1-IQ3_S.gguf) | i1-IQ3_S | 1.4 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/Mamba-3B-slimpj-i1-GGUF/resolve/main/Mamba-3B-slimpj.i1-IQ3_XS.gguf) | i1-IQ3_XS | 1.4 | | +| [GGUF](https://huggingface.co/mradermacher/Mamba-3B-slimpj-i1-GGUF/resolve/main/Mamba-3B-slimpj.i1-Q3_K_L.gguf) | i1-Q3_K_L | 1.4 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/Mamba-3B-slimpj-i1-GGUF/resolve/main/Mamba-3B-slimpj.i1-Q3_K_M.gguf) | i1-Q3_K_M | 1.4 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/Mamba-3B-slimpj-i1-GGUF/resolve/main/Mamba-3B-slimpj.i1-Q3_K_S.gguf) | i1-Q3_K_S | 1.4 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/Mamba-3B-slimpj-i1-GGUF/resolve/main/Mamba-3B-slimpj.i1-IQ4_XS.gguf) | i1-IQ4_XS | 1.6 | | +| [GGUF](https://huggingface.co/mradermacher/Mamba-3B-slimpj-i1-GGUF/resolve/main/Mamba-3B-slimpj.i1-Q4_0.gguf) | i1-Q4_0 | 1.7 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/Mamba-3B-slimpj-i1-GGUF/resolve/main/Mamba-3B-slimpj.i1-Q4_K_M.gguf) | i1-Q4_K_M | 1.7 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/Mamba-3B-slimpj-i1-GGUF/resolve/main/Mamba-3B-slimpj.i1-Q4_K_S.gguf) | i1-Q4_K_S | 1.7 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/Mamba-3B-slimpj-i1-GGUF/resolve/main/Mamba-3B-slimpj.i1-Q5_K_M.gguf) | i1-Q5_K_M | 2.1 | | +| [GGUF](https://huggingface.co/mradermacher/Mamba-3B-slimpj-i1-GGUF/resolve/main/Mamba-3B-slimpj.i1-Q5_K_S.gguf) | i1-Q5_K_S | 2.1 | | +| [GGUF](https://huggingface.co/mradermacher/Mamba-3B-slimpj-i1-GGUF/resolve/main/Mamba-3B-slimpj.i1-Q6_K.gguf) | i1-Q6_K | 2.4 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..6e69c75 --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12e35278ab77168a99768d4e365032ac1cfeea629709234efdec888a8397a2fd +size 3325947