commit 948b6fffdda189a9f5bf8aa70d3ca5709067581b Author: ModelHub XC Date: Sat May 9 14:52:36 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/Gemmasutra-Pro-27B-v1.1-i1-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..f625564 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,58 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +Gemmasutra-Pro-27B-v1.1.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text 
+Gemmasutra-Pro-27B-v1.1.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +Gemmasutra-Pro-27B-v1.1.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Gemmasutra-Pro-27B-v1.1.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Gemmasutra-Pro-27B-v1.1.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Gemmasutra-Pro-27B-v1.1.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Gemmasutra-Pro-27B-v1.1.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +Gemmasutra-Pro-27B-v1.1.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +Gemmasutra-Pro-27B-v1.1.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +Gemmasutra-Pro-27B-v1.1.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Gemmasutra-Pro-27B-v1.1.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +Gemmasutra-Pro-27B-v1.1.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Gemmasutra-Pro-27B-v1.1.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Gemmasutra-Pro-27B-v1.1.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Gemmasutra-Pro-27B-v1.1.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +Gemmasutra-Pro-27B-v1.1.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Gemmasutra-Pro-27B-v1.1.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +Gemmasutra-Pro-27B-v1.1.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +Gemmasutra-Pro-27B-v1.1.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +Gemmasutra-Pro-27B-v1.1.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Gemmasutra-Pro-27B-v1.1.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +Gemmasutra-Pro-27B-v1.1.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +Gemmasutra-Pro-27B-v1.1.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/Gemmasutra-Pro-27B-v1.1.i1-IQ1_M.gguf b/Gemmasutra-Pro-27B-v1.1.i1-IQ1_M.gguf new file mode 100644 index 0000000..78d30fc --- /dev/null +++ b/Gemmasutra-Pro-27B-v1.1.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a943941da34585ed65a6cdcb4dae93688da4e2c43033217ec5746c7fc821c9bb +size 
6692470976 diff --git a/Gemmasutra-Pro-27B-v1.1.i1-IQ1_S.gguf b/Gemmasutra-Pro-27B-v1.1.i1-IQ1_S.gguf new file mode 100644 index 0000000..91e525f --- /dev/null +++ b/Gemmasutra-Pro-27B-v1.1.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71e047f39241c5d3da74ed1a6bd79b2cd876c8e6f4c216cc5df2032de9ed98a0 +size 6132433088 diff --git a/Gemmasutra-Pro-27B-v1.1.i1-IQ2_M.gguf b/Gemmasutra-Pro-27B-v1.1.i1-IQ2_M.gguf new file mode 100644 index 0000000..8f0d80e --- /dev/null +++ b/Gemmasutra-Pro-27B-v1.1.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da55e46f4352ad2d1bdea8fd0eca9e6fe8174e08ae26b3b9a11119d17732845d +size 9398878400 diff --git a/Gemmasutra-Pro-27B-v1.1.i1-IQ2_S.gguf b/Gemmasutra-Pro-27B-v1.1.i1-IQ2_S.gguf new file mode 100644 index 0000000..40f2677 --- /dev/null +++ b/Gemmasutra-Pro-27B-v1.1.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b000e23732629fde9f25baab74af64fbcf638e13b28fab563291e91f020ef30 +size 8652161216 diff --git a/Gemmasutra-Pro-27B-v1.1.i1-IQ2_XS.gguf b/Gemmasutra-Pro-27B-v1.1.i1-IQ2_XS.gguf new file mode 100644 index 0000000..bf453ea --- /dev/null +++ b/Gemmasutra-Pro-27B-v1.1.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8da79ec76aadc3e03eac3a216c6c1b6b89e93842a94cd9d0b3d12823ef172694 +size 8399716544 diff --git a/Gemmasutra-Pro-27B-v1.1.i1-IQ2_XXS.gguf b/Gemmasutra-Pro-27B-v1.1.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..b6de006 --- /dev/null +++ b/Gemmasutra-Pro-27B-v1.1.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90c8421039dc1b26b773f11b2eedb3920d4ac33d183bd7e1320cfe2606c87124 +size 7625867456 diff --git a/Gemmasutra-Pro-27B-v1.1.i1-IQ3_M.gguf b/Gemmasutra-Pro-27B-v1.1.i1-IQ3_M.gguf new file mode 100644 index 0000000..72f421e --- /dev/null +++ b/Gemmasutra-Pro-27B-v1.1.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:8a29571a9cd4fc862505fd773a17df21641b65dc098a8725edebb7bc2b99e05f +size 12454830272 diff --git a/Gemmasutra-Pro-27B-v1.1.i1-IQ3_S.gguf b/Gemmasutra-Pro-27B-v1.1.i1-IQ3_S.gguf new file mode 100644 index 0000000..bb1050e --- /dev/null +++ b/Gemmasutra-Pro-27B-v1.1.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c0d38f56778dcfbd188132452c76bd9da55915828ae79cb895a6e4906b6b571 +size 12169060544 diff --git a/Gemmasutra-Pro-27B-v1.1.i1-IQ3_XS.gguf b/Gemmasutra-Pro-27B-v1.1.i1-IQ3_XS.gguf new file mode 100644 index 0000000..42607ac --- /dev/null +++ b/Gemmasutra-Pro-27B-v1.1.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a80aaa144cbb9e0db2decafaca015a37917af3708b4d326d87bbbc4f711a6b8 +size 11550630080 diff --git a/Gemmasutra-Pro-27B-v1.1.i1-IQ3_XXS.gguf b/Gemmasutra-Pro-27B-v1.1.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..d9427d8 --- /dev/null +++ b/Gemmasutra-Pro-27B-v1.1.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b54469aba1bf71203ab1be5b8a26c5d9f3dd89a3a9b447dc52af880076829f1 +size 10750755008 diff --git a/Gemmasutra-Pro-27B-v1.1.i1-IQ4_XS.gguf b/Gemmasutra-Pro-27B-v1.1.i1-IQ4_XS.gguf new file mode 100644 index 0000000..6a886b8 --- /dev/null +++ b/Gemmasutra-Pro-27B-v1.1.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44e4ac658a22140180421a5b0cc3461ca60f808a282f1f7a23c8684a391469f6 +size 14814421184 diff --git a/Gemmasutra-Pro-27B-v1.1.i1-Q2_K.gguf b/Gemmasutra-Pro-27B-v1.1.i1-Q2_K.gguf new file mode 100644 index 0000000..d964d08 --- /dev/null +++ b/Gemmasutra-Pro-27B-v1.1.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b19cede00ea8908b52fe1a3827da3c7ce4050205642f11dbfaaebbebd153d7b9 +size 10449576128 diff --git a/Gemmasutra-Pro-27B-v1.1.i1-Q2_K_S.gguf b/Gemmasutra-Pro-27B-v1.1.i1-Q2_K_S.gguf new file mode 100644 index 
0000000..6a6a9d2 --- /dev/null +++ b/Gemmasutra-Pro-27B-v1.1.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d148d085b6b258b799e2b86ebc51065ee7a36803fca20f28fa77a6c5628a73d8 +size 9722765504 diff --git a/Gemmasutra-Pro-27B-v1.1.i1-Q3_K_L.gguf b/Gemmasutra-Pro-27B-v1.1.i1-Q3_K_L.gguf new file mode 100644 index 0000000..7e9d7d6 --- /dev/null +++ b/Gemmasutra-Pro-27B-v1.1.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37f08c57e7730721d96dfb8faeac078f7524e5fe765eec80adac8acab4aa3ee8 +size 14519361728 diff --git a/Gemmasutra-Pro-27B-v1.1.i1-Q3_K_M.gguf b/Gemmasutra-Pro-27B-v1.1.i1-Q3_K_M.gguf new file mode 100644 index 0000000..ad8a96e --- /dev/null +++ b/Gemmasutra-Pro-27B-v1.1.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbbc306ef16f841f6ce89b24fccf12250ab48ea184daa4e3884012be131b897d +size 13424648384 diff --git a/Gemmasutra-Pro-27B-v1.1.i1-Q3_K_S.gguf b/Gemmasutra-Pro-27B-v1.1.i1-Q3_K_S.gguf new file mode 100644 index 0000000..67d84e8 --- /dev/null +++ b/Gemmasutra-Pro-27B-v1.1.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebd6a8186086065d7efa787b1e3096738452056d2564e43ef1240d4afc800cd8 +size 12169060544 diff --git a/Gemmasutra-Pro-27B-v1.1.i1-Q4_0.gguf b/Gemmasutra-Pro-27B-v1.1.i1-Q4_0.gguf new file mode 100644 index 0000000..a8bce0f --- /dev/null +++ b/Gemmasutra-Pro-27B-v1.1.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a40ce8403e302920055965c5e2473eab1269db0f0e3f2f4c37c3f30b0dd5b988 +size 15681462464 diff --git a/Gemmasutra-Pro-27B-v1.1.i1-Q4_1.gguf b/Gemmasutra-Pro-27B-v1.1.i1-Q4_1.gguf new file mode 100644 index 0000000..f3f8767 --- /dev/null +++ b/Gemmasutra-Pro-27B-v1.1.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65a280191ab153d5b220d4414947f5c5a331a667df634979b540a797ebd2e89e +size 17256292544 diff --git 
a/Gemmasutra-Pro-27B-v1.1.i1-Q4_K_M.gguf b/Gemmasutra-Pro-27B-v1.1.i1-Q4_K_M.gguf new file mode 100644 index 0000000..09c3a91 --- /dev/null +++ b/Gemmasutra-Pro-27B-v1.1.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3876e9d3f6ae95aa16a6e917ee8de05a7883022fbcdcf4359beb3fac8498c3ce +size 16645382336 diff --git a/Gemmasutra-Pro-27B-v1.1.i1-Q4_K_S.gguf b/Gemmasutra-Pro-27B-v1.1.i1-Q4_K_S.gguf new file mode 100644 index 0000000..455ac22 --- /dev/null +++ b/Gemmasutra-Pro-27B-v1.1.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84416172d7fe86c41249b6431f6931de932a246ac9e458011a38d0f5b1845833 +size 15739265216 diff --git a/Gemmasutra-Pro-27B-v1.1.i1-Q5_K_M.gguf b/Gemmasutra-Pro-27B-v1.1.i1-Q5_K_M.gguf new file mode 100644 index 0000000..6215840 --- /dev/null +++ b/Gemmasutra-Pro-27B-v1.1.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b5037b429f3c543deb3d0040d8bf1e271e4410acf9c22fbc700e1358349d91b +size 19408117952 diff --git a/Gemmasutra-Pro-27B-v1.1.i1-Q5_K_S.gguf b/Gemmasutra-Pro-27B-v1.1.i1-Q5_K_S.gguf new file mode 100644 index 0000000..5f74329 --- /dev/null +++ b/Gemmasutra-Pro-27B-v1.1.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dd4e80d2a15fcd96be556fee8e2a9fdf58e6b993841b6e02289733a78358039 +size 18884206784 diff --git a/Gemmasutra-Pro-27B-v1.1.i1-Q6_K.gguf b/Gemmasutra-Pro-27B-v1.1.i1-Q6_K.gguf new file mode 100644 index 0000000..1b996ba --- /dev/null +++ b/Gemmasutra-Pro-27B-v1.1.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d83f4e4ed3363012c69d7f032f3c2ec41cfc957b16e5c4f34dde614476f7c656 +size 22343524544 diff --git a/README.md b/README.md new file mode 100644 index 0000000..d65dfbc --- /dev/null +++ b/README.md @@ -0,0 +1,75 @@ +--- +base_model: TheDrummer/Gemmasutra-Pro-27B-v1.1 +language: +- en +library_name: transformers +license: other +quantized_by: 
mradermacher +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/TheDrummer/Gemmasutra-Pro-27B-v1.1 + + +static quants are available at https://huggingface.co/mradermacher/Gemmasutra-Pro-27B-v1.1-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable to similarly sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/Gemmasutra-Pro-27B-v1.1-i1-GGUF/resolve/main/Gemmasutra-Pro-27B-v1.1.i1-IQ1_S.gguf) | i1-IQ1_S | 6.2 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/Gemmasutra-Pro-27B-v1.1-i1-GGUF/resolve/main/Gemmasutra-Pro-27B-v1.1.i1-IQ1_M.gguf) | i1-IQ1_M | 6.8 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/Gemmasutra-Pro-27B-v1.1-i1-GGUF/resolve/main/Gemmasutra-Pro-27B-v1.1.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 7.7 | | +| [GGUF](https://huggingface.co/mradermacher/Gemmasutra-Pro-27B-v1.1-i1-GGUF/resolve/main/Gemmasutra-Pro-27B-v1.1.i1-IQ2_XS.gguf) | i1-IQ2_XS | 8.5 | | +| [GGUF](https://huggingface.co/mradermacher/Gemmasutra-Pro-27B-v1.1-i1-GGUF/resolve/main/Gemmasutra-Pro-27B-v1.1.i1-IQ2_S.gguf) | i1-IQ2_S | 8.8 | | +| [GGUF](https://huggingface.co/mradermacher/Gemmasutra-Pro-27B-v1.1-i1-GGUF/resolve/main/Gemmasutra-Pro-27B-v1.1.i1-IQ2_M.gguf) | i1-IQ2_M | 9.5 | | +| [GGUF](https://huggingface.co/mradermacher/Gemmasutra-Pro-27B-v1.1-i1-GGUF/resolve/main/Gemmasutra-Pro-27B-v1.1.i1-Q2_K_S.gguf) | i1-Q2_K_S | 9.8 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/Gemmasutra-Pro-27B-v1.1-i1-GGUF/resolve/main/Gemmasutra-Pro-27B-v1.1.i1-Q2_K.gguf) | i1-Q2_K | 10.5 | IQ3_XXS probably better | +| 
[GGUF](https://huggingface.co/mradermacher/Gemmasutra-Pro-27B-v1.1-i1-GGUF/resolve/main/Gemmasutra-Pro-27B-v1.1.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 10.9 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/Gemmasutra-Pro-27B-v1.1-i1-GGUF/resolve/main/Gemmasutra-Pro-27B-v1.1.i1-IQ3_XS.gguf) | i1-IQ3_XS | 11.7 | | +| [GGUF](https://huggingface.co/mradermacher/Gemmasutra-Pro-27B-v1.1-i1-GGUF/resolve/main/Gemmasutra-Pro-27B-v1.1.i1-IQ3_S.gguf) | i1-IQ3_S | 12.3 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/Gemmasutra-Pro-27B-v1.1-i1-GGUF/resolve/main/Gemmasutra-Pro-27B-v1.1.i1-Q3_K_S.gguf) | i1-Q3_K_S | 12.3 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/Gemmasutra-Pro-27B-v1.1-i1-GGUF/resolve/main/Gemmasutra-Pro-27B-v1.1.i1-IQ3_M.gguf) | i1-IQ3_M | 12.6 | | +| [GGUF](https://huggingface.co/mradermacher/Gemmasutra-Pro-27B-v1.1-i1-GGUF/resolve/main/Gemmasutra-Pro-27B-v1.1.i1-Q3_K_M.gguf) | i1-Q3_K_M | 13.5 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/Gemmasutra-Pro-27B-v1.1-i1-GGUF/resolve/main/Gemmasutra-Pro-27B-v1.1.i1-Q3_K_L.gguf) | i1-Q3_K_L | 14.6 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/Gemmasutra-Pro-27B-v1.1-i1-GGUF/resolve/main/Gemmasutra-Pro-27B-v1.1.i1-IQ4_XS.gguf) | i1-IQ4_XS | 14.9 | | +| [GGUF](https://huggingface.co/mradermacher/Gemmasutra-Pro-27B-v1.1-i1-GGUF/resolve/main/Gemmasutra-Pro-27B-v1.1.i1-Q4_0.gguf) | i1-Q4_0 | 15.8 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/Gemmasutra-Pro-27B-v1.1-i1-GGUF/resolve/main/Gemmasutra-Pro-27B-v1.1.i1-Q4_K_S.gguf) | i1-Q4_K_S | 15.8 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/Gemmasutra-Pro-27B-v1.1-i1-GGUF/resolve/main/Gemmasutra-Pro-27B-v1.1.i1-Q4_K_M.gguf) | i1-Q4_K_M | 16.7 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/Gemmasutra-Pro-27B-v1.1-i1-GGUF/resolve/main/Gemmasutra-Pro-27B-v1.1.i1-Q4_1.gguf) | i1-Q4_1 | 17.4 | | +| 
[GGUF](https://huggingface.co/mradermacher/Gemmasutra-Pro-27B-v1.1-i1-GGUF/resolve/main/Gemmasutra-Pro-27B-v1.1.i1-Q5_K_S.gguf) | i1-Q5_K_S | 19.0 | | +| [GGUF](https://huggingface.co/mradermacher/Gemmasutra-Pro-27B-v1.1-i1-GGUF/resolve/main/Gemmasutra-Pro-27B-v1.1.i1-Q5_K_M.gguf) | i1-Q5_K_M | 19.5 | | +| [GGUF](https://huggingface.co/mradermacher/Gemmasutra-Pro-27B-v1.1-i1-GGUF/resolve/main/Gemmasutra-Pro-27B-v1.1.i1-Q6_K.gguf) | i1-Q6_K | 22.4 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for answers to +questions you might have, or to request that another model be quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + +