From fe4d7ba30b8db391d58a4bf9cc84310870c7616c Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Fri, 22 May 2026 16:27:18 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mradermacher/MedraQ-8b-i1-GGUF Source: Original Platform --- .gitattributes | 60 ++++++++++++++++++++++++++ MedraQ-8b.i1-IQ1_M.gguf | 3 ++ MedraQ-8b.i1-IQ1_S.gguf | 3 ++ MedraQ-8b.i1-IQ2_M.gguf | 3 ++ MedraQ-8b.i1-IQ2_S.gguf | 3 ++ MedraQ-8b.i1-IQ2_XS.gguf | 3 ++ MedraQ-8b.i1-IQ2_XXS.gguf | 3 ++ MedraQ-8b.i1-IQ3_M.gguf | 3 ++ MedraQ-8b.i1-IQ3_S.gguf | 3 ++ MedraQ-8b.i1-IQ3_XS.gguf | 3 ++ MedraQ-8b.i1-IQ3_XXS.gguf | 3 ++ MedraQ-8b.i1-IQ4_NL.gguf | 3 ++ MedraQ-8b.i1-IQ4_XS.gguf | 3 ++ MedraQ-8b.i1-Q2_K.gguf | 3 ++ MedraQ-8b.i1-Q2_K_S.gguf | 3 ++ MedraQ-8b.i1-Q3_K_L.gguf | 3 ++ MedraQ-8b.i1-Q3_K_M.gguf | 3 ++ MedraQ-8b.i1-Q3_K_S.gguf | 3 ++ MedraQ-8b.i1-Q4_0.gguf | 3 ++ MedraQ-8b.i1-Q4_1.gguf | 3 ++ MedraQ-8b.i1-Q4_K_M.gguf | 3 ++ MedraQ-8b.i1-Q4_K_S.gguf | 3 ++ MedraQ-8b.i1-Q5_K_M.gguf | 3 ++ MedraQ-8b.i1-Q5_K_S.gguf | 3 ++ MedraQ-8b.i1-Q6_K.gguf | 3 ++ README.md | 91 +++++++++++++++++++++++++++++++++++++++ imatrix.dat | 3 ++ 27 files changed, 226 insertions(+) create mode 100644 .gitattributes create mode 100644 MedraQ-8b.i1-IQ1_M.gguf create mode 100644 MedraQ-8b.i1-IQ1_S.gguf create mode 100644 MedraQ-8b.i1-IQ2_M.gguf create mode 100644 MedraQ-8b.i1-IQ2_S.gguf create mode 100644 MedraQ-8b.i1-IQ2_XS.gguf create mode 100644 MedraQ-8b.i1-IQ2_XXS.gguf create mode 100644 MedraQ-8b.i1-IQ3_M.gguf create mode 100644 MedraQ-8b.i1-IQ3_S.gguf create mode 100644 MedraQ-8b.i1-IQ3_XS.gguf create mode 100644 MedraQ-8b.i1-IQ3_XXS.gguf create mode 100644 MedraQ-8b.i1-IQ4_NL.gguf create mode 100644 MedraQ-8b.i1-IQ4_XS.gguf create mode 100644 MedraQ-8b.i1-Q2_K.gguf create mode 
100644 MedraQ-8b.i1-Q2_K_S.gguf create mode 100644 MedraQ-8b.i1-Q3_K_L.gguf create mode 100644 MedraQ-8b.i1-Q3_K_M.gguf create mode 100644 MedraQ-8b.i1-Q3_K_S.gguf create mode 100644 MedraQ-8b.i1-Q4_0.gguf create mode 100644 MedraQ-8b.i1-Q4_1.gguf create mode 100644 MedraQ-8b.i1-Q4_K_M.gguf create mode 100644 MedraQ-8b.i1-Q4_K_S.gguf create mode 100644 MedraQ-8b.i1-Q5_K_M.gguf create mode 100644 MedraQ-8b.i1-Q5_K_S.gguf create mode 100644 MedraQ-8b.i1-Q6_K.gguf create mode 100644 README.md create mode 100644 imatrix.dat diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..78ecc61 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs 
-text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +MedraQ-8b.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +MedraQ-8b.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +MedraQ-8b.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +MedraQ-8b.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +MedraQ-8b.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +MedraQ-8b.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +MedraQ-8b.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +MedraQ-8b.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text +MedraQ-8b.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +MedraQ-8b.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +MedraQ-8b.i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +MedraQ-8b.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +MedraQ-8b.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +MedraQ-8b.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +MedraQ-8b.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +MedraQ-8b.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +MedraQ-8b.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +MedraQ-8b.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +MedraQ-8b.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +MedraQ-8b.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +MedraQ-8b.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +MedraQ-8b.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +MedraQ-8b.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +MedraQ-8b.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/MedraQ-8b.i1-IQ1_M.gguf b/MedraQ-8b.i1-IQ1_M.gguf new file mode 100644 index 0000000..40a5ccf --- /dev/null +++ b/MedraQ-8b.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:868a52299e0dab6b1002ad79caa79ddaf6b48e8ab4314e8756e73c5803001606 +size 1127018816 diff --git a/MedraQ-8b.i1-IQ1_S.gguf b/MedraQ-8b.i1-IQ1_S.gguf new file mode 100644 index 0000000..15a16d9 --- /dev/null +++ b/MedraQ-8b.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19e41a609c84731a690d37b211be21c081f8d9c710c7d279dbdd4f737211e808 +size 1055256896 diff --git a/MedraQ-8b.i1-IQ2_M.gguf b/MedraQ-8b.i1-IQ2_M.gguf new file mode 100644 index 0000000..7a6be96 --- /dev/null +++ b/MedraQ-8b.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27a798195b9d9468527192e4eff26bc8c516f58f12c3b2856cdeb0fa0611534f +size 1512984896 diff --git a/MedraQ-8b.i1-IQ2_S.gguf b/MedraQ-8b.i1-IQ2_S.gguf new file mode 100644 index 0000000..2c2cd3d --- /dev/null +++ b/MedraQ-8b.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7795770dc4d3eafe673f6747808e5397153625caaba3c204d59614c97a70cc3 +size 1417302336 diff --git a/MedraQ-8b.i1-IQ2_XS.gguf b/MedraQ-8b.i1-IQ2_XS.gguf new file mode 100644 index 0000000..4a83a26 --- /dev/null +++ b/MedraQ-8b.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5df028af3d1417cccb1286a0b7f5855d366fc53f311c1dcf874a091d588c1ddc +size 1354101056 diff --git a/MedraQ-8b.i1-IQ2_XXS.gguf b/MedraQ-8b.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..e98636e --- /dev/null +++ b/MedraQ-8b.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a47af9085f0200232500c819a1fbd750a6b0ad2f9829df743f31338c8dcc5284 +size 1246622016 diff --git a/MedraQ-8b.i1-IQ3_M.gguf b/MedraQ-8b.i1-IQ3_M.gguf new file mode 100644 index 0000000..406d664 --- /dev/null +++ b/MedraQ-8b.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:070b26c8a61f9994b2b7badf8eb2e29594e7862cf128a0f22f937618174760ed +size 1962897216 diff --git a/MedraQ-8b.i1-IQ3_S.gguf b/MedraQ-8b.i1-IQ3_S.gguf new file 
mode 100644 index 0000000..e40464c --- /dev/null +++ b/MedraQ-8b.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70ccc9a2f36b6f3312b3de934c3a759c973d57539aeffc7bd8ad04a633964a63 +size 1899532096 diff --git a/MedraQ-8b.i1-IQ3_XS.gguf b/MedraQ-8b.i1-IQ3_XS.gguf new file mode 100644 index 0000000..04674e1 --- /dev/null +++ b/MedraQ-8b.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f98a5188d8d7253d94d2bef5e9467f0cdbe354fc0670e1e0d13644a207c3dbe +size 1814376256 diff --git a/MedraQ-8b.i1-IQ3_XXS.gguf b/MedraQ-8b.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..2ab596a --- /dev/null +++ b/MedraQ-8b.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea83437b992bcafe57dddf85cfeedb4cdc4178fe8fde512d30b0d4f2bfe89a79 +size 1670189376 diff --git a/MedraQ-8b.i1-IQ4_NL.gguf b/MedraQ-8b.i1-IQ4_NL.gguf new file mode 100644 index 0000000..7ff2539 --- /dev/null +++ b/MedraQ-8b.i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fee8f7edfdb9c06c5a65aae2d4e409c1be357f20fe8c5d9429edc775d7476bb +size 2381344576 diff --git a/MedraQ-8b.i1-IQ4_XS.gguf b/MedraQ-8b.i1-IQ4_XS.gguf new file mode 100644 index 0000000..936383b --- /dev/null +++ b/MedraQ-8b.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54f6522537c9c31b75ed913d49041bf29d23a71a8ea58e52b448df74ba0e4ad2 +size 2270752576 diff --git a/MedraQ-8b.i1-Q2_K.gguf b/MedraQ-8b.i1-Q2_K.gguf new file mode 100644 index 0000000..dece140 --- /dev/null +++ b/MedraQ-8b.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58126e03cf89cca7366f1f48eedc2b847ca7971180c5e8771c9885401fb2e56d +size 1669500736 diff --git a/MedraQ-8b.i1-Q2_K_S.gguf b/MedraQ-8b.i1-Q2_K_S.gguf new file mode 100644 index 0000000..6e7e411 --- /dev/null +++ b/MedraQ-8b.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:70f90b0925fdf8fc48ae75835aaa8f1cbd320c9a6122eecaf2457215a636d80a +size 1563455296 diff --git a/MedraQ-8b.i1-Q3_K_L.gguf b/MedraQ-8b.i1-Q3_K_L.gguf new file mode 100644 index 0000000..e4fc9b8 --- /dev/null +++ b/MedraQ-8b.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:741795aa0bc398651958543ad15725bd347fbf0c788124f936e56fd0269d055d +size 2239786816 diff --git a/MedraQ-8b.i1-Q3_K_M.gguf b/MedraQ-8b.i1-Q3_K_M.gguf new file mode 100644 index 0000000..95babcf --- /dev/null +++ b/MedraQ-8b.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e208cf54f130e262c0452673c2f958a3bac990f73d187af263da67d9f2b80326 +size 2075619136 diff --git a/MedraQ-8b.i1-Q3_K_S.gguf b/MedraQ-8b.i1-Q3_K_S.gguf new file mode 100644 index 0000000..56673ba --- /dev/null +++ b/MedraQ-8b.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2f4a08df9bcb0e4382e6b37c3c49f3317050779b30e8b004a6b8ee1adedb60e +size 1886998336 diff --git a/MedraQ-8b.i1-Q4_0.gguf b/MedraQ-8b.i1-Q4_0.gguf new file mode 100644 index 0000000..12dcca5 --- /dev/null +++ b/MedraQ-8b.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c59e0d7592777d947380a32517fc2d88972df85b5e0104b79c6c9a56b7182913 +size 2375774016 diff --git a/MedraQ-8b.i1-Q4_1.gguf b/MedraQ-8b.i1-Q4_1.gguf new file mode 100644 index 0000000..e667ff1 --- /dev/null +++ b/MedraQ-8b.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:601c37d4b19c8e55684a159183b4670cc09b28ce80eec565b9da882c0a8fac0b +size 2596630336 diff --git a/MedraQ-8b.i1-Q4_K_M.gguf b/MedraQ-8b.i1-Q4_K_M.gguf new file mode 100644 index 0000000..ccb2099 --- /dev/null +++ b/MedraQ-8b.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90bc345ae4a1b27c0ea1f633833e10951397169f62130da83ae4b7d73093dd2b +size 2497281856 diff --git a/MedraQ-8b.i1-Q4_K_S.gguf b/MedraQ-8b.i1-Q4_K_S.gguf new file 
mode 100644 index 0000000..5bf700b --- /dev/null +++ b/MedraQ-8b.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8804abbb0299b082c76a3ffb1e615e788c009f0053cbe8070cc481bd64b7bbe0 +size 2383310656 diff --git a/MedraQ-8b.i1-Q5_K_M.gguf b/MedraQ-8b.i1-Q5_K_M.gguf new file mode 100644 index 0000000..f3bd993 --- /dev/null +++ b/MedraQ-8b.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ad49291f21f1df07e19dcbdab34b00370188658c463da01a07b5803b138f7e1 +size 2889514816 diff --git a/MedraQ-8b.i1-Q5_K_S.gguf b/MedraQ-8b.i1-Q5_K_S.gguf new file mode 100644 index 0000000..83ddcd3 --- /dev/null +++ b/MedraQ-8b.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ecbb767409405e8deef35f9a5c3fd6ea62f89aa0464c765d2d9590822c9a110 +size 2823712576 diff --git a/MedraQ-8b.i1-Q6_K.gguf b/MedraQ-8b.i1-Q6_K.gguf new file mode 100644 index 0000000..0f3ff43 --- /dev/null +++ b/MedraQ-8b.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aeb40c034d68b8703ffe6d94043b7afd00ff1733dd9f303a325354a105e1cfe +size 3306262336 diff --git a/README.md b/README.md new file mode 100644 index 0000000..bd9092b --- /dev/null +++ b/README.md @@ -0,0 +1,91 @@ +--- +base_model: drwlf/MedraQ-8b +datasets: +- nicoboss/medra-medical +language: +- en +- ro +library_name: transformers +license: apache-2.0 +mradermacher: + readme_rev: 1 +quantized_by: mradermacher +tags: +- text-generation +- medical-ai +- summarization +- diagnostic-reasoning +- gemma-3 +- fine-tuned +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/drwlf/MedraQ-8b + + + +***For a convenient overview and download list, visit our [model page for this model](https://hf.tst.eu/model#MedraQ-8b-i1-GGUF).*** + +static quants are available at https://huggingface.co/mradermacher/MedraQ-8b-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's 
+READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/MedraQ-8b-i1-GGUF/resolve/main/MedraQ-8b.i1-IQ1_S.gguf) | i1-IQ1_S | 1.2 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/MedraQ-8b-i1-GGUF/resolve/main/MedraQ-8b.i1-IQ1_M.gguf) | i1-IQ1_M | 1.2 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/MedraQ-8b-i1-GGUF/resolve/main/MedraQ-8b.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 1.3 | | +| [GGUF](https://huggingface.co/mradermacher/MedraQ-8b-i1-GGUF/resolve/main/MedraQ-8b.i1-IQ2_XS.gguf) | i1-IQ2_XS | 1.5 | | +| [GGUF](https://huggingface.co/mradermacher/MedraQ-8b-i1-GGUF/resolve/main/MedraQ-8b.i1-IQ2_S.gguf) | i1-IQ2_S | 1.5 | | +| [GGUF](https://huggingface.co/mradermacher/MedraQ-8b-i1-GGUF/resolve/main/MedraQ-8b.i1-IQ2_M.gguf) | i1-IQ2_M | 1.6 | | +| [GGUF](https://huggingface.co/mradermacher/MedraQ-8b-i1-GGUF/resolve/main/MedraQ-8b.i1-Q2_K_S.gguf) | i1-Q2_K_S | 1.7 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/MedraQ-8b-i1-GGUF/resolve/main/MedraQ-8b.i1-Q2_K.gguf) | i1-Q2_K | 1.8 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/MedraQ-8b-i1-GGUF/resolve/main/MedraQ-8b.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 1.8 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/MedraQ-8b-i1-GGUF/resolve/main/MedraQ-8b.i1-IQ3_XS.gguf) | i1-IQ3_XS | 1.9 | | +| [GGUF](https://huggingface.co/mradermacher/MedraQ-8b-i1-GGUF/resolve/main/MedraQ-8b.i1-Q3_K_S.gguf) | i1-Q3_K_S | 2.0 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/MedraQ-8b-i1-GGUF/resolve/main/MedraQ-8b.i1-IQ3_S.gguf) | i1-IQ3_S | 2.0 | beats Q3_K* | +| 
[GGUF](https://huggingface.co/mradermacher/MedraQ-8b-i1-GGUF/resolve/main/MedraQ-8b.i1-IQ3_M.gguf) | i1-IQ3_M | 2.1 | | +| [GGUF](https://huggingface.co/mradermacher/MedraQ-8b-i1-GGUF/resolve/main/MedraQ-8b.i1-Q3_K_M.gguf) | i1-Q3_K_M | 2.2 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/MedraQ-8b-i1-GGUF/resolve/main/MedraQ-8b.i1-Q3_K_L.gguf) | i1-Q3_K_L | 2.3 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/MedraQ-8b-i1-GGUF/resolve/main/MedraQ-8b.i1-IQ4_XS.gguf) | i1-IQ4_XS | 2.4 | | +| [GGUF](https://huggingface.co/mradermacher/MedraQ-8b-i1-GGUF/resolve/main/MedraQ-8b.i1-Q4_0.gguf) | i1-Q4_0 | 2.5 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/MedraQ-8b-i1-GGUF/resolve/main/MedraQ-8b.i1-IQ4_NL.gguf) | i1-IQ4_NL | 2.5 | prefer IQ4_XS | +| [GGUF](https://huggingface.co/mradermacher/MedraQ-8b-i1-GGUF/resolve/main/MedraQ-8b.i1-Q4_K_S.gguf) | i1-Q4_K_S | 2.5 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/MedraQ-8b-i1-GGUF/resolve/main/MedraQ-8b.i1-Q4_K_M.gguf) | i1-Q4_K_M | 2.6 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/MedraQ-8b-i1-GGUF/resolve/main/MedraQ-8b.i1-Q4_1.gguf) | i1-Q4_1 | 2.7 | | +| [GGUF](https://huggingface.co/mradermacher/MedraQ-8b-i1-GGUF/resolve/main/MedraQ-8b.i1-Q5_K_S.gguf) | i1-Q5_K_S | 2.9 | | +| [GGUF](https://huggingface.co/mradermacher/MedraQ-8b-i1-GGUF/resolve/main/MedraQ-8b.i1-Q5_K_M.gguf) | i1-Q5_K_M | 3.0 | | +| [GGUF](https://huggingface.co/mradermacher/MedraQ-8b-i1-GGUF/resolve/main/MedraQ-8b.i1-Q6_K.gguf) | i1-Q6_K | 3.4 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See 
https://huggingface.co/mradermacher/model_requests for answers to +questions you might have, or if you want another model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..11e4f3b --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:464c30038a5f17e8642a742469347e8675c7844ea7d782896b84d4e6609526e5 +size 3842209