From d7aa4d6b192dc6f6b4751940f21aab73089fab4b Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Fri, 1 May 2026 02:27:58 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mradermacher/Phi-4-QwQ-i1-GGUF Source: Original Platform --- .gitattributes | 60 +++++++++++++++++++++++++++++ Phi-4-QwQ.i1-IQ1_M.gguf | 3 ++ Phi-4-QwQ.i1-IQ1_S.gguf | 3 ++ Phi-4-QwQ.i1-IQ2_M.gguf | 3 ++ Phi-4-QwQ.i1-IQ2_S.gguf | 3 ++ Phi-4-QwQ.i1-IQ2_XS.gguf | 3 ++ Phi-4-QwQ.i1-IQ2_XXS.gguf | 3 ++ Phi-4-QwQ.i1-IQ3_M.gguf | 3 ++ Phi-4-QwQ.i1-IQ3_S.gguf | 3 ++ Phi-4-QwQ.i1-IQ3_XS.gguf | 3 ++ Phi-4-QwQ.i1-IQ3_XXS.gguf | 3 ++ Phi-4-QwQ.i1-IQ4_NL.gguf | 3 ++ Phi-4-QwQ.i1-IQ4_XS.gguf | 3 ++ Phi-4-QwQ.i1-Q2_K.gguf | 3 ++ Phi-4-QwQ.i1-Q2_K_S.gguf | 3 ++ Phi-4-QwQ.i1-Q3_K_L.gguf | 3 ++ Phi-4-QwQ.i1-Q3_K_M.gguf | 3 ++ Phi-4-QwQ.i1-Q3_K_S.gguf | 3 ++ Phi-4-QwQ.i1-Q4_0.gguf | 3 ++ Phi-4-QwQ.i1-Q4_1.gguf | 3 ++ Phi-4-QwQ.i1-Q4_K_M.gguf | 3 ++ Phi-4-QwQ.i1-Q4_K_S.gguf | 3 ++ Phi-4-QwQ.i1-Q5_K_M.gguf | 3 ++ Phi-4-QwQ.i1-Q5_K_S.gguf | 3 ++ Phi-4-QwQ.i1-Q6_K.gguf | 3 ++ README.md | 81 +++++++++++++++++++++++++++++++++++++++ imatrix.dat | 3 ++ 27 files changed, 216 insertions(+) create mode 100644 .gitattributes create mode 100644 Phi-4-QwQ.i1-IQ1_M.gguf create mode 100644 Phi-4-QwQ.i1-IQ1_S.gguf create mode 100644 Phi-4-QwQ.i1-IQ2_M.gguf create mode 100644 Phi-4-QwQ.i1-IQ2_S.gguf create mode 100644 Phi-4-QwQ.i1-IQ2_XS.gguf create mode 100644 Phi-4-QwQ.i1-IQ2_XXS.gguf create mode 100644 Phi-4-QwQ.i1-IQ3_M.gguf create mode 100644 Phi-4-QwQ.i1-IQ3_S.gguf create mode 100644 Phi-4-QwQ.i1-IQ3_XS.gguf create mode 100644 Phi-4-QwQ.i1-IQ3_XXS.gguf create mode 100644 Phi-4-QwQ.i1-IQ4_NL.gguf create mode 100644 Phi-4-QwQ.i1-IQ4_XS.gguf create mode 100644 Phi-4-QwQ.i1-Q2_K.gguf create mode 100644 Phi-4-QwQ.i1-Q2_K_S.gguf create mode 100644 Phi-4-QwQ.i1-Q3_K_L.gguf create mode 100644 Phi-4-QwQ.i1-Q3_K_M.gguf create mode 100644 Phi-4-QwQ.i1-Q3_K_S.gguf create mode 100644 Phi-4-QwQ.i1-Q4_0.gguf create mode 100644 Phi-4-QwQ.i1-Q4_1.gguf create mode 100644 Phi-4-QwQ.i1-Q4_K_M.gguf create mode 100644 Phi-4-QwQ.i1-Q4_K_S.gguf create mode 100644 Phi-4-QwQ.i1-Q5_K_M.gguf create mode 100644 Phi-4-QwQ.i1-Q5_K_S.gguf create mode 100644 Phi-4-QwQ.i1-Q6_K.gguf create mode 100644 README.md create mode 100644 imatrix.dat diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..15dca76 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +Phi-4-QwQ.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +Phi-4-QwQ.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +Phi-4-QwQ.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Phi-4-QwQ.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Phi-4-QwQ.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Phi-4-QwQ.i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +Phi-4-QwQ.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +Phi-4-QwQ.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Phi-4-QwQ.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Phi-4-QwQ.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +Phi-4-QwQ.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +Phi-4-QwQ.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +Phi-4-QwQ.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Phi-4-QwQ.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Phi-4-QwQ.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Phi-4-QwQ.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +Phi-4-QwQ.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Phi-4-QwQ.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +Phi-4-QwQ.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +Phi-4-QwQ.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +Phi-4-QwQ.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Phi-4-QwQ.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +Phi-4-QwQ.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +Phi-4-QwQ.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/Phi-4-QwQ.i1-IQ1_M.gguf b/Phi-4-QwQ.i1-IQ1_M.gguf new file mode 100644 index 0000000..1e24887 --- /dev/null +++ b/Phi-4-QwQ.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:391fa0ff88f0ecee5771228cdfde2f345b21e50a953f06fd8507368583755137 +size 3690188928 diff --git a/Phi-4-QwQ.i1-IQ1_S.gguf b/Phi-4-QwQ.i1-IQ1_S.gguf new file mode 100644 index 0000000..df8ac6c --- /dev/null +++ b/Phi-4-QwQ.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d011c24052a841022ed33cdfa64db111dac409dd6b3cc5d77eec571c221d984 +size 3412172928 diff --git a/Phi-4-QwQ.i1-IQ2_M.gguf b/Phi-4-QwQ.i1-IQ2_M.gguf new file mode 100644 index 0000000..181f89f --- /dev/null +++ b/Phi-4-QwQ.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc4028b2ed7a835392c0f5f7170d23a89cb1886dbc2e9fc2358bc35327670335 +size 5173923968 diff --git a/Phi-4-QwQ.i1-IQ2_S.gguf b/Phi-4-QwQ.i1-IQ2_S.gguf new file mode 100644 index 0000000..86d529c --- /dev/null +++ b/Phi-4-QwQ.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d55361224b872cb43b2b17b76e529120e9974a85cd143ac418b7cdfa8c46c2f +size 4803235968 diff --git a/Phi-4-QwQ.i1-IQ2_XS.gguf b/Phi-4-QwQ.i1-IQ2_XS.gguf new file mode 100644 index 0000000..f9755bc --- /dev/null +++ b/Phi-4-QwQ.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46260a4a841ee9b27bf253e5b29b03a666f5bb08f01e6aaf32ad18bce62c2a18 +size 4557004928 diff --git a/Phi-4-QwQ.i1-IQ2_XXS.gguf b/Phi-4-QwQ.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..b6fb4ef --- /dev/null +++ b/Phi-4-QwQ.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af0a6b603fc9e71d6e56f8b0e1e5ed6e1ae7af21031b32d81846695c77854f87 +size 4153548928 diff --git a/Phi-4-QwQ.i1-IQ3_M.gguf b/Phi-4-QwQ.i1-IQ3_M.gguf new file mode 100644 index 0000000..4d6478f --- /dev/null +++ b/Phi-4-QwQ.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d5edba8f4e3399fa17eb5043adce653e912c72202d50e4615a474b0707990c1 +size 6739763328 diff --git a/Phi-4-QwQ.i1-IQ3_S.gguf b/Phi-4-QwQ.i1-IQ3_S.gguf new file mode 100644 index 0000000..9f4a22b --- /dev/null +++ b/Phi-4-QwQ.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5be47080ff37cf5e0c36a0a5ca350f5fec508410cc18408b3047fc1df0d6c893 +size 6539571328 diff --git a/Phi-4-QwQ.i1-IQ3_XS.gguf b/Phi-4-QwQ.i1-IQ3_XS.gguf new file mode 100644 index 0000000..b8dac4b --- /dev/null +++ b/Phi-4-QwQ.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:331301bb094a7e84cf46594c3d0d2764052563a6a1a59980d423aa6686b67edf +size 6220083328 diff --git a/Phi-4-QwQ.i1-IQ3_XXS.gguf b/Phi-4-QwQ.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..634922a --- /dev/null +++ b/Phi-4-QwQ.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd2c78063126630788cf1fe91b86cc1c28c0d27974f3ee848253cfab880faa72 +size 5811875968 diff --git a/Phi-4-QwQ.i1-IQ4_NL.gguf b/Phi-4-QwQ.i1-IQ4_NL.gguf new file mode 100644 index 0000000..b4b3dd5 --- /dev/null +++ b/Phi-4-QwQ.i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab8f8eef83c8a1625b9c41916bd1fb2cf9474ed771e7a2b17d02f89fab70ff57 +size 8416194688 diff --git a/Phi-4-QwQ.i1-IQ4_XS.gguf b/Phi-4-QwQ.i1-IQ4_XS.gguf new file mode 100644 index 0000000..803b3dc --- /dev/null +++ b/Phi-4-QwQ.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07d3c1e8061e9887b1d23ea73cd12b510ef670a66ad4f11842611875894ddd18 +size 7982346368 diff --git a/Phi-4-QwQ.i1-Q2_K.gguf b/Phi-4-QwQ.i1-Q2_K.gguf new file mode 100644 index 0000000..34e361f --- /dev/null +++ b/Phi-4-QwQ.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:011e0814c7d2ac794473cee2ac860857ef95086c5a049d514a59e4b6e8647b09 +size 5608796288 diff --git a/Phi-4-QwQ.i1-Q2_K_S.gguf b/Phi-4-QwQ.i1-Q2_K_S.gguf new file mode 100644 index 0000000..612a620 --- /dev/null +++ b/Phi-4-QwQ.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee27c1991c8e45a9af33cfab68632a83dad777f700153450d90d24cf39a29505 +size 5237084288 diff --git a/Phi-4-QwQ.i1-Q3_K_L.gguf b/Phi-4-QwQ.i1-Q3_K_L.gguf new file mode 100644 index 0000000..6ab2092 --- /dev/null +++ b/Phi-4-QwQ.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f87d3fec0900da824071f3ed01cc334524ce3a510b115a83052b932d50945e28 +size 7788851328 diff --git a/Phi-4-QwQ.i1-Q3_K_M.gguf b/Phi-4-QwQ.i1-Q3_K_M.gguf new file mode 100644 index 0000000..d333a71 --- /dev/null +++ b/Phi-4-QwQ.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d65422563230e9ca84ec899174fbbcd116b385244a6acd06e4de2993020a726c +size 7190835328 diff --git a/Phi-4-QwQ.i1-Q3_K_S.gguf b/Phi-4-QwQ.i1-Q3_K_S.gguf new file mode 100644 index 0000000..43d6e7e --- /dev/null +++ b/Phi-4-QwQ.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3fc90b704671464c694de81ac408c1be6092fedbe83072f19419b3015936574 +size 6504755328 diff --git a/Phi-4-QwQ.i1-Q4_0.gguf b/Phi-4-QwQ.i1-Q4_0.gguf new file mode 100644 index 0000000..667e348 --- /dev/null +++ b/Phi-4-QwQ.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2727da54956f75f1b27af1aef0cc1581a5735aff45e71ddc02339a186591befc +size 8412098688 diff --git a/Phi-4-QwQ.i1-Q4_1.gguf b/Phi-4-QwQ.i1-Q4_1.gguf new file mode 100644 index 0000000..2c385d2 --- /dev/null +++ b/Phi-4-QwQ.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:701f86394a038ed31c3ba77a6feb0ad68a58e60078451febc994ff610fdeac04 +size 9267507328 diff --git a/Phi-4-QwQ.i1-Q4_K_M.gguf b/Phi-4-QwQ.i1-Q4_K_M.gguf new file mode 100644 index 0000000..3a4c1c9 --- /dev/null +++ b/Phi-4-QwQ.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63f02baeeef06e3c52ce258712018b3e57df8b3015b0b38cf9f3b18767c47ac4 +size 8890306688 diff --git a/Phi-4-QwQ.i1-Q4_K_S.gguf b/Phi-4-QwQ.i1-Q4_K_S.gguf new file mode 100644 index 0000000..9134b11 --- /dev/null +++ b/Phi-4-QwQ.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bf3915418761d8d1b5f2588092aca804e88e346fb355805ce71010f0ff1dbdd +size 8444047488 diff --git a/Phi-4-QwQ.i1-Q5_K_M.gguf b/Phi-4-QwQ.i1-Q5_K_M.gguf new file mode 100644 index 0000000..60be564 --- /dev/null +++ b/Phi-4-QwQ.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41234632ef6cc99bde3aff8e8d8721bac49f028bb8d790d5531486daf6831c4e +size 10412707968 diff --git a/Phi-4-QwQ.i1-Q5_K_S.gguf b/Phi-4-QwQ.i1-Q5_K_S.gguf new file mode 100644 index 0000000..603b471 --- /dev/null +++ b/Phi-4-QwQ.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67b3ac26798c900eec23b86d4230b7651c4ba50ef7ba969bc7066b0d8255e630 +size 10151587968 diff --git a/Phi-4-QwQ.i1-Q6_K.gguf b/Phi-4-QwQ.i1-Q6_K.gguf new file mode 100644 index 0000000..dcbeb6b --- /dev/null +++ b/Phi-4-QwQ.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48cbcfa44d632058c1a7b283dd7b4ebbfc2203ff0522dcd45a65465d9a15b864 +size 12030259328 diff --git a/README.md b/README.md new file mode 100644 index 0000000..b577bc1 --- /dev/null +++ b/README.md @@ -0,0 +1,81 @@ +--- +base_model: prithivMLmods/Phi-4-QwQ +language: +- en +library_name: transformers +license: mit +quantized_by: mradermacher +tags: +- text-generation-inference +- llama +- phi3 +- phi +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/prithivMLmods/Phi-4-QwQ + + +static quants are available at https://huggingface.co/mradermacher/Phi-4-QwQ-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/Phi-4-QwQ-i1-GGUF/resolve/main/Phi-4-QwQ.i1-IQ1_S.gguf) | i1-IQ1_S | 3.5 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/Phi-4-QwQ-i1-GGUF/resolve/main/Phi-4-QwQ.i1-IQ1_M.gguf) | i1-IQ1_M | 3.8 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/Phi-4-QwQ-i1-GGUF/resolve/main/Phi-4-QwQ.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 4.3 | | +| [GGUF](https://huggingface.co/mradermacher/Phi-4-QwQ-i1-GGUF/resolve/main/Phi-4-QwQ.i1-IQ2_XS.gguf) | i1-IQ2_XS | 4.7 | | +| [GGUF](https://huggingface.co/mradermacher/Phi-4-QwQ-i1-GGUF/resolve/main/Phi-4-QwQ.i1-IQ2_S.gguf) | i1-IQ2_S | 4.9 | | +| [GGUF](https://huggingface.co/mradermacher/Phi-4-QwQ-i1-GGUF/resolve/main/Phi-4-QwQ.i1-IQ2_M.gguf) | i1-IQ2_M | 5.3 | | +| [GGUF](https://huggingface.co/mradermacher/Phi-4-QwQ-i1-GGUF/resolve/main/Phi-4-QwQ.i1-Q2_K_S.gguf) | i1-Q2_K_S | 5.3 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/Phi-4-QwQ-i1-GGUF/resolve/main/Phi-4-QwQ.i1-Q2_K.gguf) | i1-Q2_K | 5.7 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/Phi-4-QwQ-i1-GGUF/resolve/main/Phi-4-QwQ.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 5.9 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/Phi-4-QwQ-i1-GGUF/resolve/main/Phi-4-QwQ.i1-IQ3_XS.gguf) | i1-IQ3_XS | 6.3 | | +| [GGUF](https://huggingface.co/mradermacher/Phi-4-QwQ-i1-GGUF/resolve/main/Phi-4-QwQ.i1-Q3_K_S.gguf) | i1-Q3_K_S | 6.6 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/Phi-4-QwQ-i1-GGUF/resolve/main/Phi-4-QwQ.i1-IQ3_S.gguf) | i1-IQ3_S | 6.6 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/Phi-4-QwQ-i1-GGUF/resolve/main/Phi-4-QwQ.i1-IQ3_M.gguf) | i1-IQ3_M | 6.8 | | +| [GGUF](https://huggingface.co/mradermacher/Phi-4-QwQ-i1-GGUF/resolve/main/Phi-4-QwQ.i1-Q3_K_M.gguf) | i1-Q3_K_M | 7.3 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/Phi-4-QwQ-i1-GGUF/resolve/main/Phi-4-QwQ.i1-Q3_K_L.gguf) | i1-Q3_K_L | 7.9 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/Phi-4-QwQ-i1-GGUF/resolve/main/Phi-4-QwQ.i1-IQ4_XS.gguf) | i1-IQ4_XS | 8.1 | | +| [GGUF](https://huggingface.co/mradermacher/Phi-4-QwQ-i1-GGUF/resolve/main/Phi-4-QwQ.i1-Q4_0.gguf) | i1-Q4_0 | 8.5 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/Phi-4-QwQ-i1-GGUF/resolve/main/Phi-4-QwQ.i1-IQ4_NL.gguf) | i1-IQ4_NL | 8.5 | prefer IQ4_XS | +| [GGUF](https://huggingface.co/mradermacher/Phi-4-QwQ-i1-GGUF/resolve/main/Phi-4-QwQ.i1-Q4_K_S.gguf) | i1-Q4_K_S | 8.5 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/Phi-4-QwQ-i1-GGUF/resolve/main/Phi-4-QwQ.i1-Q4_K_M.gguf) | i1-Q4_K_M | 9.0 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/Phi-4-QwQ-i1-GGUF/resolve/main/Phi-4-QwQ.i1-Q4_1.gguf) | i1-Q4_1 | 9.4 | | +| [GGUF](https://huggingface.co/mradermacher/Phi-4-QwQ-i1-GGUF/resolve/main/Phi-4-QwQ.i1-Q5_K_S.gguf) | i1-Q5_K_S | 10.3 | | +| [GGUF](https://huggingface.co/mradermacher/Phi-4-QwQ-i1-GGUF/resolve/main/Phi-4-QwQ.i1-Q5_K_M.gguf) | i1-Q5_K_M | 10.5 | | +| [GGUF](https://huggingface.co/mradermacher/Phi-4-QwQ-i1-GGUF/resolve/main/Phi-4-QwQ.i1-Q6_K.gguf) | i1-Q6_K | 12.1 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..106419a --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c71a0e2a0649408e24e26fc0c21b1fac3b1fc26808a2b90b5083b52e63fca1e1 +size 7791685