From 45c08b98559f8c5d41bbeeea23372dec78b643c4 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Tue, 5 May 2026 13:42:44 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mradermacher/Codepy-Deepthink-3B-i1-GGUF Source: Original Platform --- .gitattributes | 60 +++++++++++++++++++++ Codepy-Deepthink-3B.i1-IQ1_M.gguf | 3 ++ Codepy-Deepthink-3B.i1-IQ1_S.gguf | 3 ++ Codepy-Deepthink-3B.i1-IQ2_M.gguf | 3 ++ Codepy-Deepthink-3B.i1-IQ2_S.gguf | 3 ++ Codepy-Deepthink-3B.i1-IQ2_XS.gguf | 3 ++ Codepy-Deepthink-3B.i1-IQ2_XXS.gguf | 3 ++ Codepy-Deepthink-3B.i1-IQ3_M.gguf | 3 ++ Codepy-Deepthink-3B.i1-IQ3_S.gguf | 3 ++ Codepy-Deepthink-3B.i1-IQ3_XS.gguf | 3 ++ Codepy-Deepthink-3B.i1-IQ3_XXS.gguf | 3 ++ Codepy-Deepthink-3B.i1-IQ4_NL.gguf | 3 ++ Codepy-Deepthink-3B.i1-IQ4_XS.gguf | 3 ++ Codepy-Deepthink-3B.i1-Q2_K.gguf | 3 ++ Codepy-Deepthink-3B.i1-Q2_K_S.gguf | 3 ++ Codepy-Deepthink-3B.i1-Q3_K_L.gguf | 3 ++ Codepy-Deepthink-3B.i1-Q3_K_M.gguf | 3 ++ Codepy-Deepthink-3B.i1-Q3_K_S.gguf | 3 ++ Codepy-Deepthink-3B.i1-Q4_0.gguf | 3 ++ Codepy-Deepthink-3B.i1-Q4_1.gguf | 3 ++ Codepy-Deepthink-3B.i1-Q4_K_M.gguf | 3 ++ Codepy-Deepthink-3B.i1-Q4_K_S.gguf | 3 ++ Codepy-Deepthink-3B.i1-Q5_K_M.gguf | 3 ++ Codepy-Deepthink-3B.i1-Q5_K_S.gguf | 3 ++ Codepy-Deepthink-3B.i1-Q6_K.gguf | 3 ++ README.md | 84 +++++++++++++++++++++++++++++ imatrix.dat | 3 ++ 27 files changed, 219 insertions(+) create mode 100644 .gitattributes create mode 100644 Codepy-Deepthink-3B.i1-IQ1_M.gguf create mode 100644 Codepy-Deepthink-3B.i1-IQ1_S.gguf create mode 100644 Codepy-Deepthink-3B.i1-IQ2_M.gguf create mode 100644 Codepy-Deepthink-3B.i1-IQ2_S.gguf create mode 100644 Codepy-Deepthink-3B.i1-IQ2_XS.gguf create mode 100644 Codepy-Deepthink-3B.i1-IQ2_XXS.gguf create mode 100644 Codepy-Deepthink-3B.i1-IQ3_M.gguf create mode 100644 Codepy-Deepthink-3B.i1-IQ3_S.gguf create mode 100644 Codepy-Deepthink-3B.i1-IQ3_XS.gguf create mode 100644 Codepy-Deepthink-3B.i1-IQ3_XXS.gguf create mode 100644 Codepy-Deepthink-3B.i1-IQ4_NL.gguf create mode 100644 Codepy-Deepthink-3B.i1-IQ4_XS.gguf create mode 100644 Codepy-Deepthink-3B.i1-Q2_K.gguf create mode 100644 Codepy-Deepthink-3B.i1-Q2_K_S.gguf create mode 100644 Codepy-Deepthink-3B.i1-Q3_K_L.gguf create mode 100644 Codepy-Deepthink-3B.i1-Q3_K_M.gguf create mode 100644 Codepy-Deepthink-3B.i1-Q3_K_S.gguf create mode 100644 Codepy-Deepthink-3B.i1-Q4_0.gguf create mode 100644 Codepy-Deepthink-3B.i1-Q4_1.gguf create mode 100644 Codepy-Deepthink-3B.i1-Q4_K_M.gguf create mode 100644 Codepy-Deepthink-3B.i1-Q4_K_S.gguf create mode 100644 Codepy-Deepthink-3B.i1-Q5_K_M.gguf create mode 100644 Codepy-Deepthink-3B.i1-Q5_K_S.gguf create mode 100644 Codepy-Deepthink-3B.i1-Q6_K.gguf create mode 100644 README.md create mode 100644 imatrix.dat diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..ed94a31 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +Codepy-Deepthink-3B.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +Codepy-Deepthink-3B.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +Codepy-Deepthink-3B.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +Codepy-Deepthink-3B.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +Codepy-Deepthink-3B.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +Codepy-Deepthink-3B.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Codepy-Deepthink-3B.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +Codepy-Deepthink-3B.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text +Codepy-Deepthink-3B.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +Codepy-Deepthink-3B.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Codepy-Deepthink-3B.i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +Codepy-Deepthink-3B.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +Codepy-Deepthink-3B.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +Codepy-Deepthink-3B.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Codepy-Deepthink-3B.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Codepy-Deepthink-3B.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Codepy-Deepthink-3B.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Codepy-Deepthink-3B.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +Codepy-Deepthink-3B.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +Codepy-Deepthink-3B.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Codepy-Deepthink-3B.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Codepy-Deepthink-3B.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Codepy-Deepthink-3B.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Codepy-Deepthink-3B.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/Codepy-Deepthink-3B.i1-IQ1_M.gguf b/Codepy-Deepthink-3B.i1-IQ1_M.gguf new file mode 100644 index 0000000..d32a6d4 --- /dev/null +++ b/Codepy-Deepthink-3B.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a90b43576c92761f92fc86c974be52aa7ac02c31edb299fa890a52483d37a3fd +size 924192800 diff --git a/Codepy-Deepthink-3B.i1-IQ1_S.gguf b/Codepy-Deepthink-3B.i1-IQ1_S.gguf new file mode 100644 index 0000000..e6e012a --- /dev/null +++ b/Codepy-Deepthink-3B.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a74f5734bda3265254b5c3dd6d5b4ee660c529cf9601d530a85a3b3c7f6c6331 +size 868159520 diff --git a/Codepy-Deepthink-3B.i1-IQ2_M.gguf b/Codepy-Deepthink-3B.i1-IQ2_M.gguf new file mode 100644 index 0000000..501f8f5 --- /dev/null +++ b/Codepy-Deepthink-3B.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a0c2fbe42fed829d441e5fb3a41021197613798e6c01bfb3d0fdd39511ca28b +size 1229033504 diff --git a/Codepy-Deepthink-3B.i1-IQ2_S.gguf b/Codepy-Deepthink-3B.i1-IQ2_S.gguf new file mode 100644 index 0000000..65775ea --- /dev/null +++ b/Codepy-Deepthink-3B.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd2e44d8162b62fb2321d4053c7598005ef936ece263b89d4967797cce971e88 +size 1154322464 diff --git a/Codepy-Deepthink-3B.i1-IQ2_XS.gguf b/Codepy-Deepthink-3B.i1-IQ2_XS.gguf new file mode 100644 index 0000000..40f50aa --- /dev/null +++ b/Codepy-Deepthink-3B.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e721ec5789d880c19c217893cdd15209272e23cf1b5ff6ef2e3166564b2943d2 +size 1100550176 diff --git a/Codepy-Deepthink-3B.i1-IQ2_XXS.gguf b/Codepy-Deepthink-3B.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..05d03a3 --- /dev/null +++ b/Codepy-Deepthink-3B.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a51982ae7ddd3ff2236a89896b9087888640750d7b761f96b10ba6f42c1a4ab +size 1017581600 diff --git a/Codepy-Deepthink-3B.i1-IQ3_M.gguf b/Codepy-Deepthink-3B.i1-IQ3_M.gguf new file mode 100644 index 0000000..0dae432 --- /dev/null +++ b/Codepy-Deepthink-3B.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eef45c248901eceeedd07bf1278443dc16df49e7be2bb4ec34f3c92edc0ae6d2 +size 1599670304 diff --git a/Codepy-Deepthink-3B.i1-IQ3_S.gguf b/Codepy-Deepthink-3B.i1-IQ3_S.gguf new file mode 100644 index 0000000..f627c28 --- /dev/null +++ b/Codepy-Deepthink-3B.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d935bbbb9caead53143092cba5d91bf89adf6c0f2e947ef110fd1e588cfc91a0 +size 1542850592 diff --git a/Codepy-Deepthink-3B.i1-IQ3_XS.gguf b/Codepy-Deepthink-3B.i1-IQ3_XS.gguf new file mode 100644 index 0000000..5964fab --- /dev/null +++ b/Codepy-Deepthink-3B.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95446d1ffe3c07ca5ab42979551dbb63dd1fc3fb6256b8b409d5ebabfd0570eb +size 1476790304 diff --git a/Codepy-Deepthink-3B.i1-IQ3_XXS.gguf b/Codepy-Deepthink-3B.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..1f222b2 --- /dev/null +++ b/Codepy-Deepthink-3B.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:972364aeacb19a39bde495f80f81832c4819d6588eff553bf435930a873c17b5 +size 1348767776 diff --git a/Codepy-Deepthink-3B.i1-IQ4_NL.gguf b/Codepy-Deepthink-3B.i1-IQ4_NL.gguf new file mode 100644 index 0000000..f195bad --- /dev/null +++ b/Codepy-Deepthink-3B.i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e3d2e7b738bbd56170237ccf4c2b32c97e732e4d675a90ac009b29d9346f80c +size 1917192224 diff --git a/Codepy-Deepthink-3B.i1-IQ4_XS.gguf b/Codepy-Deepthink-3B.i1-IQ4_XS.gguf new file mode 100644 index 0000000..9dfac8a --- /dev/null +++ b/Codepy-Deepthink-3B.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95cd1415f5936b282d027f08aafa6acfa2c596e876dd884c6887f55a2aa13b3c +size 1829111840 diff --git a/Codepy-Deepthink-3B.i1-Q2_K.gguf b/Codepy-Deepthink-3B.i1-Q2_K.gguf new file mode 100644 index 0000000..ee152cb --- /dev/null +++ b/Codepy-Deepthink-3B.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a578c6fe556a1eeb1550d72693a6c2a11541fbf14e7288ad38c334b70318c04d +size 1363937312 diff --git a/Codepy-Deepthink-3B.i1-Q2_K_S.gguf b/Codepy-Deepthink-3B.i1-Q2_K_S.gguf new file mode 100644 index 0000000..2898a05 --- /dev/null +++ b/Codepy-Deepthink-3B.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0315ff6349be06e1c7a9450421218a42c02b75650aeaa1f48b0ae19bfeff3cb7 +size 1274284064 diff --git a/Codepy-Deepthink-3B.i1-Q3_K_L.gguf b/Codepy-Deepthink-3B.i1-Q3_K_L.gguf new file mode 100644 index 0000000..759c61b --- /dev/null +++ b/Codepy-Deepthink-3B.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4564e19ef268e973fed0bec42a4fcefb80c4f5ea50f144e01e4638083e305b7d +size 1815349280 diff --git a/Codepy-Deepthink-3B.i1-Q3_K_M.gguf b/Codepy-Deepthink-3B.i1-Q3_K_M.gguf new file mode 100644 index 0000000..e338bf8 --- /dev/null +++ b/Codepy-Deepthink-3B.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2131bbc264b65ff1b5f6a3dd1474cbc120bda40f9871afe4f56cf1529af41fc5 +size 1687160864 diff --git a/Codepy-Deepthink-3B.i1-Q3_K_S.gguf b/Codepy-Deepthink-3B.i1-Q3_K_S.gguf new file mode 100644 index 0000000..9540b48 --- /dev/null +++ b/Codepy-Deepthink-3B.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b15f12a1e346c949e590057ac8975d63ec2ad641ae247a63ae8e4aef2c7d21b +size 1542850592 diff --git a/Codepy-Deepthink-3B.i1-Q4_0.gguf b/Codepy-Deepthink-3B.i1-Q4_0.gguf new file mode 100644 index 0000000..837cdf8 --- /dev/null +++ b/Codepy-Deepthink-3B.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22defaa6babc6e1c56136d8aba0ebd6133b250a68a9380ab47735af90f274abc +size 1921910816 diff --git a/Codepy-Deepthink-3B.i1-Q4_1.gguf b/Codepy-Deepthink-3B.i1-Q4_1.gguf new file mode 100644 index 0000000..077e2e9 --- /dev/null +++ b/Codepy-Deepthink-3B.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f39c156e6adc6b8186a26c598479c4f83d4227e93bcbec84d7e8f6f22fbe7080 +size 2093352992 diff --git a/Codepy-Deepthink-3B.i1-Q4_K_M.gguf b/Codepy-Deepthink-3B.i1-Q4_K_M.gguf new file mode 100644 index 0000000..57446e0 --- /dev/null +++ b/Codepy-Deepthink-3B.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69a73131a840ca4c119edf7b0f6a3312961503287c345083061ab78cd9add68e +size 2019379232 diff --git a/Codepy-Deepthink-3B.i1-Q4_K_S.gguf b/Codepy-Deepthink-3B.i1-Q4_K_S.gguf new file mode 100644 index 0000000..ccc0a50 --- /dev/null +++ b/Codepy-Deepthink-3B.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7814c6d483255d5c1ffd66426b42737e4891483c0f2dab1f10a740a3313126e9 +size 1928202272 diff --git a/Codepy-Deepthink-3B.i1-Q5_K_M.gguf b/Codepy-Deepthink-3B.i1-Q5_K_M.gguf new file mode 100644 index 0000000..9803552 --- /dev/null +++ b/Codepy-Deepthink-3B.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2af43bf5fbcf4afe4b9cb873c6b0e1b34dd978ccada22bebe541e2c8d366b2d8 +size 2322155552 diff --git a/Codepy-Deepthink-3B.i1-Q5_K_S.gguf b/Codepy-Deepthink-3B.i1-Q5_K_S.gguf new file mode 100644 index 0000000..75e0ba5 --- /dev/null +++ b/Codepy-Deepthink-3B.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd6fc47bfcc17137ea54d4ff9518a3e617c1c562cd026b1f3b3e29002c29c556 +size 2269513760 diff --git a/Codepy-Deepthink-3B.i1-Q6_K.gguf b/Codepy-Deepthink-3B.i1-Q6_K.gguf new file mode 100644 index 0000000..2d11115 --- /dev/null +++ b/Codepy-Deepthink-3B.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2d8f1b294eb1b5930ee9f9f81542cbf4c7463c041bba663e92b061b1f09b225 +size 2643855392 diff --git a/README.md b/README.md new file mode 100644 index 0000000..6ee9a4f --- /dev/null +++ b/README.md @@ -0,0 +1,84 @@ +--- +base_model: prithivMLmods/Codepy-Deepthink-3B +language: +- en +library_name: transformers +license: creativeml-openrail-m +quantized_by: mradermacher +tags: +- codepy +- safetensors +- ollama +- llama-cpp +- trl +- deep-think +- coder +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/prithivMLmods/Codepy-Deepthink-3B + + +static quants are available at https://huggingface.co/mradermacher/Codepy-Deepthink-3B-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/Codepy-Deepthink-3B-i1-GGUF/resolve/main/Codepy-Deepthink-3B.i1-IQ1_S.gguf) | i1-IQ1_S | 1.0 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/Codepy-Deepthink-3B-i1-GGUF/resolve/main/Codepy-Deepthink-3B.i1-IQ1_M.gguf) | i1-IQ1_M | 1.0 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/Codepy-Deepthink-3B-i1-GGUF/resolve/main/Codepy-Deepthink-3B.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 1.1 | | +| [GGUF](https://huggingface.co/mradermacher/Codepy-Deepthink-3B-i1-GGUF/resolve/main/Codepy-Deepthink-3B.i1-IQ2_XS.gguf) | i1-IQ2_XS | 1.2 | | +| [GGUF](https://huggingface.co/mradermacher/Codepy-Deepthink-3B-i1-GGUF/resolve/main/Codepy-Deepthink-3B.i1-IQ2_S.gguf) | i1-IQ2_S | 1.3 | | +| [GGUF](https://huggingface.co/mradermacher/Codepy-Deepthink-3B-i1-GGUF/resolve/main/Codepy-Deepthink-3B.i1-IQ2_M.gguf) | i1-IQ2_M | 1.3 | | +| [GGUF](https://huggingface.co/mradermacher/Codepy-Deepthink-3B-i1-GGUF/resolve/main/Codepy-Deepthink-3B.i1-Q2_K_S.gguf) | i1-Q2_K_S | 1.4 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/Codepy-Deepthink-3B-i1-GGUF/resolve/main/Codepy-Deepthink-3B.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 1.4 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/Codepy-Deepthink-3B-i1-GGUF/resolve/main/Codepy-Deepthink-3B.i1-Q2_K.gguf) | i1-Q2_K | 1.5 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/Codepy-Deepthink-3B-i1-GGUF/resolve/main/Codepy-Deepthink-3B.i1-IQ3_XS.gguf) | i1-IQ3_XS | 1.6 | | +| [GGUF](https://huggingface.co/mradermacher/Codepy-Deepthink-3B-i1-GGUF/resolve/main/Codepy-Deepthink-3B.i1-IQ3_S.gguf) | i1-IQ3_S | 1.6 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/Codepy-Deepthink-3B-i1-GGUF/resolve/main/Codepy-Deepthink-3B.i1-Q3_K_S.gguf) | i1-Q3_K_S | 1.6 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/Codepy-Deepthink-3B-i1-GGUF/resolve/main/Codepy-Deepthink-3B.i1-IQ3_M.gguf) | i1-IQ3_M | 1.7 | | +| [GGUF](https://huggingface.co/mradermacher/Codepy-Deepthink-3B-i1-GGUF/resolve/main/Codepy-Deepthink-3B.i1-Q3_K_M.gguf) | i1-Q3_K_M | 1.8 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/Codepy-Deepthink-3B-i1-GGUF/resolve/main/Codepy-Deepthink-3B.i1-Q3_K_L.gguf) | i1-Q3_K_L | 1.9 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/Codepy-Deepthink-3B-i1-GGUF/resolve/main/Codepy-Deepthink-3B.i1-IQ4_XS.gguf) | i1-IQ4_XS | 1.9 | | +| [GGUF](https://huggingface.co/mradermacher/Codepy-Deepthink-3B-i1-GGUF/resolve/main/Codepy-Deepthink-3B.i1-IQ4_NL.gguf) | i1-IQ4_NL | 2.0 | prefer IQ4_XS | +| [GGUF](https://huggingface.co/mradermacher/Codepy-Deepthink-3B-i1-GGUF/resolve/main/Codepy-Deepthink-3B.i1-Q4_0.gguf) | i1-Q4_0 | 2.0 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/Codepy-Deepthink-3B-i1-GGUF/resolve/main/Codepy-Deepthink-3B.i1-Q4_K_S.gguf) | i1-Q4_K_S | 2.0 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/Codepy-Deepthink-3B-i1-GGUF/resolve/main/Codepy-Deepthink-3B.i1-Q4_K_M.gguf) | i1-Q4_K_M | 2.1 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/Codepy-Deepthink-3B-i1-GGUF/resolve/main/Codepy-Deepthink-3B.i1-Q4_1.gguf) | i1-Q4_1 | 2.2 | | +| [GGUF](https://huggingface.co/mradermacher/Codepy-Deepthink-3B-i1-GGUF/resolve/main/Codepy-Deepthink-3B.i1-Q5_K_S.gguf) | i1-Q5_K_S | 2.4 | | +| [GGUF](https://huggingface.co/mradermacher/Codepy-Deepthink-3B-i1-GGUF/resolve/main/Codepy-Deepthink-3B.i1-Q5_K_M.gguf) | i1-Q5_K_M | 2.4 | | +| [GGUF](https://huggingface.co/mradermacher/Codepy-Deepthink-3B-i1-GGUF/resolve/main/Codepy-Deepthink-3B.i1-Q6_K.gguf) | i1-Q6_K | 2.7 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..a6566f8 --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:975a35f07e52f1623b1195baf56ca8cef87df4b604d076c3adf378dca7df609d +size 2988377