From e12276aeeaf9f32ef64cfbd0c16cb3f1e2b5ce94 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Tue, 21 Apr 2026 21:07:42 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mradermacher/Poseidon-Reasoning-1.7B-i1-GGUF Source: Original Platform --- .gitattributes | 60 ++++++++++++++++ Poseidon-Reasoning-1.7B.i1-IQ1_M.gguf | 3 + Poseidon-Reasoning-1.7B.i1-IQ1_S.gguf | 3 + Poseidon-Reasoning-1.7B.i1-IQ2_M.gguf | 3 + Poseidon-Reasoning-1.7B.i1-IQ2_S.gguf | 3 + Poseidon-Reasoning-1.7B.i1-IQ2_XS.gguf | 3 + Poseidon-Reasoning-1.7B.i1-IQ2_XXS.gguf | 3 + Poseidon-Reasoning-1.7B.i1-IQ3_M.gguf | 3 + Poseidon-Reasoning-1.7B.i1-IQ3_S.gguf | 3 + Poseidon-Reasoning-1.7B.i1-IQ3_XS.gguf | 3 + Poseidon-Reasoning-1.7B.i1-IQ3_XXS.gguf | 3 + Poseidon-Reasoning-1.7B.i1-IQ4_NL.gguf | 3 + Poseidon-Reasoning-1.7B.i1-IQ4_XS.gguf | 3 + Poseidon-Reasoning-1.7B.i1-Q2_K.gguf | 3 + Poseidon-Reasoning-1.7B.i1-Q2_K_S.gguf | 3 + Poseidon-Reasoning-1.7B.i1-Q3_K_L.gguf | 3 + Poseidon-Reasoning-1.7B.i1-Q3_K_M.gguf | 3 + Poseidon-Reasoning-1.7B.i1-Q3_K_S.gguf | 3 + Poseidon-Reasoning-1.7B.i1-Q4_0.gguf | 3 + Poseidon-Reasoning-1.7B.i1-Q4_1.gguf | 3 + Poseidon-Reasoning-1.7B.i1-Q4_K_M.gguf | 3 + Poseidon-Reasoning-1.7B.i1-Q4_K_S.gguf | 3 + Poseidon-Reasoning-1.7B.i1-Q5_K_M.gguf | 3 + Poseidon-Reasoning-1.7B.i1-Q5_K_S.gguf | 3 + Poseidon-Reasoning-1.7B.i1-Q6_K.gguf | 3 + README.md | 91 +++++++++++++++++++++++++ imatrix.dat | 3 + 27 files changed, 226 insertions(+) create mode 100644 .gitattributes create mode 100644 Poseidon-Reasoning-1.7B.i1-IQ1_M.gguf create mode 100644 Poseidon-Reasoning-1.7B.i1-IQ1_S.gguf create mode 100644 Poseidon-Reasoning-1.7B.i1-IQ2_M.gguf create mode 100644 Poseidon-Reasoning-1.7B.i1-IQ2_S.gguf create mode 100644 
Poseidon-Reasoning-1.7B.i1-IQ2_XS.gguf create mode 100644 Poseidon-Reasoning-1.7B.i1-IQ2_XXS.gguf create mode 100644 Poseidon-Reasoning-1.7B.i1-IQ3_M.gguf create mode 100644 Poseidon-Reasoning-1.7B.i1-IQ3_S.gguf create mode 100644 Poseidon-Reasoning-1.7B.i1-IQ3_XS.gguf create mode 100644 Poseidon-Reasoning-1.7B.i1-IQ3_XXS.gguf create mode 100644 Poseidon-Reasoning-1.7B.i1-IQ4_NL.gguf create mode 100644 Poseidon-Reasoning-1.7B.i1-IQ4_XS.gguf create mode 100644 Poseidon-Reasoning-1.7B.i1-Q2_K.gguf create mode 100644 Poseidon-Reasoning-1.7B.i1-Q2_K_S.gguf create mode 100644 Poseidon-Reasoning-1.7B.i1-Q3_K_L.gguf create mode 100644 Poseidon-Reasoning-1.7B.i1-Q3_K_M.gguf create mode 100644 Poseidon-Reasoning-1.7B.i1-Q3_K_S.gguf create mode 100644 Poseidon-Reasoning-1.7B.i1-Q4_0.gguf create mode 100644 Poseidon-Reasoning-1.7B.i1-Q4_1.gguf create mode 100644 Poseidon-Reasoning-1.7B.i1-Q4_K_M.gguf create mode 100644 Poseidon-Reasoning-1.7B.i1-Q4_K_S.gguf create mode 100644 Poseidon-Reasoning-1.7B.i1-Q5_K_M.gguf create mode 100644 Poseidon-Reasoning-1.7B.i1-Q5_K_S.gguf create mode 100644 Poseidon-Reasoning-1.7B.i1-Q6_K.gguf create mode 100644 README.md create mode 100644 imatrix.dat diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..1d1bae8 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text 
+*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +Poseidon-Reasoning-1.7B.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +Poseidon-Reasoning-1.7B.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +Poseidon-Reasoning-1.7B.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +Poseidon-Reasoning-1.7B.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +Poseidon-Reasoning-1.7B.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +Poseidon-Reasoning-1.7B.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Poseidon-Reasoning-1.7B.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +Poseidon-Reasoning-1.7B.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text +Poseidon-Reasoning-1.7B.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +Poseidon-Reasoning-1.7B.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Poseidon-Reasoning-1.7B.i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +Poseidon-Reasoning-1.7B.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +Poseidon-Reasoning-1.7B.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +Poseidon-Reasoning-1.7B.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs 
-text +Poseidon-Reasoning-1.7B.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Poseidon-Reasoning-1.7B.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Poseidon-Reasoning-1.7B.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Poseidon-Reasoning-1.7B.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +Poseidon-Reasoning-1.7B.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +Poseidon-Reasoning-1.7B.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Poseidon-Reasoning-1.7B.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Poseidon-Reasoning-1.7B.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Poseidon-Reasoning-1.7B.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Poseidon-Reasoning-1.7B.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/Poseidon-Reasoning-1.7B.i1-IQ1_M.gguf b/Poseidon-Reasoning-1.7B.i1-IQ1_M.gguf new file mode 100644 index 0000000..22452e7 --- /dev/null +++ b/Poseidon-Reasoning-1.7B.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b614d6e83811dcc1e50ff6f57337e2868e5321b4f3549dea98a6500d32399de8 +size 543794880 diff --git a/Poseidon-Reasoning-1.7B.i1-IQ1_S.gguf b/Poseidon-Reasoning-1.7B.i1-IQ1_S.gguf new file mode 100644 index 0000000..9cdcc29 --- /dev/null +++ b/Poseidon-Reasoning-1.7B.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa5ca79be9f8ed008ecba50b4982cd479eb9a6ab39b08ca066dcb15425d46102 +size 515778240 diff --git a/Poseidon-Reasoning-1.7B.i1-IQ2_M.gguf b/Poseidon-Reasoning-1.7B.i1-IQ2_M.gguf new file mode 100644 index 0000000..ac5a023 --- /dev/null +++ b/Poseidon-Reasoning-1.7B.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e9fd0689c8ffccc46f155aba39cb952e94fc520d5b083e1c33b27b599301955 +size 695183040 diff --git a/Poseidon-Reasoning-1.7B.i1-IQ2_S.gguf b/Poseidon-Reasoning-1.7B.i1-IQ2_S.gguf new file mode 100644 index 0000000..51e4973 --- /dev/null +++ b/Poseidon-Reasoning-1.7B.i1-IQ2_S.gguf @@ -0,0 
+1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00eb082df86c32e7a46c282fa57381c65c780002688c7581b4ab281620265c08 +size 657827520 diff --git a/Poseidon-Reasoning-1.7B.i1-IQ2_XS.gguf b/Poseidon-Reasoning-1.7B.i1-IQ2_XS.gguf new file mode 100644 index 0000000..abbb32e --- /dev/null +++ b/Poseidon-Reasoning-1.7B.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9fc39d55ba2c6ebec8766def30087bec8f9176335f8cf4cc8ab54ec7554139f +size 631514816 diff --git a/Poseidon-Reasoning-1.7B.i1-IQ2_XXS.gguf b/Poseidon-Reasoning-1.7B.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..93df887 --- /dev/null +++ b/Poseidon-Reasoning-1.7B.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d4a4c13562f98a98da8d0dbf629394a500b507dd9332d165a58307eeb048b2c +size 590489280 diff --git a/Poseidon-Reasoning-1.7B.i1-IQ3_M.gguf b/Poseidon-Reasoning-1.7B.i1-IQ3_M.gguf new file mode 100644 index 0000000..17dfaf5 --- /dev/null +++ b/Poseidon-Reasoning-1.7B.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b011b0d26894ffe7ae7f2f37fc4be0df31d72414e99cf489edf77343e3e1799 +size 895663808 diff --git a/Poseidon-Reasoning-1.7B.i1-IQ3_S.gguf b/Poseidon-Reasoning-1.7B.i1-IQ3_S.gguf new file mode 100644 index 0000000..183deaa --- /dev/null +++ b/Poseidon-Reasoning-1.7B.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:909de7fa0a54f37dd180669eb954116753911c323a7539506e1ca98b04523887 +size 867253952 diff --git a/Poseidon-Reasoning-1.7B.i1-IQ3_XS.gguf b/Poseidon-Reasoning-1.7B.i1-IQ3_XS.gguf new file mode 100644 index 0000000..be41a60 --- /dev/null +++ b/Poseidon-Reasoning-1.7B.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e31f9750d75dca25ca0affeffa91655cec682231af227a8429b7089ff7545500 +size 834223808 diff --git a/Poseidon-Reasoning-1.7B.i1-IQ3_XXS.gguf b/Poseidon-Reasoning-1.7B.i1-IQ3_XXS.gguf new file mode 
100644 index 0000000..4973dc4 --- /dev/null +++ b/Poseidon-Reasoning-1.7B.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:124751a49f99b5b8058a8f34d3e107a03fe1048b4cf055999966fe20b3e71b72 +size 754362048 diff --git a/Poseidon-Reasoning-1.7B.i1-IQ4_NL.gguf b/Poseidon-Reasoning-1.7B.i1-IQ4_NL.gguf new file mode 100644 index 0000000..8ae8ed8 --- /dev/null +++ b/Poseidon-Reasoning-1.7B.i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8478024d5e6831f9095e5a333d0d858930d71fb029161dd789f38e7db8926b8f +size 1054424768 diff --git a/Poseidon-Reasoning-1.7B.i1-IQ4_XS.gguf b/Poseidon-Reasoning-1.7B.i1-IQ4_XS.gguf new file mode 100644 index 0000000..a4b1ff0 --- /dev/null +++ b/Poseidon-Reasoning-1.7B.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ac4522a389d98b183d773c2111a20cd0a98f4cb72569525370b2a22df1b4b07 +size 1010384576 diff --git a/Poseidon-Reasoning-1.7B.i1-Q2_K.gguf b/Poseidon-Reasoning-1.7B.i1-Q2_K.gguf new file mode 100644 index 0000000..9571a44 --- /dev/null +++ b/Poseidon-Reasoning-1.7B.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de9619462cefbda7464d9458be90cc688be0cefd7603bac7378cc998c02b223e +size 777797312 diff --git a/Poseidon-Reasoning-1.7B.i1-Q2_K_S.gguf b/Poseidon-Reasoning-1.7B.i1-Q2_K_S.gguf new file mode 100644 index 0000000..a125b0b --- /dev/null +++ b/Poseidon-Reasoning-1.7B.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bdcb1f2ee2bfdae3c0f38d4ba316d28b259d58a4dc4b8810f7541b7aae947bf +size 732970688 diff --git a/Poseidon-Reasoning-1.7B.i1-Q3_K_L.gguf b/Poseidon-Reasoning-1.7B.i1-Q3_K_L.gguf new file mode 100644 index 0000000..8f77d50 --- /dev/null +++ b/Poseidon-Reasoning-1.7B.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55d6842e484453ee4fdcf3bd0ff38817c8544ac7c3f4a9471b13dbc45a4b7eaf +size 1003503296 diff --git 
a/Poseidon-Reasoning-1.7B.i1-Q3_K_M.gguf b/Poseidon-Reasoning-1.7B.i1-Q3_K_M.gguf new file mode 100644 index 0000000..a12a439 --- /dev/null +++ b/Poseidon-Reasoning-1.7B.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90b1b9af51a13ea878742db53adf06ede1279c79ae3171f5a8c44b009261f267 +size 939540160 diff --git a/Poseidon-Reasoning-1.7B.i1-Q3_K_S.gguf b/Poseidon-Reasoning-1.7B.i1-Q3_K_S.gguf new file mode 100644 index 0000000..91ff41d --- /dev/null +++ b/Poseidon-Reasoning-1.7B.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5003ca2117bf51e5722c1fc42f347b8fced59ac5390f81d2b9188885323ed47 +size 867253952 diff --git a/Poseidon-Reasoning-1.7B.i1-Q4_0.gguf b/Poseidon-Reasoning-1.7B.i1-Q4_0.gguf new file mode 100644 index 0000000..9103d0a --- /dev/null +++ b/Poseidon-Reasoning-1.7B.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d13915aae5fe52a7f5e3f73cc0c2ae4d30c9d5327a2d2df897f2e8d81e171bee +size 1056784064 diff --git a/Poseidon-Reasoning-1.7B.i1-Q4_1.gguf b/Poseidon-Reasoning-1.7B.i1-Q4_1.gguf new file mode 100644 index 0000000..dd93563 --- /dev/null +++ b/Poseidon-Reasoning-1.7B.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d56ca201969358fa90038f77dc46f4f04fb001d2fe306e4a7e77dbfb05715666 +size 1142505152 diff --git a/Poseidon-Reasoning-1.7B.i1-Q4_K_M.gguf b/Poseidon-Reasoning-1.7B.i1-Q4_K_M.gguf new file mode 100644 index 0000000..47fd438 --- /dev/null +++ b/Poseidon-Reasoning-1.7B.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1468dfc9adeaa8262fce89a5abf790e1ca1e18cc9ffaa26dd596ff2b53b270b4 +size 1107410624 diff --git a/Poseidon-Reasoning-1.7B.i1-Q4_K_S.gguf b/Poseidon-Reasoning-1.7B.i1-Q4_K_S.gguf new file mode 100644 index 0000000..dbc5add --- /dev/null +++ b/Poseidon-Reasoning-1.7B.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:29167d6452c09518a107924143da179cf6a90c2c41b772f68cf4ad2510be3e4c +size 1060191936 diff --git a/Poseidon-Reasoning-1.7B.i1-Q5_K_M.gguf b/Poseidon-Reasoning-1.7B.i1-Q5_K_M.gguf new file mode 100644 index 0000000..212e921 --- /dev/null +++ b/Poseidon-Reasoning-1.7B.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:637e234046c26470b6a6a0e2109d801d6c8489df1a17449de7cc629cd57ed264 +size 1257881280 diff --git a/Poseidon-Reasoning-1.7B.i1-Q5_K_S.gguf b/Poseidon-Reasoning-1.7B.i1-Q5_K_S.gguf new file mode 100644 index 0000000..6ffee2b --- /dev/null +++ b/Poseidon-Reasoning-1.7B.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f3a3efaf57e5abb43aeb9cc576867763bb497bedf608e456b225cc84aa8b687 +size 1230585536 diff --git a/Poseidon-Reasoning-1.7B.i1-Q6_K.gguf b/Poseidon-Reasoning-1.7B.i1-Q6_K.gguf new file mode 100644 index 0000000..29fd2d0 --- /dev/null +++ b/Poseidon-Reasoning-1.7B.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9159a18812c0c25cf13428d4daccd188f9a98e0d7a14f5be2dcda4820ce28890 +size 1417756352 diff --git a/README.md b/README.md new file mode 100644 index 0000000..0ea84ac --- /dev/null +++ b/README.md @@ -0,0 +1,91 @@ +--- +base_model: prithivMLmods/Poseidon-Reasoning-1.7B +datasets: +- prithivMLmods/Poseidon-Reasoning-5M +language: +- en +library_name: transformers +license: apache-2.0 +mradermacher: + readme_rev: 1 +quantized_by: mradermacher +tags: +- text-generation-inference +- moe +- code +- science +- biology +- chemistry +- thinking +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/prithivMLmods/Poseidon-Reasoning-1.7B + + + +***For a convenient overview and download list, visit our [model page for this model](https://hf.tst.eu/model#Poseidon-Reasoning-1.7B-i1-GGUF).*** + +static quants are available at https://huggingface.co/mradermacher/Poseidon-Reasoning-1.7B-GGUF +## Usage + +If you are unsure how to use 
GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/Poseidon-Reasoning-1.7B-i1-GGUF/resolve/main/Poseidon-Reasoning-1.7B.i1-IQ1_S.gguf) | i1-IQ1_S | 0.6 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/Poseidon-Reasoning-1.7B-i1-GGUF/resolve/main/Poseidon-Reasoning-1.7B.i1-IQ1_M.gguf) | i1-IQ1_M | 0.6 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/Poseidon-Reasoning-1.7B-i1-GGUF/resolve/main/Poseidon-Reasoning-1.7B.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 0.7 | | +| [GGUF](https://huggingface.co/mradermacher/Poseidon-Reasoning-1.7B-i1-GGUF/resolve/main/Poseidon-Reasoning-1.7B.i1-IQ2_XS.gguf) | i1-IQ2_XS | 0.7 | | +| [GGUF](https://huggingface.co/mradermacher/Poseidon-Reasoning-1.7B-i1-GGUF/resolve/main/Poseidon-Reasoning-1.7B.i1-IQ2_S.gguf) | i1-IQ2_S | 0.8 | | +| [GGUF](https://huggingface.co/mradermacher/Poseidon-Reasoning-1.7B-i1-GGUF/resolve/main/Poseidon-Reasoning-1.7B.i1-IQ2_M.gguf) | i1-IQ2_M | 0.8 | | +| [GGUF](https://huggingface.co/mradermacher/Poseidon-Reasoning-1.7B-i1-GGUF/resolve/main/Poseidon-Reasoning-1.7B.i1-Q2_K_S.gguf) | i1-Q2_K_S | 0.8 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/Poseidon-Reasoning-1.7B-i1-GGUF/resolve/main/Poseidon-Reasoning-1.7B.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 0.9 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/Poseidon-Reasoning-1.7B-i1-GGUF/resolve/main/Poseidon-Reasoning-1.7B.i1-Q2_K.gguf) | i1-Q2_K | 0.9 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/Poseidon-Reasoning-1.7B-i1-GGUF/resolve/main/Poseidon-Reasoning-1.7B.i1-IQ3_XS.gguf) | i1-IQ3_XS | 0.9 | | +| 
[GGUF](https://huggingface.co/mradermacher/Poseidon-Reasoning-1.7B-i1-GGUF/resolve/main/Poseidon-Reasoning-1.7B.i1-IQ3_S.gguf) | i1-IQ3_S | 1.0 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/Poseidon-Reasoning-1.7B-i1-GGUF/resolve/main/Poseidon-Reasoning-1.7B.i1-Q3_K_S.gguf) | i1-Q3_K_S | 1.0 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/Poseidon-Reasoning-1.7B-i1-GGUF/resolve/main/Poseidon-Reasoning-1.7B.i1-IQ3_M.gguf) | i1-IQ3_M | 1.0 | | +| [GGUF](https://huggingface.co/mradermacher/Poseidon-Reasoning-1.7B-i1-GGUF/resolve/main/Poseidon-Reasoning-1.7B.i1-Q3_K_M.gguf) | i1-Q3_K_M | 1.0 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/Poseidon-Reasoning-1.7B-i1-GGUF/resolve/main/Poseidon-Reasoning-1.7B.i1-Q3_K_L.gguf) | i1-Q3_K_L | 1.1 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/Poseidon-Reasoning-1.7B-i1-GGUF/resolve/main/Poseidon-Reasoning-1.7B.i1-IQ4_XS.gguf) | i1-IQ4_XS | 1.1 | | +| [GGUF](https://huggingface.co/mradermacher/Poseidon-Reasoning-1.7B-i1-GGUF/resolve/main/Poseidon-Reasoning-1.7B.i1-IQ4_NL.gguf) | i1-IQ4_NL | 1.2 | prefer IQ4_XS | +| [GGUF](https://huggingface.co/mradermacher/Poseidon-Reasoning-1.7B-i1-GGUF/resolve/main/Poseidon-Reasoning-1.7B.i1-Q4_0.gguf) | i1-Q4_0 | 1.2 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/Poseidon-Reasoning-1.7B-i1-GGUF/resolve/main/Poseidon-Reasoning-1.7B.i1-Q4_K_S.gguf) | i1-Q4_K_S | 1.2 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/Poseidon-Reasoning-1.7B-i1-GGUF/resolve/main/Poseidon-Reasoning-1.7B.i1-Q4_K_M.gguf) | i1-Q4_K_M | 1.2 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/Poseidon-Reasoning-1.7B-i1-GGUF/resolve/main/Poseidon-Reasoning-1.7B.i1-Q4_1.gguf) | i1-Q4_1 | 1.2 | | +| [GGUF](https://huggingface.co/mradermacher/Poseidon-Reasoning-1.7B-i1-GGUF/resolve/main/Poseidon-Reasoning-1.7B.i1-Q5_K_S.gguf) | i1-Q5_K_S | 1.3 | | +| 
[GGUF](https://huggingface.co/mradermacher/Poseidon-Reasoning-1.7B-i1-GGUF/resolve/main/Poseidon-Reasoning-1.7B.i1-Q5_K_M.gguf) | i1-Q5_K_M | 1.4 | | +| [GGUF](https://huggingface.co/mradermacher/Poseidon-Reasoning-1.7B-i1-GGUF/resolve/main/Poseidon-Reasoning-1.7B.i1-Q6_K.gguf) | i1-Q6_K | 1.5 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for answers to +questions you might have, or to request that another model be quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..b9ae566 --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e38c8ce7bdfab2e09b25b9a13ca9491f7f3b4ebaf210032ed96794a38acb0c6 +size 2070873