From f0e56b66a1bc0691ce71988013b89bdbe4d3d778 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Thu, 23 Apr 2026 12:22:02 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mradermacher/Kyro-n1.1-3B-i1-GGUF Source: Original Platform --- .gitattributes | 60 +++++++++++++++++++ Kyro-n1.1-3B.i1-IQ1_M.gguf | 3 + Kyro-n1.1-3B.i1-IQ1_S.gguf | 3 + Kyro-n1.1-3B.i1-IQ2_M.gguf | 3 + Kyro-n1.1-3B.i1-IQ2_S.gguf | 3 + Kyro-n1.1-3B.i1-IQ2_XS.gguf | 3 + Kyro-n1.1-3B.i1-IQ2_XXS.gguf | 3 + Kyro-n1.1-3B.i1-IQ3_M.gguf | 3 + Kyro-n1.1-3B.i1-IQ3_S.gguf | 3 + Kyro-n1.1-3B.i1-IQ3_XS.gguf | 3 + Kyro-n1.1-3B.i1-IQ3_XXS.gguf | 3 + Kyro-n1.1-3B.i1-IQ4_NL.gguf | 3 + Kyro-n1.1-3B.i1-IQ4_XS.gguf | 3 + Kyro-n1.1-3B.i1-Q2_K.gguf | 3 + Kyro-n1.1-3B.i1-Q2_K_S.gguf | 3 + Kyro-n1.1-3B.i1-Q3_K_L.gguf | 3 + Kyro-n1.1-3B.i1-Q3_K_M.gguf | 3 + Kyro-n1.1-3B.i1-Q3_K_S.gguf | 3 + Kyro-n1.1-3B.i1-Q4_0.gguf | 3 + Kyro-n1.1-3B.i1-Q4_1.gguf | 3 + Kyro-n1.1-3B.i1-Q4_K_M.gguf | 3 + Kyro-n1.1-3B.i1-Q4_K_S.gguf | 3 + Kyro-n1.1-3B.i1-Q5_K_M.gguf | 3 + Kyro-n1.1-3B.i1-Q5_K_S.gguf | 3 + Kyro-n1.1-3B.i1-Q6_K.gguf | 3 + README.md | 112 +++++++++++++++++++++++++++++++++++ imatrix.dat | 3 + 27 files changed, 247 insertions(+) create mode 100644 .gitattributes create mode 100644 Kyro-n1.1-3B.i1-IQ1_M.gguf create mode 100644 Kyro-n1.1-3B.i1-IQ1_S.gguf create mode 100644 Kyro-n1.1-3B.i1-IQ2_M.gguf create mode 100644 Kyro-n1.1-3B.i1-IQ2_S.gguf create mode 100644 Kyro-n1.1-3B.i1-IQ2_XS.gguf create mode 100644 Kyro-n1.1-3B.i1-IQ2_XXS.gguf create mode 100644 Kyro-n1.1-3B.i1-IQ3_M.gguf create mode 100644 Kyro-n1.1-3B.i1-IQ3_S.gguf create mode 100644 Kyro-n1.1-3B.i1-IQ3_XS.gguf create mode 100644 Kyro-n1.1-3B.i1-IQ3_XXS.gguf create mode 100644 Kyro-n1.1-3B.i1-IQ4_NL.gguf create mode 100644 Kyro-n1.1-3B.i1-IQ4_XS.gguf create mode 100644 Kyro-n1.1-3B.i1-Q2_K.gguf create mode 100644 Kyro-n1.1-3B.i1-Q2_K_S.gguf create mode 100644 Kyro-n1.1-3B.i1-Q3_K_L.gguf create mode 100644 Kyro-n1.1-3B.i1-Q3_K_M.gguf create mode 100644 Kyro-n1.1-3B.i1-Q3_K_S.gguf create mode 100644 Kyro-n1.1-3B.i1-Q4_0.gguf create mode 100644 Kyro-n1.1-3B.i1-Q4_1.gguf create mode 100644 Kyro-n1.1-3B.i1-Q4_K_M.gguf create mode 100644 Kyro-n1.1-3B.i1-Q4_K_S.gguf create mode 100644 Kyro-n1.1-3B.i1-Q5_K_M.gguf create mode 100644 Kyro-n1.1-3B.i1-Q5_K_S.gguf create mode 100644 Kyro-n1.1-3B.i1-Q6_K.gguf create mode 100644 README.md create mode 100644 imatrix.dat diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..2de2ccc --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +Kyro-n1.1-3B.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +Kyro-n1.1-3B.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +Kyro-n1.1-3B.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +Kyro-n1.1-3B.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +Kyro-n1.1-3B.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +Kyro-n1.1-3B.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Kyro-n1.1-3B.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +Kyro-n1.1-3B.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text +Kyro-n1.1-3B.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +Kyro-n1.1-3B.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Kyro-n1.1-3B.i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +Kyro-n1.1-3B.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +Kyro-n1.1-3B.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +Kyro-n1.1-3B.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Kyro-n1.1-3B.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Kyro-n1.1-3B.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Kyro-n1.1-3B.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Kyro-n1.1-3B.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +Kyro-n1.1-3B.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +Kyro-n1.1-3B.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Kyro-n1.1-3B.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Kyro-n1.1-3B.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Kyro-n1.1-3B.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Kyro-n1.1-3B.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/Kyro-n1.1-3B.i1-IQ1_M.gguf b/Kyro-n1.1-3B.i1-IQ1_M.gguf new file mode 100644 index 0000000..75e20af --- /dev/null +++ b/Kyro-n1.1-3B.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92f000e04bf7c8ddb91f3ba2549c60be7b12279e3f7e1d50017b228322f4af74 +size 850028416 diff --git a/Kyro-n1.1-3B.i1-IQ1_S.gguf b/Kyro-n1.1-3B.i1-IQ1_S.gguf new file mode 100644 index 0000000..203cf21 --- /dev/null +++ b/Kyro-n1.1-3B.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:396049f4bd67fcb1f80e097961def5ee7db133f1c68c7120e1186967535237a9 +size 791095168 diff --git a/Kyro-n1.1-3B.i1-IQ2_M.gguf b/Kyro-n1.1-3B.i1-IQ2_M.gguf new file mode 100644 index 0000000..5a3643f --- /dev/null +++ b/Kyro-n1.1-3B.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc5e8e2e8610431da5bf3df8d52b65cca8b578ab0122854fb12ecae86e0dd12c +size 1140516736 diff --git a/Kyro-n1.1-3B.i1-IQ2_S.gguf b/Kyro-n1.1-3B.i1-IQ2_S.gguf new file mode 100644 index 0000000..7990da7 --- /dev/null +++ b/Kyro-n1.1-3B.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bab58120ded15d64d900e4d5789ebcff412bfa9342b7c6b8270482eafbf9a00a +size 1061939072 diff --git a/Kyro-n1.1-3B.i1-IQ2_XS.gguf b/Kyro-n1.1-3B.i1-IQ2_XS.gguf new file mode 100644 index 0000000..669d37f --- /dev/null +++ b/Kyro-n1.1-3B.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dc187b0b3fa4df86fb679be167ce7753ed898625ba398732ec4220a37aeac63 +size 1031546752 diff --git a/Kyro-n1.1-3B.i1-IQ2_XXS.gguf b/Kyro-n1.1-3B.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..a22b946 --- /dev/null +++ b/Kyro-n1.1-3B.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0525daf710c89ba8f9e2028e762884153d15d6f223cbf909bf7f0e0fc4bbee7e +size 948250496 diff --git a/Kyro-n1.1-3B.i1-IQ3_M.gguf b/Kyro-n1.1-3B.i1-IQ3_M.gguf new file mode 100644 index 0000000..2c2601c --- /dev/null +++ b/Kyro-n1.1-3B.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2fe9318fa1a0f1823c33e53a931b064297468bcd9e244e4457ee5bcde50d70e +size 1488895872 diff --git a/Kyro-n1.1-3B.i1-IQ3_S.gguf b/Kyro-n1.1-3B.i1-IQ3_S.gguf new file mode 100644 index 0000000..7146c81 --- /dev/null +++ b/Kyro-n1.1-3B.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64ae76d43e145e96cdbc0598dce794a3744c95f9568c651c2e37c68f3c636580 +size 1456865152 diff --git a/Kyro-n1.1-3B.i1-IQ3_XS.gguf b/Kyro-n1.1-3B.i1-IQ3_XS.gguf new file mode 100644 index 0000000..c7d160c --- /dev/null +++ b/Kyro-n1.1-3B.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae66966900682482c9c8ad850eb0178403bc4b0e6eaed472ab108cff1d47c2e9 +size 1391837056 diff --git a/Kyro-n1.1-3B.i1-IQ3_XXS.gguf b/Kyro-n1.1-3B.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..9bcb399 --- /dev/null +++ b/Kyro-n1.1-3B.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeaed5cce1ce3edfc912e9e1a5314841299ccf52d58dca8e1177c7cfdab2b7d8 +size 1282828160 diff --git a/Kyro-n1.1-3B.i1-IQ4_NL.gguf b/Kyro-n1.1-3B.i1-IQ4_NL.gguf new file mode 100644 index 0000000..a51d199 --- /dev/null +++ b/Kyro-n1.1-3B.i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70f951dd3c6604ec63a87696072961bdf7e18e03c02c07ca5189f8c89dbeeeb2 +size 1825210240 diff --git a/Kyro-n1.1-3B.i1-IQ4_XS.gguf b/Kyro-n1.1-3B.i1-IQ4_XS.gguf new file mode 100644 index 0000000..4feb886 --- /dev/null +++ b/Kyro-n1.1-3B.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89ce89052c93dfb29ad06e6a886cb74936b3a4ddb6dbdacea67b7353ebb94323 +size 1739095936 diff --git a/Kyro-n1.1-3B.i1-Q2_K.gguf b/Kyro-n1.1-3B.i1-Q2_K.gguf new file mode 100644 index 0000000..9918d98 --- /dev/null +++ b/Kyro-n1.1-3B.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05022907d7b6b2b5e93f8d6ec0083363825c795d701aad46d545541a4f3f7a19 +size 1274756992 diff --git a/Kyro-n1.1-3B.i1-Q2_K_S.gguf b/Kyro-n1.1-3B.i1-Q2_K_S.gguf new file mode 100644 index 0000000..fa4ff73 --- /dev/null +++ b/Kyro-n1.1-3B.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c3e0259122237986dadd2f25cec4742335b88b599614fc83e86223b197458ef +size 1198129024 diff --git a/Kyro-n1.1-3B.i1-Q3_K_L.gguf b/Kyro-n1.1-3B.i1-Q3_K_L.gguf new file mode 100644 index 0000000..50bbc74 --- /dev/null +++ b/Kyro-n1.1-3B.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd5f8cd41ad08c28b622cf067f5350363781b51e8088ef3e8f1cd5b905cdca9a +size 1707392896 diff --git a/Kyro-n1.1-3B.i1-Q3_K_M.gguf b/Kyro-n1.1-3B.i1-Q3_K_M.gguf new file mode 100644 index 0000000..67234ed --- /dev/null +++ b/Kyro-n1.1-3B.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91b244eb25f9b81854ed879b6209f5ff2a5f6119201aa97147498a5cf97e7703 +size 1590476672 diff --git a/Kyro-n1.1-3B.i1-Q3_K_S.gguf b/Kyro-n1.1-3B.i1-Q3_K_S.gguf new file mode 100644 index 0000000..0a7269e --- /dev/null +++ b/Kyro-n1.1-3B.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1433f406bd89d0cc7b6baaca10e38b680fdbd5fa61a7e64850552c9e4f96291 +size 1454358400 diff --git a/Kyro-n1.1-3B.i1-Q4_0.gguf b/Kyro-n1.1-3B.i1-Q4_0.gguf new file mode 100644 index 0000000..382a040 --- /dev/null +++ b/Kyro-n1.1-3B.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ecb3f1b7b066f5882571595a3928eaa5353cfd1b01392a57e3a21ce25dd7d33 +size 1828487040 diff --git a/Kyro-n1.1-3B.i1-Q4_1.gguf b/Kyro-n1.1-3B.i1-Q4_1.gguf new file mode 100644 index 0000000..6a6d901 --- /dev/null +++ b/Kyro-n1.1-3B.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f028fbeddac1aa2430cacb22ea69d1e7c3606f3298f68038467c763738047b6 +size 1996259200 diff --git a/Kyro-n1.1-3B.i1-Q4_K_M.gguf b/Kyro-n1.1-3B.i1-Q4_K_M.gguf new file mode 100644 index 0000000..8950ac3 --- /dev/null +++ b/Kyro-n1.1-3B.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f8ab7218f0687ab621f51d194a91c761b3049d06f6277e125bc698eb4d0aecd +size 1929904000 diff --git a/Kyro-n1.1-3B.i1-Q4_K_S.gguf b/Kyro-n1.1-3B.i1-Q4_K_S.gguf new file mode 100644 index 0000000..09297c3 --- /dev/null +++ b/Kyro-n1.1-3B.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d92d880d76d3825fcd0788d66f83260c61c2b7f95d23b8ca64356c338c921410 +size 1834385280 diff --git a/Kyro-n1.1-3B.i1-Q5_K_M.gguf b/Kyro-n1.1-3B.i1-Q5_K_M.gguf new file mode 100644 index 0000000..50dc580 --- /dev/null +++ b/Kyro-n1.1-3B.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14b0b85689e531244d08d52b0d9d3fcd01df485895db20e7c46d9fff1112e81c +size 2224816000 diff --git a/Kyro-n1.1-3B.i1-Q5_K_S.gguf b/Kyro-n1.1-3B.i1-Q5_K_S.gguf new file mode 100644 index 0000000..cdaaf0b --- /dev/null +++ b/Kyro-n1.1-3B.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b64aa934f9f5bd4a9828f4a6cd25c755a874704e20f5075a0a16bcde9095d8c9 +size 2169667456 diff --git a/Kyro-n1.1-3B.i1-Q6_K.gguf b/Kyro-n1.1-3B.i1-Q6_K.gguf new file mode 100644 index 0000000..fbb6b08 --- /dev/null +++ b/Kyro-n1.1-3B.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec8ce656e91ee7ebf306c880ec9e295b6ef5c2ca2f7ea3405f37ef28beb6d155 +size 2538160000 diff --git a/README.md b/README.md new file mode 100644 index 0000000..b2e7864 --- /dev/null +++ b/README.md @@ -0,0 +1,112 @@ +--- +base_model: open-neo/Kyro-n1.1-3B +language: +- en +- zh +- fr +- es +- pt +- de +- it +- ru +- ja +- ko +- vi +- th +- ar +- fa +- he +- tr +- cs +- pl +- hi +- bn +- ur +- id +- ms +- lo +- my +- ceb +- km +- tl +- nl +library_name: transformers +license: other +license_link: https://huggingface.co/Qwen/Qwen2.5-3B-Instruct/blob/main/LICENSE +license_name: qwen-research +quantized_by: mradermacher +tags: +- reasoning +- kyro +- open-neo +- open-source +- deepseek-r1 +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/open-neo/Kyro-n1.1-3B + + +static quants are available at https://huggingface.co/mradermacher/Kyro-n1.1-3B-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/Kyro-n1.1-3B-i1-GGUF/resolve/main/Kyro-n1.1-3B.i1-IQ1_S.gguf) | i1-IQ1_S | 0.9 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/Kyro-n1.1-3B-i1-GGUF/resolve/main/Kyro-n1.1-3B.i1-IQ1_M.gguf) | i1-IQ1_M | 1.0 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/Kyro-n1.1-3B-i1-GGUF/resolve/main/Kyro-n1.1-3B.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 1.0 | | +| [GGUF](https://huggingface.co/mradermacher/Kyro-n1.1-3B-i1-GGUF/resolve/main/Kyro-n1.1-3B.i1-IQ2_XS.gguf) | i1-IQ2_XS | 1.1 | | +| [GGUF](https://huggingface.co/mradermacher/Kyro-n1.1-3B-i1-GGUF/resolve/main/Kyro-n1.1-3B.i1-IQ2_S.gguf) | i1-IQ2_S | 1.2 | | +| [GGUF](https://huggingface.co/mradermacher/Kyro-n1.1-3B-i1-GGUF/resolve/main/Kyro-n1.1-3B.i1-IQ2_M.gguf) | i1-IQ2_M | 1.2 | | +| [GGUF](https://huggingface.co/mradermacher/Kyro-n1.1-3B-i1-GGUF/resolve/main/Kyro-n1.1-3B.i1-Q2_K_S.gguf) | i1-Q2_K_S | 1.3 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/Kyro-n1.1-3B-i1-GGUF/resolve/main/Kyro-n1.1-3B.i1-Q2_K.gguf) | i1-Q2_K | 1.4 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/Kyro-n1.1-3B-i1-GGUF/resolve/main/Kyro-n1.1-3B.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 1.4 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/Kyro-n1.1-3B-i1-GGUF/resolve/main/Kyro-n1.1-3B.i1-IQ3_XS.gguf) | i1-IQ3_XS | 1.5 | | +| [GGUF](https://huggingface.co/mradermacher/Kyro-n1.1-3B-i1-GGUF/resolve/main/Kyro-n1.1-3B.i1-Q3_K_S.gguf) | i1-Q3_K_S | 1.6 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/Kyro-n1.1-3B-i1-GGUF/resolve/main/Kyro-n1.1-3B.i1-IQ3_S.gguf) | i1-IQ3_S | 1.6 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/Kyro-n1.1-3B-i1-GGUF/resolve/main/Kyro-n1.1-3B.i1-IQ3_M.gguf) | i1-IQ3_M | 1.6 | | +| [GGUF](https://huggingface.co/mradermacher/Kyro-n1.1-3B-i1-GGUF/resolve/main/Kyro-n1.1-3B.i1-Q3_K_M.gguf) | i1-Q3_K_M | 1.7 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/Kyro-n1.1-3B-i1-GGUF/resolve/main/Kyro-n1.1-3B.i1-Q3_K_L.gguf) | i1-Q3_K_L | 1.8 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/Kyro-n1.1-3B-i1-GGUF/resolve/main/Kyro-n1.1-3B.i1-IQ4_XS.gguf) | i1-IQ4_XS | 1.8 | | +| [GGUF](https://huggingface.co/mradermacher/Kyro-n1.1-3B-i1-GGUF/resolve/main/Kyro-n1.1-3B.i1-IQ4_NL.gguf) | i1-IQ4_NL | 1.9 | prefer IQ4_XS | +| [GGUF](https://huggingface.co/mradermacher/Kyro-n1.1-3B-i1-GGUF/resolve/main/Kyro-n1.1-3B.i1-Q4_0.gguf) | i1-Q4_0 | 1.9 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/Kyro-n1.1-3B-i1-GGUF/resolve/main/Kyro-n1.1-3B.i1-Q4_K_S.gguf) | i1-Q4_K_S | 1.9 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/Kyro-n1.1-3B-i1-GGUF/resolve/main/Kyro-n1.1-3B.i1-Q4_K_M.gguf) | i1-Q4_K_M | 2.0 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/Kyro-n1.1-3B-i1-GGUF/resolve/main/Kyro-n1.1-3B.i1-Q4_1.gguf) | i1-Q4_1 | 2.1 | | +| [GGUF](https://huggingface.co/mradermacher/Kyro-n1.1-3B-i1-GGUF/resolve/main/Kyro-n1.1-3B.i1-Q5_K_S.gguf) | i1-Q5_K_S | 2.3 | | +| [GGUF](https://huggingface.co/mradermacher/Kyro-n1.1-3B-i1-GGUF/resolve/main/Kyro-n1.1-3B.i1-Q5_K_M.gguf) | i1-Q5_K_M | 2.3 | | +| [GGUF](https://huggingface.co/mradermacher/Kyro-n1.1-3B-i1-GGUF/resolve/main/Kyro-n1.1-3B.i1-Q6_K.gguf) | i1-Q6_K | 2.6 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..99814fe --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c706555b07ab04129d6b5d8f414211620bf3512cd24c3f8655a446a245b9180 +size 3362977