From 0b8a56a75aeb27ad6277b123d2e3bb17f96a7d8b Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Mon, 4 May 2026 16:55:46 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mradermacher/Komodo-Llama-3.2-3B-v2-fp16-i1-GGUF Source: Original Platform --- .gitattributes | 60 +++++++++++++ Komodo-Llama-3.2-3B-v2-fp16.i1-IQ1_M.gguf | 3 + Komodo-Llama-3.2-3B-v2-fp16.i1-IQ1_S.gguf | 3 + Komodo-Llama-3.2-3B-v2-fp16.i1-IQ2_M.gguf | 3 + Komodo-Llama-3.2-3B-v2-fp16.i1-IQ2_S.gguf | 3 + Komodo-Llama-3.2-3B-v2-fp16.i1-IQ2_XS.gguf | 3 + Komodo-Llama-3.2-3B-v2-fp16.i1-IQ2_XXS.gguf | 3 + Komodo-Llama-3.2-3B-v2-fp16.i1-IQ3_M.gguf | 3 + Komodo-Llama-3.2-3B-v2-fp16.i1-IQ3_S.gguf | 3 + Komodo-Llama-3.2-3B-v2-fp16.i1-IQ3_XS.gguf | 3 + Komodo-Llama-3.2-3B-v2-fp16.i1-IQ3_XXS.gguf | 3 + Komodo-Llama-3.2-3B-v2-fp16.i1-IQ4_XS.gguf | 3 + Komodo-Llama-3.2-3B-v2-fp16.i1-Q2_K.gguf | 3 + Komodo-Llama-3.2-3B-v2-fp16.i1-Q3_K_L.gguf | 3 + Komodo-Llama-3.2-3B-v2-fp16.i1-Q3_K_M.gguf | 3 + Komodo-Llama-3.2-3B-v2-fp16.i1-Q3_K_S.gguf | 3 + Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_0.gguf | 3 + Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_0_4_4.gguf | 3 + Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_0_4_8.gguf | 3 + Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_0_8_8.gguf | 3 + Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_K_M.gguf | 3 + Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_K_S.gguf | 3 + Komodo-Llama-3.2-3B-v2-fp16.i1-Q5_K_M.gguf | 3 + Komodo-Llama-3.2-3B-v2-fp16.i1-Q5_K_S.gguf | 3 + Komodo-Llama-3.2-3B-v2-fp16.i1-Q6_K.gguf | 3 + README.md | 90 ++++++++++++++++++++ imatrix.dat | 3 + 27 files changed, 225 insertions(+) create mode 100644 .gitattributes create mode 100644 Komodo-Llama-3.2-3B-v2-fp16.i1-IQ1_M.gguf create mode 100644 Komodo-Llama-3.2-3B-v2-fp16.i1-IQ1_S.gguf create mode 100644 Komodo-Llama-3.2-3B-v2-fp16.i1-IQ2_M.gguf create mode 100644 Komodo-Llama-3.2-3B-v2-fp16.i1-IQ2_S.gguf create mode 100644 Komodo-Llama-3.2-3B-v2-fp16.i1-IQ2_XS.gguf create mode 100644 Komodo-Llama-3.2-3B-v2-fp16.i1-IQ2_XXS.gguf create mode 100644 Komodo-Llama-3.2-3B-v2-fp16.i1-IQ3_M.gguf create mode 100644 Komodo-Llama-3.2-3B-v2-fp16.i1-IQ3_S.gguf create mode 100644 Komodo-Llama-3.2-3B-v2-fp16.i1-IQ3_XS.gguf create mode 100644 Komodo-Llama-3.2-3B-v2-fp16.i1-IQ3_XXS.gguf create mode 100644 Komodo-Llama-3.2-3B-v2-fp16.i1-IQ4_XS.gguf create mode 100644 Komodo-Llama-3.2-3B-v2-fp16.i1-Q2_K.gguf create mode 100644 Komodo-Llama-3.2-3B-v2-fp16.i1-Q3_K_L.gguf create mode 100644 Komodo-Llama-3.2-3B-v2-fp16.i1-Q3_K_M.gguf create mode 100644 Komodo-Llama-3.2-3B-v2-fp16.i1-Q3_K_S.gguf create mode 100644 Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_0.gguf create mode 100644 Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_0_4_4.gguf create mode 100644 Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_0_4_8.gguf create mode 100644 Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_0_8_8.gguf create mode 100644 Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_K_M.gguf create mode 100644 Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_K_S.gguf create mode 100644 Komodo-Llama-3.2-3B-v2-fp16.i1-Q5_K_M.gguf create mode 100644 Komodo-Llama-3.2-3B-v2-fp16.i1-Q5_K_S.gguf create mode 100644 Komodo-Llama-3.2-3B-v2-fp16.i1-Q6_K.gguf create mode 100644 README.md create mode 100644 imatrix.dat diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..3252cfc --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +Komodo-Llama-3.2-3B-v2-fp16.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +Komodo-Llama-3.2-3B-v2-fp16.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Komodo-Llama-3.2-3B-v2-fp16.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Komodo-Llama-3.2-3B-v2-fp16.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Komodo-Llama-3.2-3B-v2-fp16.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +Komodo-Llama-3.2-3B-v2-fp16.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +Komodo-Llama-3.2-3B-v2-fp16.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +Komodo-Llama-3.2-3B-v2-fp16.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +Komodo-Llama-3.2-3B-v2-fp16.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Komodo-Llama-3.2-3B-v2-fp16.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Komodo-Llama-3.2-3B-v2-fp16.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Komodo-Llama-3.2-3B-v2-fp16.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +Komodo-Llama-3.2-3B-v2-fp16.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Komodo-Llama-3.2-3B-v2-fp16.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_0_4_4.gguf filter=lfs diff=lfs merge=lfs -text +Komodo-Llama-3.2-3B-v2-fp16.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +Komodo-Llama-3.2-3B-v2-fp16.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +Komodo-Llama-3.2-3B-v2-fp16.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_0_4_8.gguf filter=lfs diff=lfs merge=lfs -text +Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_0_8_8.gguf filter=lfs diff=lfs merge=lfs -text +Komodo-Llama-3.2-3B-v2-fp16.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ1_M.gguf b/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ1_M.gguf new file mode 100644 index 0000000..69419e3 --- /dev/null +++ b/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f084d28ef1c95df7a414321629635ccfa9774e415a828fcd604b19b551a626b0 +size 924192320 diff --git a/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ1_S.gguf b/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ1_S.gguf new file mode 100644 index 0000000..6fc8ddf --- /dev/null +++ b/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6011425c399c601509b5e6719ce8d0381e2c11b37707e06a4524ffaf4447280 +size 868159040 diff --git a/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ2_M.gguf b/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ2_M.gguf new file mode 100644 index 0000000..cc01898 --- /dev/null +++ b/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dee27782d653461f2dc68565c3fa25c62c78e88284450c642f05549e942c5cf5 +size 1229033024 diff --git a/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ2_S.gguf b/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ2_S.gguf new file mode 100644 index 0000000..bcaa969 --- /dev/null +++ b/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b073add7e0d17ab9f0c095047bb429b58ba716db30c9aa40fbf9685122c3eef +size 1154321984 diff --git a/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ2_XS.gguf b/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ2_XS.gguf new file mode 100644 index 0000000..456e932 --- /dev/null +++ b/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f884e56abc24b00cce7c8d30ddb37305d1b28984531a17634ea1f9abb009ca88 +size 1100549696 diff --git a/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ2_XXS.gguf b/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..82a6234 --- /dev/null +++ b/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c92946c926c0b0a4aaa20adbdd27660ed43ddf59e0997970a1b718559ef17ab4 +size 1017581120 diff --git a/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ3_M.gguf b/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ3_M.gguf new file mode 100644 index 0000000..c81bce5 --- /dev/null +++ b/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcd880610bf494c9007e4d64af85001d214039d7d27e08fee3d2dfb41e89eb04 +size 1599669824 diff --git a/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ3_S.gguf b/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ3_S.gguf new file mode 100644 index 0000000..6b5f3c0 --- /dev/null +++ b/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76a6db4ef743f5b74b9420ff83a82ed3ed998f76b4aa020e086c3bf98fb69b10 +size 1542850112 diff --git a/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ3_XS.gguf b/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ3_XS.gguf new file mode 100644 index 0000000..76ac116 --- /dev/null +++ b/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab10918c2e7eb6a52f2cba780786507ab314875ce9fb011c048b74cdd7cda65f +size 1476789824 diff --git a/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ3_XXS.gguf b/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..13fb56d --- /dev/null +++ b/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58ccb9d8f82b0f53707c3850ea1476db575e59007c8829d3c5fa74b9532127fa +size 1348767296 diff --git a/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ4_XS.gguf b/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ4_XS.gguf new file mode 100644 index 0000000..11a8c0b --- /dev/null +++ b/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16c5e5f2584c60e83961b8853d14f4f381c9d11166f66eacf85944b1b6d4f232 +size 1829111360 diff --git a/Komodo-Llama-3.2-3B-v2-fp16.i1-Q2_K.gguf b/Komodo-Llama-3.2-3B-v2-fp16.i1-Q2_K.gguf new file mode 100644 index 0000000..8976feb --- /dev/null +++ b/Komodo-Llama-3.2-3B-v2-fp16.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e72b1eabd35da777b9ce91b60374a9d70b83984e1a740ffa1f145290598b32a +size 1363936832 diff --git a/Komodo-Llama-3.2-3B-v2-fp16.i1-Q3_K_L.gguf b/Komodo-Llama-3.2-3B-v2-fp16.i1-Q3_K_L.gguf new file mode 100644 index 0000000..6930970 --- /dev/null +++ b/Komodo-Llama-3.2-3B-v2-fp16.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:136e6bc38788013b69b52b528263b771a90432b14ef8e0b57214191a92299098 +size 1815348800 diff --git a/Komodo-Llama-3.2-3B-v2-fp16.i1-Q3_K_M.gguf b/Komodo-Llama-3.2-3B-v2-fp16.i1-Q3_K_M.gguf new file mode 100644 index 0000000..c80be79 --- /dev/null +++ b/Komodo-Llama-3.2-3B-v2-fp16.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd57e70f0e0a26c89e436ea88a6e2d493877ac21c33b2fa81e0dfad16d846dba +size 1687160384 diff --git a/Komodo-Llama-3.2-3B-v2-fp16.i1-Q3_K_S.gguf b/Komodo-Llama-3.2-3B-v2-fp16.i1-Q3_K_S.gguf new file mode 100644 index 0000000..017fe44 --- /dev/null +++ b/Komodo-Llama-3.2-3B-v2-fp16.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73a169b708a921e3fbbd8f2a0d078d4eb937c318052b0017a000498033f75648 +size 1542850112 diff --git a/Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_0.gguf b/Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_0.gguf new file mode 100644 index 0000000..3786a67 --- /dev/null +++ b/Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b903d557c22e8fe4cd3016287a255300bc78db242104f07d87378e0dfcb8b65 +size 1921910336 diff --git a/Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_0_4_4.gguf b/Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_0_4_4.gguf new file mode 100644 index 0000000..e465607 --- /dev/null +++ b/Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_0_4_4.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0faede2822b5245e40007715e782fadf91a1e5734c9198942a8ea39618b1bd7 +size 1917191744 diff --git a/Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_0_4_8.gguf b/Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_0_4_8.gguf new file mode 100644 index 0000000..fc92c68 --- /dev/null +++ b/Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_0_4_8.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2a65593c85dcd739598106e8bc8e31c56bff24559aa0f5c18dc99011d6147cb +size 1917191744 diff --git a/Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_0_8_8.gguf b/Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_0_8_8.gguf new file mode 100644 index 0000000..3e52b1a --- /dev/null +++ b/Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_0_8_8.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5008823495431f06e37491436500ef6b61f426de59b1428f5ed809edbef5ad10 +size 1917191744 diff --git a/Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_K_M.gguf b/Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_K_M.gguf new file mode 100644 index 0000000..d447076 --- /dev/null +++ b/Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a98a59217c4e813a741390da1a04c4b26d1e45e41fab21c9762faa18acb5d0b +size 2019378752 diff --git a/Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_K_S.gguf b/Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_K_S.gguf new file mode 100644 index 0000000..f22c22d --- /dev/null +++ b/Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efbc0266174868213988888d30474b369f186973ddc4e8352290482836630d01 +size 1928201792 diff --git a/Komodo-Llama-3.2-3B-v2-fp16.i1-Q5_K_M.gguf b/Komodo-Llama-3.2-3B-v2-fp16.i1-Q5_K_M.gguf new file mode 100644 index 0000000..190639a --- /dev/null +++ b/Komodo-Llama-3.2-3B-v2-fp16.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8066116845e1255766206356b60a4c3b745a41d4c5216d2e0a8ed1df7f52c507 +size 2322155072 diff --git a/Komodo-Llama-3.2-3B-v2-fp16.i1-Q5_K_S.gguf b/Komodo-Llama-3.2-3B-v2-fp16.i1-Q5_K_S.gguf new file mode 100644 index 0000000..3cbe9af --- /dev/null +++ b/Komodo-Llama-3.2-3B-v2-fp16.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d81ea5b445870ea33c72b2d5e7374464a6e835363341ce1c8649906526d073fd +size 2269513280 diff --git a/Komodo-Llama-3.2-3B-v2-fp16.i1-Q6_K.gguf b/Komodo-Llama-3.2-3B-v2-fp16.i1-Q6_K.gguf new file mode 100644 index 0000000..407b1ef --- /dev/null +++ b/Komodo-Llama-3.2-3B-v2-fp16.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca7c1d191d5c688e02982b5bc33a0a59fc218fd113a58465adc87fda4b9f0e74 +size 2643854912 diff --git a/README.md b/README.md new file mode 100644 index 0000000..9b86be0 --- /dev/null +++ b/README.md @@ -0,0 +1,90 @@ +--- +base_model: suayptalha/Komodo-Llama-3.2-3B-v2-fp16 +datasets: +- jeggers/competition_math +language: +- en +- th +- pt +- es +- de +- fr +- it +- hi +library_name: transformers +license: apache-2.0 +quantized_by: mradermacher +tags: +- unsloth +- trl +- sft +- text-generation-inference +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/suayptalha/Komodo-Llama-3.2-3B-v2-fp16 + + +static quants are available at https://huggingface.co/mradermacher/Komodo-Llama-3.2-3B-v2-fp16-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/Komodo-Llama-3.2-3B-v2-fp16-i1-GGUF/resolve/main/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ1_S.gguf) | i1-IQ1_S | 1.0 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/Komodo-Llama-3.2-3B-v2-fp16-i1-GGUF/resolve/main/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ1_M.gguf) | i1-IQ1_M | 1.0 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/Komodo-Llama-3.2-3B-v2-fp16-i1-GGUF/resolve/main/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 1.1 | | +| [GGUF](https://huggingface.co/mradermacher/Komodo-Llama-3.2-3B-v2-fp16-i1-GGUF/resolve/main/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ2_XS.gguf) | i1-IQ2_XS | 1.2 | | +| [GGUF](https://huggingface.co/mradermacher/Komodo-Llama-3.2-3B-v2-fp16-i1-GGUF/resolve/main/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ2_S.gguf) | i1-IQ2_S | 1.3 | | +| [GGUF](https://huggingface.co/mradermacher/Komodo-Llama-3.2-3B-v2-fp16-i1-GGUF/resolve/main/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ2_M.gguf) | i1-IQ2_M | 1.3 | | +| [GGUF](https://huggingface.co/mradermacher/Komodo-Llama-3.2-3B-v2-fp16-i1-GGUF/resolve/main/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 1.4 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/Komodo-Llama-3.2-3B-v2-fp16-i1-GGUF/resolve/main/Komodo-Llama-3.2-3B-v2-fp16.i1-Q2_K.gguf) | i1-Q2_K | 1.5 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/Komodo-Llama-3.2-3B-v2-fp16-i1-GGUF/resolve/main/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ3_XS.gguf) | i1-IQ3_XS | 1.6 | | +| [GGUF](https://huggingface.co/mradermacher/Komodo-Llama-3.2-3B-v2-fp16-i1-GGUF/resolve/main/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ3_S.gguf) | i1-IQ3_S | 1.6 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/Komodo-Llama-3.2-3B-v2-fp16-i1-GGUF/resolve/main/Komodo-Llama-3.2-3B-v2-fp16.i1-Q3_K_S.gguf) | i1-Q3_K_S | 1.6 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/Komodo-Llama-3.2-3B-v2-fp16-i1-GGUF/resolve/main/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ3_M.gguf) | i1-IQ3_M | 1.7 | | +| [GGUF](https://huggingface.co/mradermacher/Komodo-Llama-3.2-3B-v2-fp16-i1-GGUF/resolve/main/Komodo-Llama-3.2-3B-v2-fp16.i1-Q3_K_M.gguf) | i1-Q3_K_M | 1.8 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/Komodo-Llama-3.2-3B-v2-fp16-i1-GGUF/resolve/main/Komodo-Llama-3.2-3B-v2-fp16.i1-Q3_K_L.gguf) | i1-Q3_K_L | 1.9 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/Komodo-Llama-3.2-3B-v2-fp16-i1-GGUF/resolve/main/Komodo-Llama-3.2-3B-v2-fp16.i1-IQ4_XS.gguf) | i1-IQ4_XS | 1.9 | | +| [GGUF](https://huggingface.co/mradermacher/Komodo-Llama-3.2-3B-v2-fp16-i1-GGUF/resolve/main/Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_0_4_4.gguf) | i1-Q4_0_4_4 | 2.0 | fast on arm, low quality | +| [GGUF](https://huggingface.co/mradermacher/Komodo-Llama-3.2-3B-v2-fp16-i1-GGUF/resolve/main/Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_0_4_8.gguf) | i1-Q4_0_4_8 | 2.0 | fast on arm+i8mm, low quality | +| [GGUF](https://huggingface.co/mradermacher/Komodo-Llama-3.2-3B-v2-fp16-i1-GGUF/resolve/main/Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_0_8_8.gguf) | i1-Q4_0_8_8 | 2.0 | fast on arm+sve, low quality | +| [GGUF](https://huggingface.co/mradermacher/Komodo-Llama-3.2-3B-v2-fp16-i1-GGUF/resolve/main/Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_0.gguf) | i1-Q4_0 | 2.0 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/Komodo-Llama-3.2-3B-v2-fp16-i1-GGUF/resolve/main/Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_K_S.gguf) | i1-Q4_K_S | 2.0 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/Komodo-Llama-3.2-3B-v2-fp16-i1-GGUF/resolve/main/Komodo-Llama-3.2-3B-v2-fp16.i1-Q4_K_M.gguf) | i1-Q4_K_M | 2.1 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/Komodo-Llama-3.2-3B-v2-fp16-i1-GGUF/resolve/main/Komodo-Llama-3.2-3B-v2-fp16.i1-Q5_K_S.gguf) | i1-Q5_K_S | 2.4 | | +| [GGUF](https://huggingface.co/mradermacher/Komodo-Llama-3.2-3B-v2-fp16-i1-GGUF/resolve/main/Komodo-Llama-3.2-3B-v2-fp16.i1-Q5_K_M.gguf) | i1-Q5_K_M | 2.4 | | +| [GGUF](https://huggingface.co/mradermacher/Komodo-Llama-3.2-3B-v2-fp16-i1-GGUF/resolve/main/Komodo-Llama-3.2-3B-v2-fp16.i1-Q6_K.gguf) | i1-Q6_K | 2.7 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..4d6e91f --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c60b392cc7b3ccdf57bf8cec7ac7e8ef37fa1cd732069ec32c9c4c3367f47cca +size 2988377