From 0b2890589ebd2bfba43dba29b9a2e41189153a62 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Sat, 9 May 2026 01:58:02 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mradermacher/AetherDrake-SFT-i1-GGUF Source: Original Platform --- .gitattributes | 60 +++++++++++++++++++++++ AetherDrake-SFT.i1-IQ1_M.gguf | 3 ++ AetherDrake-SFT.i1-IQ1_S.gguf | 3 ++ AetherDrake-SFT.i1-IQ2_M.gguf | 3 ++ AetherDrake-SFT.i1-IQ2_S.gguf | 3 ++ AetherDrake-SFT.i1-IQ2_XS.gguf | 3 ++ AetherDrake-SFT.i1-IQ2_XXS.gguf | 3 ++ AetherDrake-SFT.i1-IQ3_M.gguf | 3 ++ AetherDrake-SFT.i1-IQ3_S.gguf | 3 ++ AetherDrake-SFT.i1-IQ3_XS.gguf | 3 ++ AetherDrake-SFT.i1-IQ3_XXS.gguf | 3 ++ AetherDrake-SFT.i1-IQ4_NL.gguf | 3 ++ AetherDrake-SFT.i1-IQ4_XS.gguf | 3 ++ AetherDrake-SFT.i1-Q2_K.gguf | 3 ++ AetherDrake-SFT.i1-Q2_K_S.gguf | 3 ++ AetherDrake-SFT.i1-Q3_K_L.gguf | 3 ++ AetherDrake-SFT.i1-Q3_K_M.gguf | 3 ++ AetherDrake-SFT.i1-Q3_K_S.gguf | 3 ++ AetherDrake-SFT.i1-Q4_0.gguf | 3 ++ AetherDrake-SFT.i1-Q4_1.gguf | 3 ++ AetherDrake-SFT.i1-Q4_K_M.gguf | 3 ++ AetherDrake-SFT.i1-Q4_K_S.gguf | 3 ++ AetherDrake-SFT.i1-Q5_K_M.gguf | 3 ++ AetherDrake-SFT.i1-Q5_K_S.gguf | 3 ++ AetherDrake-SFT.i1-Q6_K.gguf | 3 ++ README.md | 86 +++++++++++++++++++++++++++++++++ imatrix.dat | 3 ++ 27 files changed, 221 insertions(+) create mode 100644 .gitattributes create mode 100644 AetherDrake-SFT.i1-IQ1_M.gguf create mode 100644 AetherDrake-SFT.i1-IQ1_S.gguf create mode 100644 AetherDrake-SFT.i1-IQ2_M.gguf create mode 100644 AetherDrake-SFT.i1-IQ2_S.gguf create mode 100644 AetherDrake-SFT.i1-IQ2_XS.gguf create mode 100644 AetherDrake-SFT.i1-IQ2_XXS.gguf create mode 100644 AetherDrake-SFT.i1-IQ3_M.gguf create mode 100644 AetherDrake-SFT.i1-IQ3_S.gguf create mode 100644 AetherDrake-SFT.i1-IQ3_XS.gguf create mode 100644 AetherDrake-SFT.i1-IQ3_XXS.gguf create mode 100644 AetherDrake-SFT.i1-IQ4_NL.gguf create mode 100644 AetherDrake-SFT.i1-IQ4_XS.gguf create mode 100644 AetherDrake-SFT.i1-Q2_K.gguf create mode 100644 AetherDrake-SFT.i1-Q2_K_S.gguf create mode 100644 AetherDrake-SFT.i1-Q3_K_L.gguf create mode 100644 AetherDrake-SFT.i1-Q3_K_M.gguf create mode 100644 AetherDrake-SFT.i1-Q3_K_S.gguf create mode 100644 AetherDrake-SFT.i1-Q4_0.gguf create mode 100644 AetherDrake-SFT.i1-Q4_1.gguf create mode 100644 AetherDrake-SFT.i1-Q4_K_M.gguf create mode 100644 AetherDrake-SFT.i1-Q4_K_S.gguf create mode 100644 AetherDrake-SFT.i1-Q5_K_M.gguf create mode 100644 AetherDrake-SFT.i1-Q5_K_S.gguf create mode 100644 AetherDrake-SFT.i1-Q6_K.gguf create mode 100644 README.md create mode 100644 imatrix.dat diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..723a029 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +AetherDrake-SFT.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +AetherDrake-SFT.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +AetherDrake-SFT.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +AetherDrake-SFT.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +AetherDrake-SFT.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +AetherDrake-SFT.i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +AetherDrake-SFT.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +AetherDrake-SFT.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +AetherDrake-SFT.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +AetherDrake-SFT.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +AetherDrake-SFT.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +AetherDrake-SFT.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +AetherDrake-SFT.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +AetherDrake-SFT.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +AetherDrake-SFT.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +AetherDrake-SFT.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +AetherDrake-SFT.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +AetherDrake-SFT.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +AetherDrake-SFT.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +AetherDrake-SFT.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +AetherDrake-SFT.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +AetherDrake-SFT.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +AetherDrake-SFT.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +AetherDrake-SFT.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/AetherDrake-SFT.i1-IQ1_M.gguf b/AetherDrake-SFT.i1-IQ1_M.gguf new file mode 100644 index 0000000..a033414 --- /dev/null +++ b/AetherDrake-SFT.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9615911ce139799e5bb8854548d62f4fbdb4cb3f7a74619e0a48416f4b1a802a +size 2161977760 diff --git a/AetherDrake-SFT.i1-IQ1_S.gguf b/AetherDrake-SFT.i1-IQ1_S.gguf new file mode 100644 index 0000000..62f60bd --- /dev/null +++ b/AetherDrake-SFT.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:855a5f040e7131282aea221c25b98cbc6e7766d011d1eb7d65a6d6ad446c1a85 +size 2019633568 diff --git a/AetherDrake-SFT.i1-IQ2_M.gguf b/AetherDrake-SFT.i1-IQ2_M.gguf new file mode 100644 index 0000000..9d4a8ea --- /dev/null +++ b/AetherDrake-SFT.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddf429cfdf9196567eb623a19f92d34d94d1046cbe06330f408ef096f18f75b6 +size 2948286880 diff --git a/AetherDrake-SFT.i1-IQ2_S.gguf b/AetherDrake-SFT.i1-IQ2_S.gguf new file mode 100644 index 0000000..a7078fb --- /dev/null +++ b/AetherDrake-SFT.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:949b66c20ee98fe05cdcefe20b83806786d60a25a329220efb84eeb38c2aa071 +size 2758494624 diff --git a/AetherDrake-SFT.i1-IQ2_XS.gguf b/AetherDrake-SFT.i1-IQ2_XS.gguf new file mode 100644 index 0000000..e484383 --- /dev/null +++ b/AetherDrake-SFT.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f35849fcbbc30ecfe31b468d596b63124a8808fbae30e5ff78046adf6358b392 +size 2605787552 diff --git a/AetherDrake-SFT.i1-IQ2_XXS.gguf b/AetherDrake-SFT.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..e756c1b --- /dev/null +++ b/AetherDrake-SFT.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:771de9a4c0bd36af78977afcf2d40c2d8330e599280ebd2359fa9ff9a7201097 +size 2399218080 diff --git a/AetherDrake-SFT.i1-IQ3_M.gguf b/AetherDrake-SFT.i1-IQ3_M.gguf new file mode 100644 index 0000000..f0c0543 --- /dev/null +++ b/AetherDrake-SFT.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:350082b372893fec87f414e8a29e3331ea70aa495047c0240bfe408048147abf +size 3784829344 diff --git a/AetherDrake-SFT.i1-IQ3_S.gguf b/AetherDrake-SFT.i1-IQ3_S.gguf new file mode 100644 index 0000000..8fabb93 --- /dev/null +++ b/AetherDrake-SFT.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc6fe34714907ead7a7913d79d081b38df0ad0c3bd55f39e64c79ae19bf9ac41 +size 3682331040 diff --git a/AetherDrake-SFT.i1-IQ3_XS.gguf b/AetherDrake-SFT.i1-IQ3_XS.gguf new file mode 100644 index 0000000..94e6b27 --- /dev/null +++ b/AetherDrake-SFT.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00b965b451b178f4eae5befd30a912a69e13d444cd07f1397291e90ae2146d09 +size 3518753184 diff --git a/AetherDrake-SFT.i1-IQ3_XXS.gguf b/AetherDrake-SFT.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..a105b31 --- /dev/null +++ b/AetherDrake-SFT.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65df67b3fb4fa2f496a8bad54933819a98ae254dea1f4f55a8d6947ca2bf6bb6 +size 3274918304 diff --git a/AetherDrake-SFT.i1-IQ4_NL.gguf b/AetherDrake-SFT.i1-IQ4_NL.gguf new file mode 100644 index 0000000..1218e3e --- /dev/null +++ b/AetherDrake-SFT.i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4518656880b9db994a59c44e07bd0ee5bec2d746e69cb4f5dce720182a04eee2 +size 4677994912 diff --git a/AetherDrake-SFT.i1-IQ4_XS.gguf b/AetherDrake-SFT.i1-IQ4_XS.gguf new file mode 100644 index 0000000..3adfefb --- /dev/null +++ b/AetherDrake-SFT.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d34e0056c1472459313f57dcf87282f1f88f2a48cb6d325992bb8afcd52c98a +size 4447668640 diff --git a/AetherDrake-SFT.i1-Q2_K.gguf b/AetherDrake-SFT.i1-Q2_K.gguf new file mode 100644 index 0000000..5de0c2f --- /dev/null +++ b/AetherDrake-SFT.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:354ec81be08884fd645fde8a2b25ace366b9ad583c00c33b92bd5def990d602d +size 3179137440 diff --git a/AetherDrake-SFT.i1-Q2_K_S.gguf b/AetherDrake-SFT.i1-Q2_K_S.gguf new file mode 100644 index 0000000..54cd429 --- /dev/null +++ b/AetherDrake-SFT.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fc2ea2db5f987b3e27045581df99fbf833fc096d4ceffcde91d62f02fa55b6d +size 2988820896 diff --git a/AetherDrake-SFT.i1-Q3_K_L.gguf b/AetherDrake-SFT.i1-Q3_K_L.gguf new file mode 100644 index 0000000..2447a91 --- /dev/null +++ b/AetherDrake-SFT.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d0ba1b6acff70b9c94d77ea67c4e061bdc9d4557aa8d1c5d9f60b93100656a9 +size 4321962400 diff --git a/AetherDrake-SFT.i1-Q3_K_M.gguf b/AetherDrake-SFT.i1-Q3_K_M.gguf new file mode 100644 index 0000000..c4e37fc --- /dev/null +++ b/AetherDrake-SFT.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a71ceb221373fa93021b1f6debee4868d390cc1c9ab45988c982949cab798cf1 +size 4018923936 diff --git a/AetherDrake-SFT.i1-Q3_K_S.gguf b/AetherDrake-SFT.i1-Q3_K_S.gguf new file mode 100644 index 0000000..d338e53 --- /dev/null +++ b/AetherDrake-SFT.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cba603994826109efdfed9589b29a3bce0a840924e117f4bc7a4ac27eaf1657 +size 3664505248 diff --git a/AetherDrake-SFT.i1-Q4_0.gguf b/AetherDrake-SFT.i1-Q4_0.gguf new file mode 100644 index 0000000..9f0b25c --- /dev/null +++ b/AetherDrake-SFT.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:696efd0e16b5b284aa1826329df0a4a166777171a64f1c075d33f8eba27bffcf +size 4675897760 diff --git a/AetherDrake-SFT.i1-Q4_1.gguf b/AetherDrake-SFT.i1-Q4_1.gguf new file mode 100644 index 0000000..371600c --- /dev/null +++ b/AetherDrake-SFT.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:714083381dd752235faafcbfc1f2ffd7faa4f83e31a219e2ebc7f40734365491 +size 5130258848 diff --git a/AetherDrake-SFT.i1-Q4_K_M.gguf b/AetherDrake-SFT.i1-Q4_K_M.gguf new file mode 100644 index 0000000..29e9dc8 --- /dev/null +++ b/AetherDrake-SFT.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e528434e3fd27b2fad06b887274aaae98d5212a9a5c0a1ae88a9008e43078e00 +size 4920740256 diff --git a/AetherDrake-SFT.i1-Q4_K_S.gguf b/AetherDrake-SFT.i1-Q4_K_S.gguf new file mode 100644 index 0000000..c0ee4a1 --- /dev/null +++ b/AetherDrake-SFT.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18dc154573d6f3ec0badfbd2877d56457114982ce1ec340b173266d88cfe8d70 +size 4692674976 diff --git a/AetherDrake-SFT.i1-Q5_K_M.gguf b/AetherDrake-SFT.i1-Q5_K_M.gguf new file mode 100644 index 0000000..a8479af --- /dev/null +++ b/AetherDrake-SFT.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:150562fe9f608b0b6779b592101c9a0c88fd260795fa6a494393f3f6997c1f89 +size 5732993440 diff --git a/AetherDrake-SFT.i1-Q5_K_S.gguf b/AetherDrake-SFT.i1-Q5_K_S.gguf new file mode 100644 index 0000000..266857b --- /dev/null +++ b/AetherDrake-SFT.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:378609b2c8ba0f740807ccc4489e43ce0cb4cf142c117e273e0d232240d7d0b5 +size 5599300000 diff --git a/AetherDrake-SFT.i1-Q6_K.gguf b/AetherDrake-SFT.i1-Q6_K.gguf new file mode 100644 index 0000000..325f9ee --- /dev/null +++ b/AetherDrake-SFT.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21e92547515ea4f6bd7837ea00173658d1462826b9a66879ee0e4978924ed84b +size 6596012448 diff --git a/README.md b/README.md new file mode 100644 index 0000000..7744fb1 --- /dev/null +++ b/README.md @@ -0,0 +1,86 @@ +--- +base_model: Daemontatox/AetherDrake-SFT +datasets: +- Daemontatox/LongCOT-Reason +language: +- en +library_name: transformers +license: apache-2.0 +quantized_by: mradermacher +tags: +- text-generation-inference +- transformers +- unsloth +- Llama3 +- trl +- COT +- Reasoning +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/Daemontatox/AetherDrake-SFT + + +static quants are available at https://huggingface.co/mradermacher/AetherDrake-SFT-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/AetherDrake-SFT-i1-GGUF/resolve/main/AetherDrake-SFT.i1-IQ1_S.gguf) | i1-IQ1_S | 2.1 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/AetherDrake-SFT-i1-GGUF/resolve/main/AetherDrake-SFT.i1-IQ1_M.gguf) | i1-IQ1_M | 2.3 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/AetherDrake-SFT-i1-GGUF/resolve/main/AetherDrake-SFT.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 2.5 | | +| [GGUF](https://huggingface.co/mradermacher/AetherDrake-SFT-i1-GGUF/resolve/main/AetherDrake-SFT.i1-IQ2_XS.gguf) | i1-IQ2_XS | 2.7 | | +| [GGUF](https://huggingface.co/mradermacher/AetherDrake-SFT-i1-GGUF/resolve/main/AetherDrake-SFT.i1-IQ2_S.gguf) | i1-IQ2_S | 2.9 | | +| [GGUF](https://huggingface.co/mradermacher/AetherDrake-SFT-i1-GGUF/resolve/main/AetherDrake-SFT.i1-IQ2_M.gguf) | i1-IQ2_M | 3.0 | | +| [GGUF](https://huggingface.co/mradermacher/AetherDrake-SFT-i1-GGUF/resolve/main/AetherDrake-SFT.i1-Q2_K_S.gguf) | i1-Q2_K_S | 3.1 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/AetherDrake-SFT-i1-GGUF/resolve/main/AetherDrake-SFT.i1-Q2_K.gguf) | i1-Q2_K | 3.3 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/AetherDrake-SFT-i1-GGUF/resolve/main/AetherDrake-SFT.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 3.4 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/AetherDrake-SFT-i1-GGUF/resolve/main/AetherDrake-SFT.i1-IQ3_XS.gguf) | i1-IQ3_XS | 3.6 | | +| [GGUF](https://huggingface.co/mradermacher/AetherDrake-SFT-i1-GGUF/resolve/main/AetherDrake-SFT.i1-Q3_K_S.gguf) | i1-Q3_K_S | 3.8 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/AetherDrake-SFT-i1-GGUF/resolve/main/AetherDrake-SFT.i1-IQ3_S.gguf) | i1-IQ3_S | 3.8 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/AetherDrake-SFT-i1-GGUF/resolve/main/AetherDrake-SFT.i1-IQ3_M.gguf) | i1-IQ3_M | 3.9 | | +| [GGUF](https://huggingface.co/mradermacher/AetherDrake-SFT-i1-GGUF/resolve/main/AetherDrake-SFT.i1-Q3_K_M.gguf) | i1-Q3_K_M | 4.1 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/AetherDrake-SFT-i1-GGUF/resolve/main/AetherDrake-SFT.i1-Q3_K_L.gguf) | i1-Q3_K_L | 4.4 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/AetherDrake-SFT-i1-GGUF/resolve/main/AetherDrake-SFT.i1-IQ4_XS.gguf) | i1-IQ4_XS | 4.5 | | +| [GGUF](https://huggingface.co/mradermacher/AetherDrake-SFT-i1-GGUF/resolve/main/AetherDrake-SFT.i1-Q4_0.gguf) | i1-Q4_0 | 4.8 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/AetherDrake-SFT-i1-GGUF/resolve/main/AetherDrake-SFT.i1-IQ4_NL.gguf) | i1-IQ4_NL | 4.8 | prefer IQ4_XS | +| [GGUF](https://huggingface.co/mradermacher/AetherDrake-SFT-i1-GGUF/resolve/main/AetherDrake-SFT.i1-Q4_K_S.gguf) | i1-Q4_K_S | 4.8 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/AetherDrake-SFT-i1-GGUF/resolve/main/AetherDrake-SFT.i1-Q4_K_M.gguf) | i1-Q4_K_M | 5.0 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/AetherDrake-SFT-i1-GGUF/resolve/main/AetherDrake-SFT.i1-Q4_1.gguf) | i1-Q4_1 | 5.2 | | +| [GGUF](https://huggingface.co/mradermacher/AetherDrake-SFT-i1-GGUF/resolve/main/AetherDrake-SFT.i1-Q5_K_S.gguf) | i1-Q5_K_S | 5.7 | | +| [GGUF](https://huggingface.co/mradermacher/AetherDrake-SFT-i1-GGUF/resolve/main/AetherDrake-SFT.i1-Q5_K_M.gguf) | i1-Q5_K_M | 5.8 | | +| [GGUF](https://huggingface.co/mradermacher/AetherDrake-SFT-i1-GGUF/resolve/main/AetherDrake-SFT.i1-Q6_K.gguf) | i1-Q6_K | 6.7 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..de65352 --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff28b1e7de07c0cf2451913a71f68aa41e6cd2c6c971c94a63b34e52b29f0587 +size 4988157