From d0d3c752624503ea9ae6472a0f75fb70b09c9914 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Sun, 12 Apr 2026 21:40:56 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mradermacher/Apollo2-0.5B-i1-GGUF Source: Original Platform --- .gitattributes | 60 +++++++++++++++++ Apollo2-0.5B.i1-IQ1_M.gguf | 3 + Apollo2-0.5B.i1-IQ1_S.gguf | 3 + Apollo2-0.5B.i1-IQ2_M.gguf | 3 + Apollo2-0.5B.i1-IQ2_S.gguf | 3 + Apollo2-0.5B.i1-IQ2_XS.gguf | 3 + Apollo2-0.5B.i1-IQ2_XXS.gguf | 3 + Apollo2-0.5B.i1-IQ3_M.gguf | 3 + Apollo2-0.5B.i1-IQ3_S.gguf | 3 + Apollo2-0.5B.i1-IQ3_XS.gguf | 3 + Apollo2-0.5B.i1-IQ3_XXS.gguf | 3 + Apollo2-0.5B.i1-IQ4_NL.gguf | 3 + Apollo2-0.5B.i1-IQ4_XS.gguf | 3 + Apollo2-0.5B.i1-Q2_K.gguf | 3 + Apollo2-0.5B.i1-Q2_K_S.gguf | 3 + Apollo2-0.5B.i1-Q3_K_L.gguf | 3 + Apollo2-0.5B.i1-Q3_K_M.gguf | 3 + Apollo2-0.5B.i1-Q3_K_S.gguf | 3 + Apollo2-0.5B.i1-Q4_0.gguf | 3 + Apollo2-0.5B.i1-Q4_1.gguf | 3 + Apollo2-0.5B.i1-Q4_K_M.gguf | 3 + Apollo2-0.5B.i1-Q4_K_S.gguf | 3 + Apollo2-0.5B.i1-Q5_K_M.gguf | 3 + Apollo2-0.5B.i1-Q5_K_S.gguf | 3 + Apollo2-0.5B.i1-Q6_K.gguf | 3 + README.md | 123 +++++++++++++++++++++++++++++++++++ imatrix.dat | 3 + 27 files changed, 258 insertions(+) create mode 100644 .gitattributes create mode 100644 Apollo2-0.5B.i1-IQ1_M.gguf create mode 100644 Apollo2-0.5B.i1-IQ1_S.gguf create mode 100644 Apollo2-0.5B.i1-IQ2_M.gguf create mode 100644 Apollo2-0.5B.i1-IQ2_S.gguf create mode 100644 Apollo2-0.5B.i1-IQ2_XS.gguf create mode 100644 Apollo2-0.5B.i1-IQ2_XXS.gguf create mode 100644 Apollo2-0.5B.i1-IQ3_M.gguf create mode 100644 Apollo2-0.5B.i1-IQ3_S.gguf create mode 100644 Apollo2-0.5B.i1-IQ3_XS.gguf create mode 100644 Apollo2-0.5B.i1-IQ3_XXS.gguf create mode 100644 Apollo2-0.5B.i1-IQ4_NL.gguf create mode 100644 
Apollo2-0.5B.i1-IQ4_XS.gguf create mode 100644 Apollo2-0.5B.i1-Q2_K.gguf create mode 100644 Apollo2-0.5B.i1-Q2_K_S.gguf create mode 100644 Apollo2-0.5B.i1-Q3_K_L.gguf create mode 100644 Apollo2-0.5B.i1-Q3_K_M.gguf create mode 100644 Apollo2-0.5B.i1-Q3_K_S.gguf create mode 100644 Apollo2-0.5B.i1-Q4_0.gguf create mode 100644 Apollo2-0.5B.i1-Q4_1.gguf create mode 100644 Apollo2-0.5B.i1-Q4_K_M.gguf create mode 100644 Apollo2-0.5B.i1-Q4_K_S.gguf create mode 100644 Apollo2-0.5B.i1-Q5_K_M.gguf create mode 100644 Apollo2-0.5B.i1-Q5_K_S.gguf create mode 100644 Apollo2-0.5B.i1-Q6_K.gguf create mode 100644 README.md create mode 100644 imatrix.dat diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..5f18b62 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar 
filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +Apollo2-0.5B.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +Apollo2-0.5B.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +Apollo2-0.5B.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +Apollo2-0.5B.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +Apollo2-0.5B.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +Apollo2-0.5B.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Apollo2-0.5B.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +Apollo2-0.5B.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text +Apollo2-0.5B.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +Apollo2-0.5B.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Apollo2-0.5B.i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +Apollo2-0.5B.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +Apollo2-0.5B.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +Apollo2-0.5B.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Apollo2-0.5B.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Apollo2-0.5B.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Apollo2-0.5B.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Apollo2-0.5B.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +Apollo2-0.5B.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +Apollo2-0.5B.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Apollo2-0.5B.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Apollo2-0.5B.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Apollo2-0.5B.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Apollo2-0.5B.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/Apollo2-0.5B.i1-IQ1_M.gguf 
b/Apollo2-0.5B.i1-IQ1_M.gguf new file mode 100644 index 0000000..248c7d6 --- /dev/null +++ b/Apollo2-0.5B.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c4509f210d08f72e59d077f8ce801861015badf2ba31623c21841dd9cc1de22 +size 394549088 diff --git a/Apollo2-0.5B.i1-IQ1_S.gguf b/Apollo2-0.5B.i1-IQ1_S.gguf new file mode 100644 index 0000000..57e3c19 --- /dev/null +++ b/Apollo2-0.5B.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d15cc7df76c3305a6b4c876c39122fe41945e20c644332876ea2d13e698f91a2 +size 392404064 diff --git a/Apollo2-0.5B.i1-IQ2_M.gguf b/Apollo2-0.5B.i1-IQ2_M.gguf new file mode 100644 index 0000000..f917058 --- /dev/null +++ b/Apollo2-0.5B.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fb4863b1291373856636dacd4dd025ca66b7961d9c8440b5f881b7642ac133f +size 405172064 diff --git a/Apollo2-0.5B.i1-IQ2_S.gguf b/Apollo2-0.5B.i1-IQ2_S.gguf new file mode 100644 index 0000000..57b2806 --- /dev/null +++ b/Apollo2-0.5B.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abca20a1d5dd7ab6a9c5f495dd51429ca61a79112402f4cdf7e0aa1b6f8358c9 +size 402312032 diff --git a/Apollo2-0.5B.i1-IQ2_XS.gguf b/Apollo2-0.5B.i1-IQ2_XS.gguf new file mode 100644 index 0000000..043cd66 --- /dev/null +++ b/Apollo2-0.5B.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc3fd00b0d3932dea7bbe4b92e12c2f2762761aa3926876acc28c946d1735803 +size 400984160 diff --git a/Apollo2-0.5B.i1-IQ2_XXS.gguf b/Apollo2-0.5B.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..eda27d1 --- /dev/null +++ b/Apollo2-0.5B.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c33cca96f1f043cea8d1e4750e140c9fae1640b9e3163646a41ca72bdcc2cfb5 +size 398124128 diff --git a/Apollo2-0.5B.i1-IQ3_M.gguf b/Apollo2-0.5B.i1-IQ3_M.gguf new file mode 100644 index 0000000..884e32c --- /dev/null +++ 
b/Apollo2-0.5B.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17a9803ab6ffde2c1e36b6861f286199b40c6c89e4186f0c6cfa60d7393e0973 +size 419327072 diff --git a/Apollo2-0.5B.i1-IQ3_S.gguf b/Apollo2-0.5B.i1-IQ3_S.gguf new file mode 100644 index 0000000..2a199b1 --- /dev/null +++ b/Apollo2-0.5B.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:315c4f8c07a391b25208ff1c3c1ce139f9d2de76861a53d97686cd29805dca7a +size 415182176 diff --git a/Apollo2-0.5B.i1-IQ3_XS.gguf b/Apollo2-0.5B.i1-IQ3_XS.gguf new file mode 100644 index 0000000..102b164 --- /dev/null +++ b/Apollo2-0.5B.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7610fad149ff30f906c7c46e431f099c4eed4c05a87f975f864c628ff219b5ef +size 415182176 diff --git a/Apollo2-0.5B.i1-IQ3_XXS.gguf b/Apollo2-0.5B.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..d4fb285 --- /dev/null +++ b/Apollo2-0.5B.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad6bb9b714d5493a34d0eceeb3023ff98f76dcb21d7a091ddfecfe8da9f7072d +size 410279264 diff --git a/Apollo2-0.5B.i1-IQ4_NL.gguf b/Apollo2-0.5B.i1-IQ4_NL.gguf new file mode 100644 index 0000000..7cbf584 --- /dev/null +++ b/Apollo2-0.5B.i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a733c62ce29105c9c8e05634fa94f39b5bc35413552b54b136ff23a3d9d5dce7 +size 429245792 diff --git a/Apollo2-0.5B.i1-IQ4_XS.gguf b/Apollo2-0.5B.i1-IQ4_XS.gguf new file mode 100644 index 0000000..2f7b8b0 --- /dev/null +++ b/Apollo2-0.5B.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:203270245f8f393a15c60cfbaa7b2b00478922214b99afe0f2212653c5ef2c70 +size 425977184 diff --git a/Apollo2-0.5B.i1-Q2_K.gguf b/Apollo2-0.5B.i1-Q2_K.gguf new file mode 100644 index 0000000..af88807 --- /dev/null +++ b/Apollo2-0.5B.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:5a9c9a2dd990117da739617afc8a426bda51974b0cf514dc10c69f8aaf860c66 +size 415182176 diff --git a/Apollo2-0.5B.i1-Q2_K_S.gguf b/Apollo2-0.5B.i1-Q2_K_S.gguf new file mode 100644 index 0000000..355d482 --- /dev/null +++ b/Apollo2-0.5B.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01c514bdbca4d6bbb4b674be3bcb5b335be00df4358a11b65a1d76c652342602 +size 407623520 diff --git a/Apollo2-0.5B.i1-Q3_K_L.gguf b/Apollo2-0.5B.i1-Q3_K_L.gguf new file mode 100644 index 0000000..8241d3d --- /dev/null +++ b/Apollo2-0.5B.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e6f6b32b257566c4ab8809e4780077536524848c6c07680858b3ea63c759d5e +size 445932896 diff --git a/Apollo2-0.5B.i1-Q3_K_M.gguf b/Apollo2-0.5B.i1-Q3_K_M.gguf new file mode 100644 index 0000000..66afb52 --- /dev/null +++ b/Apollo2-0.5B.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50cf52915b98ce2e635269cf6bb2557d8f6d602ec1131bacb012cf4e24c9a209 +size 432041312 diff --git a/Apollo2-0.5B.i1-Q3_K_S.gguf b/Apollo2-0.5B.i1-Q3_K_S.gguf new file mode 100644 index 0000000..362d3af --- /dev/null +++ b/Apollo2-0.5B.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:225ad01d45b117cee3be69c816b40d98ea2d959ee88a2f5ef2c8f33525d6459b +size 414838112 diff --git a/Apollo2-0.5B.i1-Q4_0.gguf b/Apollo2-0.5B.i1-Q4_0.gguf new file mode 100644 index 0000000..ad4273a --- /dev/null +++ b/Apollo2-0.5B.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f4225427afd73f7b2112fc2f05d41ab1fcee2ef365f0b2bccabae096b0cbbe2 +size 429546848 diff --git a/Apollo2-0.5B.i1-Q4_1.gguf b/Apollo2-0.5B.i1-Q4_1.gguf new file mode 100644 index 0000000..e214e96 --- /dev/null +++ b/Apollo2-0.5B.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d5095c638778a84ce85d52c2b555bbe32cb3626f4aba00848c85c7b501921d5 +size 459602272 diff --git 
a/Apollo2-0.5B.i1-Q4_K_M.gguf b/Apollo2-0.5B.i1-Q4_K_M.gguf new file mode 100644 index 0000000..5659d09 --- /dev/null +++ b/Apollo2-0.5B.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a39041700ad875af35cd5d469f7e9cbd8d5e7acb8e93fd17df9dd2c69442e11 +size 491399520 diff --git a/Apollo2-0.5B.i1-Q4_K_S.gguf b/Apollo2-0.5B.i1-Q4_K_S.gguf new file mode 100644 index 0000000..43fb553 --- /dev/null +++ b/Apollo2-0.5B.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d034c616a6063b96f520d4f39a471bf3109912dde9ba7e0cf80b62f2e4dd6111 +size 479063392 diff --git a/Apollo2-0.5B.i1-Q5_K_M.gguf b/Apollo2-0.5B.i1-Q5_K_M.gguf new file mode 100644 index 0000000..679dc9f --- /dev/null +++ b/Apollo2-0.5B.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85bd3358057b7a3b64a1dbcfb25a5ed1e990d74da76a9083516fab22c36c530b +size 522186080 diff --git a/Apollo2-0.5B.i1-Q5_K_S.gguf b/Apollo2-0.5B.i1-Q5_K_S.gguf new file mode 100644 index 0000000..6f6826a --- /dev/null +++ b/Apollo2-0.5B.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ca901582f6b6a5625604e7cb85f9e4e371997ffe451bfa79dce7deff6bb5449 +size 514810208 diff --git a/Apollo2-0.5B.i1-Q6_K.gguf b/Apollo2-0.5B.i1-Q6_K.gguf new file mode 100644 index 0000000..50b8124 --- /dev/null +++ b/Apollo2-0.5B.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da0629f102eb26baee3471a37f9c1727a137b8eec859dda82bde59a70a87d20c +size 650378592 diff --git a/README.md b/README.md new file mode 100644 index 0000000..4dbb2f9 --- /dev/null +++ b/README.md @@ -0,0 +1,123 @@ +--- +base_model: FreedomIntelligence/Apollo2-0.5B +datasets: +- FreedomIntelligence/ApolloMoEDataset +language: +- ar +- en +- zh +- ko +- ja +- mn +- th +- vi +- lo +- mg +- de +- pt +- es +- fr +- ru +- it +- hr +- gl +- cs +- co +- la +- uk +- bs +- bg +- eo +- sq +- da +- sa +- gn +- sr +- sk +- gd +- 
lb +- hi +- ku +- mt +- he +- ln +- bm +- sw +- ig +- rw +- ha +library_name: transformers +license: apache-2.0 +quantized_by: mradermacher +tags: +- biology +- medical +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/FreedomIntelligence/Apollo2-0.5B + + +static quants are available at https://huggingface.co/mradermacher/Apollo2-0.5B-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/Apollo2-0.5B-i1-GGUF/resolve/main/Apollo2-0.5B.i1-IQ1_S.gguf) | i1-IQ1_S | 0.5 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/Apollo2-0.5B-i1-GGUF/resolve/main/Apollo2-0.5B.i1-IQ1_M.gguf) | i1-IQ1_M | 0.5 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/Apollo2-0.5B-i1-GGUF/resolve/main/Apollo2-0.5B.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 0.5 | | +| [GGUF](https://huggingface.co/mradermacher/Apollo2-0.5B-i1-GGUF/resolve/main/Apollo2-0.5B.i1-IQ2_XS.gguf) | i1-IQ2_XS | 0.5 | | +| [GGUF](https://huggingface.co/mradermacher/Apollo2-0.5B-i1-GGUF/resolve/main/Apollo2-0.5B.i1-IQ2_S.gguf) | i1-IQ2_S | 0.5 | | +| [GGUF](https://huggingface.co/mradermacher/Apollo2-0.5B-i1-GGUF/resolve/main/Apollo2-0.5B.i1-IQ2_M.gguf) | i1-IQ2_M | 0.5 | | +| [GGUF](https://huggingface.co/mradermacher/Apollo2-0.5B-i1-GGUF/resolve/main/Apollo2-0.5B.i1-Q2_K_S.gguf) | i1-Q2_K_S | 0.5 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/Apollo2-0.5B-i1-GGUF/resolve/main/Apollo2-0.5B.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 0.5 | lower quality | +| 
[GGUF](https://huggingface.co/mradermacher/Apollo2-0.5B-i1-GGUF/resolve/main/Apollo2-0.5B.i1-Q3_K_S.gguf) | i1-Q3_K_S | 0.5 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/Apollo2-0.5B-i1-GGUF/resolve/main/Apollo2-0.5B.i1-IQ3_S.gguf) | i1-IQ3_S | 0.5 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/Apollo2-0.5B-i1-GGUF/resolve/main/Apollo2-0.5B.i1-IQ3_XS.gguf) | i1-IQ3_XS | 0.5 | | +| [GGUF](https://huggingface.co/mradermacher/Apollo2-0.5B-i1-GGUF/resolve/main/Apollo2-0.5B.i1-Q2_K.gguf) | i1-Q2_K | 0.5 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/Apollo2-0.5B-i1-GGUF/resolve/main/Apollo2-0.5B.i1-IQ3_M.gguf) | i1-IQ3_M | 0.5 | | +| [GGUF](https://huggingface.co/mradermacher/Apollo2-0.5B-i1-GGUF/resolve/main/Apollo2-0.5B.i1-IQ4_XS.gguf) | i1-IQ4_XS | 0.5 | | +| [GGUF](https://huggingface.co/mradermacher/Apollo2-0.5B-i1-GGUF/resolve/main/Apollo2-0.5B.i1-IQ4_NL.gguf) | i1-IQ4_NL | 0.5 | prefer IQ4_XS | +| [GGUF](https://huggingface.co/mradermacher/Apollo2-0.5B-i1-GGUF/resolve/main/Apollo2-0.5B.i1-Q4_0.gguf) | i1-Q4_0 | 0.5 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/Apollo2-0.5B-i1-GGUF/resolve/main/Apollo2-0.5B.i1-Q3_K_M.gguf) | i1-Q3_K_M | 0.5 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/Apollo2-0.5B-i1-GGUF/resolve/main/Apollo2-0.5B.i1-Q3_K_L.gguf) | i1-Q3_K_L | 0.5 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/Apollo2-0.5B-i1-GGUF/resolve/main/Apollo2-0.5B.i1-Q4_1.gguf) | i1-Q4_1 | 0.6 | | +| [GGUF](https://huggingface.co/mradermacher/Apollo2-0.5B-i1-GGUF/resolve/main/Apollo2-0.5B.i1-Q4_K_S.gguf) | i1-Q4_K_S | 0.6 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/Apollo2-0.5B-i1-GGUF/resolve/main/Apollo2-0.5B.i1-Q4_K_M.gguf) | i1-Q4_K_M | 0.6 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/Apollo2-0.5B-i1-GGUF/resolve/main/Apollo2-0.5B.i1-Q5_K_S.gguf) | i1-Q5_K_S | 0.6 | | +| 
[GGUF](https://huggingface.co/mradermacher/Apollo2-0.5B-i1-GGUF/resolve/main/Apollo2-0.5B.i1-Q5_K_M.gguf) | i1-Q5_K_M | 0.6 | | +| [GGUF](https://huggingface.co/mradermacher/Apollo2-0.5B-i1-GGUF/resolve/main/Apollo2-0.5B.i1-Q6_K.gguf) | i1-Q6_K | 0.8 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for answers to +questions you might have, or to request that another model be quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..83fa8ad --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:861bad52a1ab9723fcb04c7a1c2ced5ee5916f461f9a016af87fec170dc7acdb +size 988597