commit 1bce0ed26b7c2ab6147b01662102935b525a1f93 Author: ModelHub XC Date: Sun May 3 02:49:25 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/Athena-gemma-2-2b-it-Philos-i1-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..05cdb12 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +Athena-gemma-2-2b-it-Philos.i1-Q2_K.gguf 
filter=lfs diff=lfs merge=lfs -text +Athena-gemma-2-2b-it-Philos.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +Athena-gemma-2-2b-it-Philos.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Athena-gemma-2-2b-it-Philos.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Athena-gemma-2-2b-it-Philos.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Athena-gemma-2-2b-it-Philos.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Athena-gemma-2-2b-it-Philos.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +Athena-gemma-2-2b-it-Philos.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +Athena-gemma-2-2b-it-Philos.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +Athena-gemma-2-2b-it-Philos.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +Athena-gemma-2-2b-it-Philos.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Athena-gemma-2-2b-it-Philos.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Athena-gemma-2-2b-it-Philos.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Athena-gemma-2-2b-it-Philos.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +Athena-gemma-2-2b-it-Philos.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Athena-gemma-2-2b-it-Philos.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +Athena-gemma-2-2b-it-Philos.i1-Q4_0_4_4.gguf filter=lfs diff=lfs merge=lfs -text +Athena-gemma-2-2b-it-Philos.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +Athena-gemma-2-2b-it-Philos.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Athena-gemma-2-2b-it-Philos.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +Athena-gemma-2-2b-it-Philos.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +Athena-gemma-2-2b-it-Philos.i1-Q4_0_4_8.gguf filter=lfs diff=lfs merge=lfs -text +Athena-gemma-2-2b-it-Philos.i1-Q4_0_8_8.gguf filter=lfs diff=lfs merge=lfs -text +Athena-gemma-2-2b-it-Philos.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/Athena-gemma-2-2b-it-Philos.i1-IQ1_M.gguf b/Athena-gemma-2-2b-it-Philos.i1-IQ1_M.gguf new file mode 100644 index 
0000000..0ecbce3 --- /dev/null +++ b/Athena-gemma-2-2b-it-Philos.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6253406a17670483fa0a080150db920b2d84e2d3528097ad57424e3b9ddb1365 +size 873798368 diff --git a/Athena-gemma-2-2b-it-Philos.i1-IQ1_S.gguf b/Athena-gemma-2-2b-it-Philos.i1-IQ1_S.gguf new file mode 100644 index 0000000..22318d2 --- /dev/null +++ b/Athena-gemma-2-2b-it-Philos.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b8abd7b585ec0088626ab72eae35ca36c2f982bc63c127df763bd36cebb5fce +size 832160480 diff --git a/Athena-gemma-2-2b-it-Philos.i1-IQ2_M.gguf b/Athena-gemma-2-2b-it-Philos.i1-IQ2_M.gguf new file mode 100644 index 0000000..5537620 --- /dev/null +++ b/Athena-gemma-2-2b-it-Philos.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1135f4d27e6d9a7b8c77f0ed7ecacbef6faf528420844785cee51cfeaa812629 +size 1088015072 diff --git a/Athena-gemma-2-2b-it-Philos.i1-IQ2_S.gguf b/Athena-gemma-2-2b-it-Philos.i1-IQ2_S.gguf new file mode 100644 index 0000000..a35a3de --- /dev/null +++ b/Athena-gemma-2-2b-it-Philos.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:402a9807876889b0c7cb814a0aaf65aae74cfb33bcafcf3c9fd567cac089d6a3 +size 1032497888 diff --git a/Athena-gemma-2-2b-it-Philos.i1-IQ2_XS.gguf b/Athena-gemma-2-2b-it-Philos.i1-IQ2_XS.gguf new file mode 100644 index 0000000..350f8a2 --- /dev/null +++ b/Athena-gemma-2-2b-it-Philos.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51a71f29575247e1442eee5c0f2b0b237d0f41b919a0de184145a374e3d17b47 +size 1002545888 diff --git a/Athena-gemma-2-2b-it-Philos.i1-IQ2_XXS.gguf b/Athena-gemma-2-2b-it-Philos.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..385da6f --- /dev/null +++ b/Athena-gemma-2-2b-it-Philos.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:6c4ee951e1f824d22ef3606fc313e526c06380f9b7695de63c0874d32867bbe5 +size 943194848 diff --git a/Athena-gemma-2-2b-it-Philos.i1-IQ3_M.gguf b/Athena-gemma-2-2b-it-Philos.i1-IQ3_M.gguf new file mode 100644 index 0000000..db3074c --- /dev/null +++ b/Athena-gemma-2-2b-it-Philos.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cd671316c8f9cf1153e82af32b1cde1225c78467a08a196caf4bf6bea4dfc6c +size 1393562336 diff --git a/Athena-gemma-2-2b-it-Philos.i1-IQ3_S.gguf b/Athena-gemma-2-2b-it-Philos.i1-IQ3_S.gguf new file mode 100644 index 0000000..adf5621 --- /dev/null +++ b/Athena-gemma-2-2b-it-Philos.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96ecbc8aa50304a9662634d96808491fbd0457b54c032075c61790049d44bbf8 +size 1360661216 diff --git a/Athena-gemma-2-2b-it-Philos.i1-IQ3_XS.gguf b/Athena-gemma-2-2b-it-Philos.i1-IQ3_XS.gguf new file mode 100644 index 0000000..f188650 --- /dev/null +++ b/Athena-gemma-2-2b-it-Philos.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a879464b1f55cf5de18e1ef329d212d75edb290392f009d85662cf313a2c1be +size 1314212576 diff --git a/Athena-gemma-2-2b-it-Philos.i1-IQ3_XXS.gguf b/Athena-gemma-2-2b-it-Philos.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..e78083d --- /dev/null +++ b/Athena-gemma-2-2b-it-Philos.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4f087405d95e7c251b545d804d09d42c11be138275fe8702738002214ff10b3 +size 1181686496 diff --git a/Athena-gemma-2-2b-it-Philos.i1-IQ4_XS.gguf b/Athena-gemma-2-2b-it-Philos.i1-IQ4_XS.gguf new file mode 100644 index 0000000..b3176a3 --- /dev/null +++ b/Athena-gemma-2-2b-it-Philos.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:706d43051fd5d6f3ef6463622e05df58f6082ced17ec252467dee558107f520e +size 1566251744 diff --git a/Athena-gemma-2-2b-it-Philos.i1-Q2_K.gguf b/Athena-gemma-2-2b-it-Philos.i1-Q2_K.gguf new 
file mode 100644 index 0000000..8f928a3 --- /dev/null +++ b/Athena-gemma-2-2b-it-Philos.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:994c044bfe327ec2783ba664d7a608be9a1c6ad8843916d0952fa7216a0e6dc0 +size 1229830880 diff --git a/Athena-gemma-2-2b-it-Philos.i1-Q3_K_L.gguf b/Athena-gemma-2-2b-it-Philos.i1-Q3_K_L.gguf new file mode 100644 index 0000000..6a089f3 --- /dev/null +++ b/Athena-gemma-2-2b-it-Philos.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4334bb7e63dc8ae3662eaefc8a89c16296e746a0e319274b1c204a2b825557e2 +size 1550437088 diff --git a/Athena-gemma-2-2b-it-Philos.i1-Q3_K_M.gguf b/Athena-gemma-2-2b-it-Philos.i1-Q3_K_M.gguf new file mode 100644 index 0000000..3e37b60 --- /dev/null +++ b/Athena-gemma-2-2b-it-Philos.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8840417eb3913627f043e36184159db624fb190b93cdcbd51eb623865938a9af +size 1461668576 diff --git a/Athena-gemma-2-2b-it-Philos.i1-Q3_K_S.gguf b/Athena-gemma-2-2b-it-Philos.i1-Q3_K_S.gguf new file mode 100644 index 0000000..89263bf --- /dev/null +++ b/Athena-gemma-2-2b-it-Philos.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc86e1f1cdb161361b79bf48f99290e44764fd00af9de0a785b475798794b5dd +size 1360661216 diff --git a/Athena-gemma-2-2b-it-Philos.i1-Q4_0.gguf b/Athena-gemma-2-2b-it-Philos.i1-Q4_0.gguf new file mode 100644 index 0000000..1a251af --- /dev/null +++ b/Athena-gemma-2-2b-it-Philos.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a189d20b0e8ff5514be8bc4f06a25e3df9b99783afcee0a83e40e2b108cb21b +size 1633491680 diff --git a/Athena-gemma-2-2b-it-Philos.i1-Q4_0_4_4.gguf b/Athena-gemma-2-2b-it-Philos.i1-Q4_0_4_4.gguf new file mode 100644 index 0000000..f806567 --- /dev/null +++ b/Athena-gemma-2-2b-it-Philos.i1-Q4_0_4_4.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:dec042bfcff42ae112a4716d7fd1b42c61d713943a7226204f9f3e4697375121 +size 1629510368 diff --git a/Athena-gemma-2-2b-it-Philos.i1-Q4_0_4_8.gguf b/Athena-gemma-2-2b-it-Philos.i1-Q4_0_4_8.gguf new file mode 100644 index 0000000..4e76a71 --- /dev/null +++ b/Athena-gemma-2-2b-it-Philos.i1-Q4_0_4_8.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:697f88992b97ba5c599c4daad08085c66d6e448b55eafebc876a0d125f34ef8b +size 1629510368 diff --git a/Athena-gemma-2-2b-it-Philos.i1-Q4_0_8_8.gguf b/Athena-gemma-2-2b-it-Philos.i1-Q4_0_8_8.gguf new file mode 100644 index 0000000..b76ec09 --- /dev/null +++ b/Athena-gemma-2-2b-it-Philos.i1-Q4_0_8_8.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d91f97a0f3c32227fb53bde810533f7edefc88e8cdea7204469d51ea9cb231da +size 1629510368 diff --git a/Athena-gemma-2-2b-it-Philos.i1-Q4_K_M.gguf b/Athena-gemma-2-2b-it-Philos.i1-Q4_K_M.gguf new file mode 100644 index 0000000..a094415 --- /dev/null +++ b/Athena-gemma-2-2b-it-Philos.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fa3bdb1b1788a1d37b0a233e2004f977fc1428a2010bc82324af2d06431a6d0 +size 1708583648 diff --git a/Athena-gemma-2-2b-it-Philos.i1-Q4_K_S.gguf b/Athena-gemma-2-2b-it-Philos.i1-Q4_K_S.gguf new file mode 100644 index 0000000..b1fef5c --- /dev/null +++ b/Athena-gemma-2-2b-it-Philos.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc995bc77a7362d5d4945224205d1cefd56ffcfa6dae3c9756cc5e31ff9fe6b6 +size 1638652640 diff --git a/Athena-gemma-2-2b-it-Philos.i1-Q5_K_M.gguf b/Athena-gemma-2-2b-it-Philos.i1-Q5_K_M.gguf new file mode 100644 index 0000000..9d30af1 --- /dev/null +++ b/Athena-gemma-2-2b-it-Philos.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9a955bc244c2532701d7f4fa0e8925c591b507169217d0b2131bb074ae714bd +size 1923279584 diff --git a/Athena-gemma-2-2b-it-Philos.i1-Q5_K_S.gguf 
b/Athena-gemma-2-2b-it-Philos.i1-Q5_K_S.gguf new file mode 100644 index 0000000..fab3433 --- /dev/null +++ b/Athena-gemma-2-2b-it-Philos.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dd18d4d23c8473b514b4cd2cbbcca65363635717297bc339adaf4d1fc5bbf12 +size 1882544864 diff --git a/Athena-gemma-2-2b-it-Philos.i1-Q6_K.gguf b/Athena-gemma-2-2b-it-Philos.i1-Q6_K.gguf new file mode 100644 index 0000000..c4f5547 --- /dev/null +++ b/Athena-gemma-2-2b-it-Philos.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fd23441182897fbd8dfa52d0d3b2ea5562e544b90df58852116181578e5d3a2 +size 2151394016 diff --git a/README.md b/README.md new file mode 100644 index 0000000..0afec30 --- /dev/null +++ b/README.md @@ -0,0 +1,82 @@ +--- +base_model: EpistemeAI/Athena-gemma-2-2b-it-Philos +language: +- en +library_name: transformers +license: apache-2.0 +quantized_by: mradermacher +tags: +- text-generation-inference +- transformers +- unsloth +- gemma2 +- trl +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/EpistemeAI/Athena-gemma-2-2b-it-Philos + + +static quants are available at https://huggingface.co/mradermacher/Athena-gemma-2-2b-it-Philos-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. 
IQ-quants are often preferable to similar-sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/Athena-gemma-2-2b-it-Philos-i1-GGUF/resolve/main/Athena-gemma-2-2b-it-Philos.i1-IQ1_S.gguf) | i1-IQ1_S | 0.9 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/Athena-gemma-2-2b-it-Philos-i1-GGUF/resolve/main/Athena-gemma-2-2b-it-Philos.i1-IQ1_M.gguf) | i1-IQ1_M | 1.0 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/Athena-gemma-2-2b-it-Philos-i1-GGUF/resolve/main/Athena-gemma-2-2b-it-Philos.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 1.0 | | +| [GGUF](https://huggingface.co/mradermacher/Athena-gemma-2-2b-it-Philos-i1-GGUF/resolve/main/Athena-gemma-2-2b-it-Philos.i1-IQ2_XS.gguf) | i1-IQ2_XS | 1.1 | | +| [GGUF](https://huggingface.co/mradermacher/Athena-gemma-2-2b-it-Philos-i1-GGUF/resolve/main/Athena-gemma-2-2b-it-Philos.i1-IQ2_S.gguf) | i1-IQ2_S | 1.1 | | +| [GGUF](https://huggingface.co/mradermacher/Athena-gemma-2-2b-it-Philos-i1-GGUF/resolve/main/Athena-gemma-2-2b-it-Philos.i1-IQ2_M.gguf) | i1-IQ2_M | 1.2 | | +| [GGUF](https://huggingface.co/mradermacher/Athena-gemma-2-2b-it-Philos-i1-GGUF/resolve/main/Athena-gemma-2-2b-it-Philos.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 1.3 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/Athena-gemma-2-2b-it-Philos-i1-GGUF/resolve/main/Athena-gemma-2-2b-it-Philos.i1-Q2_K.gguf) | i1-Q2_K | 1.3 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/Athena-gemma-2-2b-it-Philos-i1-GGUF/resolve/main/Athena-gemma-2-2b-it-Philos.i1-IQ3_XS.gguf) | i1-IQ3_XS | 1.4 | | +| [GGUF](https://huggingface.co/mradermacher/Athena-gemma-2-2b-it-Philos-i1-GGUF/resolve/main/Athena-gemma-2-2b-it-Philos.i1-IQ3_S.gguf) | i1-IQ3_S | 1.5 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/Athena-gemma-2-2b-it-Philos-i1-GGUF/resolve/main/Athena-gemma-2-2b-it-Philos.i1-Q3_K_S.gguf) | i1-Q3_K_S | 1.5 | IQ3_XS probably 
better | +| [GGUF](https://huggingface.co/mradermacher/Athena-gemma-2-2b-it-Philos-i1-GGUF/resolve/main/Athena-gemma-2-2b-it-Philos.i1-IQ3_M.gguf) | i1-IQ3_M | 1.5 | | +| [GGUF](https://huggingface.co/mradermacher/Athena-gemma-2-2b-it-Philos-i1-GGUF/resolve/main/Athena-gemma-2-2b-it-Philos.i1-Q3_K_M.gguf) | i1-Q3_K_M | 1.6 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/Athena-gemma-2-2b-it-Philos-i1-GGUF/resolve/main/Athena-gemma-2-2b-it-Philos.i1-Q3_K_L.gguf) | i1-Q3_K_L | 1.7 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/Athena-gemma-2-2b-it-Philos-i1-GGUF/resolve/main/Athena-gemma-2-2b-it-Philos.i1-IQ4_XS.gguf) | i1-IQ4_XS | 1.7 | | +| [GGUF](https://huggingface.co/mradermacher/Athena-gemma-2-2b-it-Philos-i1-GGUF/resolve/main/Athena-gemma-2-2b-it-Philos.i1-Q4_0_4_4.gguf) | i1-Q4_0_4_4 | 1.7 | fast on arm, low quality | +| [GGUF](https://huggingface.co/mradermacher/Athena-gemma-2-2b-it-Philos-i1-GGUF/resolve/main/Athena-gemma-2-2b-it-Philos.i1-Q4_0_4_8.gguf) | i1-Q4_0_4_8 | 1.7 | fast on arm+i8mm, low quality | +| [GGUF](https://huggingface.co/mradermacher/Athena-gemma-2-2b-it-Philos-i1-GGUF/resolve/main/Athena-gemma-2-2b-it-Philos.i1-Q4_0_8_8.gguf) | i1-Q4_0_8_8 | 1.7 | fast on arm+sve, low quality | +| [GGUF](https://huggingface.co/mradermacher/Athena-gemma-2-2b-it-Philos-i1-GGUF/resolve/main/Athena-gemma-2-2b-it-Philos.i1-Q4_0.gguf) | i1-Q4_0 | 1.7 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/Athena-gemma-2-2b-it-Philos-i1-GGUF/resolve/main/Athena-gemma-2-2b-it-Philos.i1-Q4_K_S.gguf) | i1-Q4_K_S | 1.7 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/Athena-gemma-2-2b-it-Philos-i1-GGUF/resolve/main/Athena-gemma-2-2b-it-Philos.i1-Q4_K_M.gguf) | i1-Q4_K_M | 1.8 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/Athena-gemma-2-2b-it-Philos-i1-GGUF/resolve/main/Athena-gemma-2-2b-it-Philos.i1-Q5_K_S.gguf) | i1-Q5_K_S | 2.0 | | +| 
[GGUF](https://huggingface.co/mradermacher/Athena-gemma-2-2b-it-Philos-i1-GGUF/resolve/main/Athena-gemma-2-2b-it-Philos.i1-Q5_K_M.gguf) | i1-Q5_K_M | 2.0 | | +| [GGUF](https://huggingface.co/mradermacher/Athena-gemma-2-2b-it-Philos-i1-GGUF/resolve/main/Athena-gemma-2-2b-it-Philos.i1-Q6_K.gguf) | i1-Q6_K | 2.3 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..b0f5d9d --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cfda018ec9375a1ad45f0c5dc49ed4dea1bb7a46ca91debd1f351e3bc8c5fd8 +size 2375559