commit 0e0ffe28e0eafc562d9bcee543d57fbfe5a78c1a Author: ModelHub XC Date: Wed Jun 17 19:17:16 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/DictaLM-3.0-24B-Base-i1-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..fed59d5 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,59 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +DictaLM-3.0-24B-Base.imatrix.gguf filter=lfs diff=lfs merge=lfs -text 
+DictaLM-3.0-24B-Base.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +DictaLM-3.0-24B-Base.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +DictaLM-3.0-24B-Base.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +DictaLM-3.0-24B-Base.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +DictaLM-3.0-24B-Base.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +DictaLM-3.0-24B-Base.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +DictaLM-3.0-24B-Base.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +DictaLM-3.0-24B-Base.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +DictaLM-3.0-24B-Base.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +DictaLM-3.0-24B-Base.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +DictaLM-3.0-24B-Base.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +DictaLM-3.0-24B-Base.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +DictaLM-3.0-24B-Base.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +DictaLM-3.0-24B-Base.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +DictaLM-3.0-24B-Base.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +DictaLM-3.0-24B-Base.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +DictaLM-3.0-24B-Base.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +DictaLM-3.0-24B-Base.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +DictaLM-3.0-24B-Base.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +DictaLM-3.0-24B-Base.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +DictaLM-3.0-24B-Base.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +DictaLM-3.0-24B-Base.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +DictaLM-3.0-24B-Base.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/DictaLM-3.0-24B-Base.i1-IQ1_M.gguf b/DictaLM-3.0-24B-Base.i1-IQ1_M.gguf new file mode 100644 index 0000000..30af653 --- /dev/null +++ b/DictaLM-3.0-24B-Base.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c19ab393ad0a3d586b781f6b473f9e6e585b4c3d4df0472d16d9932d553d99d3 +size 
5750494560 diff --git a/DictaLM-3.0-24B-Base.i1-IQ1_S.gguf b/DictaLM-3.0-24B-Base.i1-IQ1_S.gguf new file mode 100644 index 0000000..a086f22 --- /dev/null +++ b/DictaLM-3.0-24B-Base.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0174a4a5bf10d7420656527c4fbdc60e561a3c6700254e86d6a4bdc1692b2203 +size 5273720160 diff --git a/DictaLM-3.0-24B-Base.i1-IQ2_M.gguf b/DictaLM-3.0-24B-Base.i1-IQ2_M.gguf new file mode 100644 index 0000000..4285f58 --- /dev/null +++ b/DictaLM-3.0-24B-Base.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ad05a2db6a2c45819db36c4ac9ca6c0dbc855560436ba4ac265862ae930e35d +size 8114050400 diff --git a/DictaLM-3.0-24B-Base.i1-IQ2_S.gguf b/DictaLM-3.0-24B-Base.i1-IQ2_S.gguf new file mode 100644 index 0000000..48420ba --- /dev/null +++ b/DictaLM-3.0-24B-Base.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:383696fee6b30975527a0d75f6e1084c6d72077fd004e111d721768b07e22a73 +size 7478351200 diff --git a/DictaLM-3.0-24B-Base.i1-IQ2_XS.gguf b/DictaLM-3.0-24B-Base.i1-IQ2_XS.gguf new file mode 100644 index 0000000..da7ee3a --- /dev/null +++ b/DictaLM-3.0-24B-Base.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:022d1b23d9573ab323a4b16eff8264af6388c161de76e08a2821f2671234c366 +size 7207032160 diff --git a/DictaLM-3.0-24B-Base.i1-IQ2_XXS.gguf b/DictaLM-3.0-24B-Base.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..346bf96 --- /dev/null +++ b/DictaLM-3.0-24B-Base.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48305b0054a1da8e2ed7ede7654aaca5f25d647a019b76f367be11ddacce8b21 +size 6545118560 diff --git a/DictaLM-3.0-24B-Base.i1-IQ3_M.gguf b/DictaLM-3.0-24B-Base.i1-IQ3_M.gguf new file mode 100644 index 0000000..4b95806 --- /dev/null +++ b/DictaLM-3.0-24B-Base.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:16498e2b21b2cfe0f9ca83fd9ffdd75e52f5aef4adcf699b950606153cf8ea70 +size 10650948960 diff --git a/DictaLM-3.0-24B-Base.i1-IQ3_S.gguf b/DictaLM-3.0-24B-Base.i1-IQ3_S.gguf new file mode 100644 index 0000000..30022d5 --- /dev/null +++ b/DictaLM-3.0-24B-Base.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:942b6a9ba64817ec9460a6b593c4792697c59d7062e0e33bc9ae63c6fe210405 +size 10428126560 diff --git a/DictaLM-3.0-24B-Base.i1-IQ3_XS.gguf b/DictaLM-3.0-24B-Base.i1-IQ3_XS.gguf new file mode 100644 index 0000000..229504a --- /dev/null +++ b/DictaLM-3.0-24B-Base.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df1c600eabb52dcaa47e05d448d23b35a0879bf9b466674c6f07ba8f7255566f +size 9907115360 diff --git a/DictaLM-3.0-24B-Base.i1-IQ3_XXS.gguf b/DictaLM-3.0-24B-Base.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..5a24d73 --- /dev/null +++ b/DictaLM-3.0-24B-Base.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72d76d242cedf7e026132fe9e10344f0a97fdac19a3b33095a51c3f44ebefcaa +size 9280591200 diff --git a/DictaLM-3.0-24B-Base.i1-IQ4_XS.gguf b/DictaLM-3.0-24B-Base.i1-IQ4_XS.gguf new file mode 100644 index 0000000..200322c --- /dev/null +++ b/DictaLM-3.0-24B-Base.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a86bf7f1058a6d882f5ad05f41e87dbe500d4ccd2e73ad5438165f8306ebc110 +size 12758914400 diff --git a/DictaLM-3.0-24B-Base.i1-Q2_K.gguf b/DictaLM-3.0-24B-Base.i1-Q2_K.gguf new file mode 100644 index 0000000..8f969cb --- /dev/null +++ b/DictaLM-3.0-24B-Base.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9e12ac9350852b8a7feb07c888b22d78f14dd790d813f19923b260f46455e28 +size 8890324320 diff --git a/DictaLM-3.0-24B-Base.i1-Q2_K_S.gguf b/DictaLM-3.0-24B-Base.i1-Q2_K_S.gguf new file mode 100644 index 0000000..76aeac1 --- /dev/null +++ b/DictaLM-3.0-24B-Base.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ 
+version https://git-lfs.github.com/spec/v1 +oid sha256:ce5807c5eb84c06d9fef350c77230bb839fd958a10c658380351eb26f6cc9f85 +size 8320161120 diff --git a/DictaLM-3.0-24B-Base.i1-Q3_K_L.gguf b/DictaLM-3.0-24B-Base.i1-Q3_K_L.gguf new file mode 100644 index 0000000..5d16341 --- /dev/null +++ b/DictaLM-3.0-24B-Base.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80db3b2997489669c59d445db5ad94e173ef7795a1077f0c295b3efcc6469fde +size 12400760160 diff --git a/DictaLM-3.0-24B-Base.i1-Q3_K_M.gguf b/DictaLM-3.0-24B-Base.i1-Q3_K_M.gguf new file mode 100644 index 0000000..5011f46 --- /dev/null +++ b/DictaLM-3.0-24B-Base.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9894992080e7dc2e5469b10c07d507517a16c2bc99c522c955a49461d18275e7 +size 11474081120 diff --git a/DictaLM-3.0-24B-Base.i1-Q3_K_S.gguf b/DictaLM-3.0-24B-Base.i1-Q3_K_S.gguf new file mode 100644 index 0000000..4425203 --- /dev/null +++ b/DictaLM-3.0-24B-Base.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cad6cf5438e6a32b83b37f1490ddb875155746498b37ef5778686fa390b134b1 +size 10400273760 diff --git a/DictaLM-3.0-24B-Base.i1-Q4_0.gguf b/DictaLM-3.0-24B-Base.i1-Q4_0.gguf new file mode 100644 index 0000000..b556f3d --- /dev/null +++ b/DictaLM-3.0-24B-Base.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0280775499dd14f9afc96065b8f295a9cea3bd3e973806c247903490babb55c +size 13494228320 diff --git a/DictaLM-3.0-24B-Base.i1-Q4_1.gguf b/DictaLM-3.0-24B-Base.i1-Q4_1.gguf new file mode 100644 index 0000000..4eedfad --- /dev/null +++ b/DictaLM-3.0-24B-Base.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aff259667dda08d7ee1c54ecd1624f8bbea166083d8652efe6512c1f20766483 +size 14873105760 diff --git a/DictaLM-3.0-24B-Base.i1-Q4_K_M.gguf b/DictaLM-3.0-24B-Base.i1-Q4_K_M.gguf new file mode 100644 index 0000000..88763f4 --- /dev/null +++ 
b/DictaLM-3.0-24B-Base.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0afe268633865613c003de4a57f7edc232929802f5c96a8fbfd21c231e0342a2 +size 14333908320 diff --git a/DictaLM-3.0-24B-Base.i1-Q4_K_S.gguf b/DictaLM-3.0-24B-Base.i1-Q4_K_S.gguf new file mode 100644 index 0000000..45c2c22 --- /dev/null +++ b/DictaLM-3.0-24B-Base.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a8ba0af08bd06fedc5f14653240be4235576ad8658bcd6b6a5c5297264a04b0 +size 13549278560 diff --git a/DictaLM-3.0-24B-Base.i1-Q5_K_M.gguf b/DictaLM-3.0-24B-Base.i1-Q5_K_M.gguf new file mode 100644 index 0000000..12b22a9 --- /dev/null +++ b/DictaLM-3.0-24B-Base.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b2fd56d34331b5738a2c207787d243ff205e8dcc6326a36f94bec1185a1d5dd +size 16763983200 diff --git a/DictaLM-3.0-24B-Base.i1-Q5_K_S.gguf b/DictaLM-3.0-24B-Base.i1-Q5_K_S.gguf new file mode 100644 index 0000000..6fd5d9d --- /dev/null +++ b/DictaLM-3.0-24B-Base.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47c82d6cf9820a2d8793f71ad527be0cf420b0735b607581639884d37ad23543 +size 16304412000 diff --git a/DictaLM-3.0-24B-Base.i1-Q6_K.gguf b/DictaLM-3.0-24B-Base.i1-Q6_K.gguf new file mode 100644 index 0000000..4b15f8c --- /dev/null +++ b/DictaLM-3.0-24B-Base.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3abdcec3bf5cd31d89ecd9607ef64d464985baeed3f055df60fa8e928ee37dbc +size 19345937760 diff --git a/DictaLM-3.0-24B-Base.imatrix.gguf b/DictaLM-3.0-24B-Base.imatrix.gguf new file mode 100644 index 0000000..49daa4c --- /dev/null +++ b/DictaLM-3.0-24B-Base.imatrix.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7325a565503e4fe338083e6547dbaff60e7753fe36fb837c067ddc6152997935 +size 10037312 diff --git a/README.md b/README.md new file mode 100644 index 0000000..b19d2ff --- /dev/null +++ b/README.md @@ 
-0,0 +1,87 @@ +--- +base_model: dicta-il/DictaLM-3.0-24B-Base +language: +- en +- he +library_name: transformers +license: apache-2.0 +mradermacher: + readme_rev: 1 +quantized_by: mradermacher +tags: +- pretrained +--- +## About + + + + + + + + + +weighted/imatrix quants of https://huggingface.co/dicta-il/DictaLM-3.0-24B-Base + + + +***For a convenient overview and download list, visit our [model page for this model](https://hf.tst.eu/model#DictaLM-3.0-24B-Base-i1-GGUF).*** + +static quants are available at https://huggingface.co/mradermacher/DictaLM-3.0-24B-Base-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similarly sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/DictaLM-3.0-24B-Base-i1-GGUF/resolve/main/DictaLM-3.0-24B-Base.imatrix.gguf) | imatrix | 0.1 | imatrix file (for creating your own quants) | +| [GGUF](https://huggingface.co/mradermacher/DictaLM-3.0-24B-Base-i1-GGUF/resolve/main/DictaLM-3.0-24B-Base.i1-IQ1_S.gguf) | i1-IQ1_S | 5.4 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/DictaLM-3.0-24B-Base-i1-GGUF/resolve/main/DictaLM-3.0-24B-Base.i1-IQ1_M.gguf) | i1-IQ1_M | 5.9 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/DictaLM-3.0-24B-Base-i1-GGUF/resolve/main/DictaLM-3.0-24B-Base.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 6.6 | | +| [GGUF](https://huggingface.co/mradermacher/DictaLM-3.0-24B-Base-i1-GGUF/resolve/main/DictaLM-3.0-24B-Base.i1-IQ2_XS.gguf) | i1-IQ2_XS | 7.3 | | +| [GGUF](https://huggingface.co/mradermacher/DictaLM-3.0-24B-Base-i1-GGUF/resolve/main/DictaLM-3.0-24B-Base.i1-IQ2_S.gguf) | i1-IQ2_S | 7.6 | | +| 
[GGUF](https://huggingface.co/mradermacher/DictaLM-3.0-24B-Base-i1-GGUF/resolve/main/DictaLM-3.0-24B-Base.i1-IQ2_M.gguf) | i1-IQ2_M | 8.2 | | +| [GGUF](https://huggingface.co/mradermacher/DictaLM-3.0-24B-Base-i1-GGUF/resolve/main/DictaLM-3.0-24B-Base.i1-Q2_K_S.gguf) | i1-Q2_K_S | 8.4 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/DictaLM-3.0-24B-Base-i1-GGUF/resolve/main/DictaLM-3.0-24B-Base.i1-Q2_K.gguf) | i1-Q2_K | 9.0 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/DictaLM-3.0-24B-Base-i1-GGUF/resolve/main/DictaLM-3.0-24B-Base.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 9.4 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/DictaLM-3.0-24B-Base-i1-GGUF/resolve/main/DictaLM-3.0-24B-Base.i1-IQ3_XS.gguf) | i1-IQ3_XS | 10.0 | | +| [GGUF](https://huggingface.co/mradermacher/DictaLM-3.0-24B-Base-i1-GGUF/resolve/main/DictaLM-3.0-24B-Base.i1-Q3_K_S.gguf) | i1-Q3_K_S | 10.5 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/DictaLM-3.0-24B-Base-i1-GGUF/resolve/main/DictaLM-3.0-24B-Base.i1-IQ3_S.gguf) | i1-IQ3_S | 10.5 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/DictaLM-3.0-24B-Base-i1-GGUF/resolve/main/DictaLM-3.0-24B-Base.i1-IQ3_M.gguf) | i1-IQ3_M | 10.8 | | +| [GGUF](https://huggingface.co/mradermacher/DictaLM-3.0-24B-Base-i1-GGUF/resolve/main/DictaLM-3.0-24B-Base.i1-Q3_K_M.gguf) | i1-Q3_K_M | 11.6 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/DictaLM-3.0-24B-Base-i1-GGUF/resolve/main/DictaLM-3.0-24B-Base.i1-Q3_K_L.gguf) | i1-Q3_K_L | 12.5 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/DictaLM-3.0-24B-Base-i1-GGUF/resolve/main/DictaLM-3.0-24B-Base.i1-IQ4_XS.gguf) | i1-IQ4_XS | 12.9 | | +| [GGUF](https://huggingface.co/mradermacher/DictaLM-3.0-24B-Base-i1-GGUF/resolve/main/DictaLM-3.0-24B-Base.i1-Q4_0.gguf) | i1-Q4_0 | 13.6 | fast, low quality | +| 
[GGUF](https://huggingface.co/mradermacher/DictaLM-3.0-24B-Base-i1-GGUF/resolve/main/DictaLM-3.0-24B-Base.i1-Q4_K_S.gguf) | i1-Q4_K_S | 13.6 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/DictaLM-3.0-24B-Base-i1-GGUF/resolve/main/DictaLM-3.0-24B-Base.i1-Q4_K_M.gguf) | i1-Q4_K_M | 14.4 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/DictaLM-3.0-24B-Base-i1-GGUF/resolve/main/DictaLM-3.0-24B-Base.i1-Q4_1.gguf) | i1-Q4_1 | 15.0 | | +| [GGUF](https://huggingface.co/mradermacher/DictaLM-3.0-24B-Base-i1-GGUF/resolve/main/DictaLM-3.0-24B-Base.i1-Q5_K_S.gguf) | i1-Q5_K_S | 16.4 | | +| [GGUF](https://huggingface.co/mradermacher/DictaLM-3.0-24B-Base-i1-GGUF/resolve/main/DictaLM-3.0-24B-Base.i1-Q5_K_M.gguf) | i1-Q5_K_M | 16.9 | | +| [GGUF](https://huggingface.co/mradermacher/DictaLM-3.0-24B-Base-i1-GGUF/resolve/main/DictaLM-3.0-24B-Base.i1-Q6_K.gguf) | i1-Q6_K | 19.4 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + +