From 7f4a8dfa46c71305c05d3cb8408154c6e8d14384 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Sat, 9 May 2026 19:31:13 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mradermacher/Julia-Alpha-i1-GGUF Source: Original Platform --- .gitattributes | 60 +++++++++++++++++++++++++++ Julia-Alpha.i1-IQ1_M.gguf | 3 ++ Julia-Alpha.i1-IQ1_S.gguf | 3 ++ Julia-Alpha.i1-IQ2_M.gguf | 3 ++ Julia-Alpha.i1-IQ2_S.gguf | 3 ++ Julia-Alpha.i1-IQ2_XS.gguf | 3 ++ Julia-Alpha.i1-IQ2_XXS.gguf | 3 ++ Julia-Alpha.i1-IQ3_M.gguf | 3 ++ Julia-Alpha.i1-IQ3_S.gguf | 3 ++ Julia-Alpha.i1-IQ3_XS.gguf | 3 ++ Julia-Alpha.i1-IQ3_XXS.gguf | 3 ++ Julia-Alpha.i1-IQ4_NL.gguf | 3 ++ Julia-Alpha.i1-IQ4_XS.gguf | 3 ++ Julia-Alpha.i1-Q2_K.gguf | 3 ++ Julia-Alpha.i1-Q2_K_S.gguf | 3 ++ Julia-Alpha.i1-Q3_K_L.gguf | 3 ++ Julia-Alpha.i1-Q3_K_M.gguf | 3 ++ Julia-Alpha.i1-Q3_K_S.gguf | 3 ++ Julia-Alpha.i1-Q4_0.gguf | 3 ++ Julia-Alpha.i1-Q4_1.gguf | 3 ++ Julia-Alpha.i1-Q4_K_M.gguf | 3 ++ Julia-Alpha.i1-Q4_K_S.gguf | 3 ++ Julia-Alpha.i1-Q5_K_M.gguf | 3 ++ Julia-Alpha.i1-Q5_K_S.gguf | 3 ++ Julia-Alpha.i1-Q6_K.gguf | 3 ++ README.md | 83 +++++++++++++++++++++++++++++++++++++ imatrix.dat | 3 ++ 27 files changed, 218 insertions(+) create mode 100644 .gitattributes create mode 100644 Julia-Alpha.i1-IQ1_M.gguf create mode 100644 Julia-Alpha.i1-IQ1_S.gguf create mode 100644 Julia-Alpha.i1-IQ2_M.gguf create mode 100644 Julia-Alpha.i1-IQ2_S.gguf create mode 100644 Julia-Alpha.i1-IQ2_XS.gguf create mode 100644 Julia-Alpha.i1-IQ2_XXS.gguf create mode 100644 Julia-Alpha.i1-IQ3_M.gguf create mode 100644 Julia-Alpha.i1-IQ3_S.gguf create mode 100644 Julia-Alpha.i1-IQ3_XS.gguf create mode 100644 Julia-Alpha.i1-IQ3_XXS.gguf create mode 100644 Julia-Alpha.i1-IQ4_NL.gguf create mode 100644 
Julia-Alpha.i1-IQ4_XS.gguf create mode 100644 Julia-Alpha.i1-Q2_K.gguf create mode 100644 Julia-Alpha.i1-Q2_K_S.gguf create mode 100644 Julia-Alpha.i1-Q3_K_L.gguf create mode 100644 Julia-Alpha.i1-Q3_K_M.gguf create mode 100644 Julia-Alpha.i1-Q3_K_S.gguf create mode 100644 Julia-Alpha.i1-Q4_0.gguf create mode 100644 Julia-Alpha.i1-Q4_1.gguf create mode 100644 Julia-Alpha.i1-Q4_K_M.gguf create mode 100644 Julia-Alpha.i1-Q4_K_S.gguf create mode 100644 Julia-Alpha.i1-Q5_K_M.gguf create mode 100644 Julia-Alpha.i1-Q5_K_S.gguf create mode 100644 Julia-Alpha.i1-Q6_K.gguf create mode 100644 README.md create mode 100644 imatrix.dat diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..76a8e6c --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs 
diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +Julia-Alpha.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +Julia-Alpha.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +Julia-Alpha.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +Julia-Alpha.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +Julia-Alpha.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +Julia-Alpha.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Julia-Alpha.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +Julia-Alpha.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text +Julia-Alpha.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +Julia-Alpha.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Julia-Alpha.i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +Julia-Alpha.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +Julia-Alpha.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +Julia-Alpha.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Julia-Alpha.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Julia-Alpha.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Julia-Alpha.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Julia-Alpha.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +Julia-Alpha.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +Julia-Alpha.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Julia-Alpha.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Julia-Alpha.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Julia-Alpha.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Julia-Alpha.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/Julia-Alpha.i1-IQ1_M.gguf b/Julia-Alpha.i1-IQ1_M.gguf new file mode 100644 
index 0000000..842b1f0 --- /dev/null +++ b/Julia-Alpha.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8284109c614af212facdcad74e37ba6bf0dbd66c1dc751cb03a0a0f6c72876d0 +size 1127018848 diff --git a/Julia-Alpha.i1-IQ1_S.gguf b/Julia-Alpha.i1-IQ1_S.gguf new file mode 100644 index 0000000..f3f3405 --- /dev/null +++ b/Julia-Alpha.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f14b92b7e869cdd53abfbfbf99158f7609e04723176a3428b6d74868c839cd09 +size 1055256928 diff --git a/Julia-Alpha.i1-IQ2_M.gguf b/Julia-Alpha.i1-IQ2_M.gguf new file mode 100644 index 0000000..7a77372 --- /dev/null +++ b/Julia-Alpha.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a59d43596c4f82db1aaaeededb14f4ac2e18754ffc764e691e55241095059f69 +size 1512984928 diff --git a/Julia-Alpha.i1-IQ2_S.gguf b/Julia-Alpha.i1-IQ2_S.gguf new file mode 100644 index 0000000..973b7a7 --- /dev/null +++ b/Julia-Alpha.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dd5b48380fe2748a88ee670a280152990b0b75cd1ad3172393d4eb232d3f951 +size 1417302368 diff --git a/Julia-Alpha.i1-IQ2_XS.gguf b/Julia-Alpha.i1-IQ2_XS.gguf new file mode 100644 index 0000000..ba5d15e --- /dev/null +++ b/Julia-Alpha.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be640671e7ad1fa9e31e1cd42ca4ab18437f1b2a4a71e9b1f884ee3e68fefc96 +size 1354101088 diff --git a/Julia-Alpha.i1-IQ2_XXS.gguf b/Julia-Alpha.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..e6f43d2 --- /dev/null +++ b/Julia-Alpha.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41bac02164cb20e51d990b815101bf693c74ff746b6089d045f8cef981bd6846 +size 1246622048 diff --git a/Julia-Alpha.i1-IQ3_M.gguf b/Julia-Alpha.i1-IQ3_M.gguf new file mode 100644 index 0000000..01db90e --- /dev/null +++ b/Julia-Alpha.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:b7a9ce81069a88101f477d7ccaaee65cf261957ab973c8df3f42d8e51aeeb635 +size 1962897248 diff --git a/Julia-Alpha.i1-IQ3_S.gguf b/Julia-Alpha.i1-IQ3_S.gguf new file mode 100644 index 0000000..298a8df --- /dev/null +++ b/Julia-Alpha.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c24d5c75ef9debd5450c4f85e104b55309993ee1cee4d44926047fdd617e152 +size 1899532128 diff --git a/Julia-Alpha.i1-IQ3_XS.gguf b/Julia-Alpha.i1-IQ3_XS.gguf new file mode 100644 index 0000000..da5093e --- /dev/null +++ b/Julia-Alpha.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:698939ef76cdf28d1513215d4fba511ea8167b1c84a909dd426ae144f4fce5bd +size 1814376288 diff --git a/Julia-Alpha.i1-IQ3_XXS.gguf b/Julia-Alpha.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..9ba855b --- /dev/null +++ b/Julia-Alpha.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8406d20ae478aef4e1b55d3d88b90f5ca7aea665ea4c7b23eb6aee51e059f1ee +size 1670189408 diff --git a/Julia-Alpha.i1-IQ4_NL.gguf b/Julia-Alpha.i1-IQ4_NL.gguf new file mode 100644 index 0000000..9e82876 --- /dev/null +++ b/Julia-Alpha.i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a58a9afc56d1f0ad9da162d48bf52d927bc72cf13b6af2725600511f06e7e0b7 +size 2381344608 diff --git a/Julia-Alpha.i1-IQ4_XS.gguf b/Julia-Alpha.i1-IQ4_XS.gguf new file mode 100644 index 0000000..bf9c6a0 --- /dev/null +++ b/Julia-Alpha.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9162308b5f3ffcc9a23c822fefad627ed09d54a2c21f13abd510b0c0feaf0c9e +size 2270752608 diff --git a/Julia-Alpha.i1-Q2_K.gguf b/Julia-Alpha.i1-Q2_K.gguf new file mode 100644 index 0000000..86fb951 --- /dev/null +++ b/Julia-Alpha.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e42cbb22a69072c9bf6466fcb64589e77f0f69284aa9c386d39f87de04359ef5 +size 
1669500768 diff --git a/Julia-Alpha.i1-Q2_K_S.gguf b/Julia-Alpha.i1-Q2_K_S.gguf new file mode 100644 index 0000000..1b2a8d1 --- /dev/null +++ b/Julia-Alpha.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cc7dd7e749a9f12883cb8ee478903425021aaa81e2d2e158fb4f5c713a283ef +size 1563455328 diff --git a/Julia-Alpha.i1-Q3_K_L.gguf b/Julia-Alpha.i1-Q3_K_L.gguf new file mode 100644 index 0000000..37e4256 --- /dev/null +++ b/Julia-Alpha.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1119fe985a86f089b549a6d0b08ec2801d34da0ce3fca89bc7fe3902ebaff91 +size 2239786848 diff --git a/Julia-Alpha.i1-Q3_K_M.gguf b/Julia-Alpha.i1-Q3_K_M.gguf new file mode 100644 index 0000000..b4e87e9 --- /dev/null +++ b/Julia-Alpha.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81fe301573ada2b54549dfbc1dc5dd00aa1ef7d6f73594bf784f34117912f97b +size 2075619168 diff --git a/Julia-Alpha.i1-Q3_K_S.gguf b/Julia-Alpha.i1-Q3_K_S.gguf new file mode 100644 index 0000000..4d186f1 --- /dev/null +++ b/Julia-Alpha.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9070040976533321b5aced5618e14e7bb1501ab60b9dd02e7a17373462a5fab2 +size 1886998368 diff --git a/Julia-Alpha.i1-Q4_0.gguf b/Julia-Alpha.i1-Q4_0.gguf new file mode 100644 index 0000000..d5adee2 --- /dev/null +++ b/Julia-Alpha.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:545109f5bcadd4d76defd6d3b40f8101655ccec495b028ed3f6897e23dff6bce +size 2375774048 diff --git a/Julia-Alpha.i1-Q4_1.gguf b/Julia-Alpha.i1-Q4_1.gguf new file mode 100644 index 0000000..36b3d89 --- /dev/null +++ b/Julia-Alpha.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:728d4ba7d41e720cc5b7e9ae54c92a8d1a14bc3b5041c14855e78f2506bcfcae +size 2596630368 diff --git a/Julia-Alpha.i1-Q4_K_M.gguf b/Julia-Alpha.i1-Q4_K_M.gguf new file mode 100644 index 0000000..70c3fcb --- 
/dev/null +++ b/Julia-Alpha.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f828fcd59294dcb48d5c54f7155c65beec16ef9dd7c339563bb2c8996d3c08c0 +size 2497281888 diff --git a/Julia-Alpha.i1-Q4_K_S.gguf b/Julia-Alpha.i1-Q4_K_S.gguf new file mode 100644 index 0000000..58e13bf --- /dev/null +++ b/Julia-Alpha.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a8a81773335578866d999951355de1b28c676f352a0b8bce6b2bf895966a451 +size 2383310688 diff --git a/Julia-Alpha.i1-Q5_K_M.gguf b/Julia-Alpha.i1-Q5_K_M.gguf new file mode 100644 index 0000000..22e3bce --- /dev/null +++ b/Julia-Alpha.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67144bf58ebf343f8ed98bb3fecca0b9ea3d9e20995dd00b84da6c782aece361 +size 2889514848 diff --git a/Julia-Alpha.i1-Q5_K_S.gguf b/Julia-Alpha.i1-Q5_K_S.gguf new file mode 100644 index 0000000..e383043 --- /dev/null +++ b/Julia-Alpha.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41f98ba792e220f3c8ae112737897abe2de679d31ca6ecc4203c6412487718a4 +size 2823712608 diff --git a/Julia-Alpha.i1-Q6_K.gguf b/Julia-Alpha.i1-Q6_K.gguf new file mode 100644 index 0000000..da54946 --- /dev/null +++ b/Julia-Alpha.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4630f7e3b71d083eab5cfbfa21b8e84918e413d3b3d93e3b472163a9f00663c +size 3306262368 diff --git a/README.md b/README.md new file mode 100644 index 0000000..47a9924 --- /dev/null +++ b/README.md @@ -0,0 +1,83 @@ +--- +base_model: test1234124/Julia-Alpha +datasets: +- TensorLabsAI/SolAgentS +language: +- en +library_name: transformers +license: apache-2.0 +mradermacher: + readme_rev: 1 +quantized_by: mradermacher +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/test1234124/Julia-Alpha + + + +***For a convenient overview and download list, visit our [model page for this 
model](https://hf.tst.eu/model#Julia-Alpha-i1-GGUF).*** + +static quants are available at https://huggingface.co/mradermacher/Julia-Alpha-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/Julia-Alpha-i1-GGUF/resolve/main/Julia-Alpha.i1-IQ1_S.gguf) | i1-IQ1_S | 1.2 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/Julia-Alpha-i1-GGUF/resolve/main/Julia-Alpha.i1-IQ1_M.gguf) | i1-IQ1_M | 1.2 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/Julia-Alpha-i1-GGUF/resolve/main/Julia-Alpha.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 1.3 | | +| [GGUF](https://huggingface.co/mradermacher/Julia-Alpha-i1-GGUF/resolve/main/Julia-Alpha.i1-IQ2_XS.gguf) | i1-IQ2_XS | 1.5 | | +| [GGUF](https://huggingface.co/mradermacher/Julia-Alpha-i1-GGUF/resolve/main/Julia-Alpha.i1-IQ2_S.gguf) | i1-IQ2_S | 1.5 | | +| [GGUF](https://huggingface.co/mradermacher/Julia-Alpha-i1-GGUF/resolve/main/Julia-Alpha.i1-IQ2_M.gguf) | i1-IQ2_M | 1.6 | | +| [GGUF](https://huggingface.co/mradermacher/Julia-Alpha-i1-GGUF/resolve/main/Julia-Alpha.i1-Q2_K_S.gguf) | i1-Q2_K_S | 1.7 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/Julia-Alpha-i1-GGUF/resolve/main/Julia-Alpha.i1-Q2_K.gguf) | i1-Q2_K | 1.8 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/Julia-Alpha-i1-GGUF/resolve/main/Julia-Alpha.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 1.8 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/Julia-Alpha-i1-GGUF/resolve/main/Julia-Alpha.i1-IQ3_XS.gguf) | i1-IQ3_XS | 1.9 | | +| 
[GGUF](https://huggingface.co/mradermacher/Julia-Alpha-i1-GGUF/resolve/main/Julia-Alpha.i1-Q3_K_S.gguf) | i1-Q3_K_S | 2.0 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/Julia-Alpha-i1-GGUF/resolve/main/Julia-Alpha.i1-IQ3_S.gguf) | i1-IQ3_S | 2.0 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/Julia-Alpha-i1-GGUF/resolve/main/Julia-Alpha.i1-IQ3_M.gguf) | i1-IQ3_M | 2.1 | | +| [GGUF](https://huggingface.co/mradermacher/Julia-Alpha-i1-GGUF/resolve/main/Julia-Alpha.i1-Q3_K_M.gguf) | i1-Q3_K_M | 2.2 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/Julia-Alpha-i1-GGUF/resolve/main/Julia-Alpha.i1-Q3_K_L.gguf) | i1-Q3_K_L | 2.3 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/Julia-Alpha-i1-GGUF/resolve/main/Julia-Alpha.i1-IQ4_XS.gguf) | i1-IQ4_XS | 2.4 | | +| [GGUF](https://huggingface.co/mradermacher/Julia-Alpha-i1-GGUF/resolve/main/Julia-Alpha.i1-Q4_0.gguf) | i1-Q4_0 | 2.5 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/Julia-Alpha-i1-GGUF/resolve/main/Julia-Alpha.i1-IQ4_NL.gguf) | i1-IQ4_NL | 2.5 | prefer IQ4_XS | +| [GGUF](https://huggingface.co/mradermacher/Julia-Alpha-i1-GGUF/resolve/main/Julia-Alpha.i1-Q4_K_S.gguf) | i1-Q4_K_S | 2.5 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/Julia-Alpha-i1-GGUF/resolve/main/Julia-Alpha.i1-Q4_K_M.gguf) | i1-Q4_K_M | 2.6 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/Julia-Alpha-i1-GGUF/resolve/main/Julia-Alpha.i1-Q4_1.gguf) | i1-Q4_1 | 2.7 | | +| [GGUF](https://huggingface.co/mradermacher/Julia-Alpha-i1-GGUF/resolve/main/Julia-Alpha.i1-Q5_K_S.gguf) | i1-Q5_K_S | 2.9 | | +| [GGUF](https://huggingface.co/mradermacher/Julia-Alpha-i1-GGUF/resolve/main/Julia-Alpha.i1-Q5_K_M.gguf) | i1-Q5_K_M | 3.0 | | +| [GGUF](https://huggingface.co/mradermacher/Julia-Alpha-i1-GGUF/resolve/main/Julia-Alpha.i1-Q6_K.gguf) | i1-Q6_K | 3.4 | practically like static Q6_K | + +Here is a handy graph by 
ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for answers to +questions you might have, or to request that another model be quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..e675c37 --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07cd111b8cda7c24d789415710e4a17bcf0a6e47484fa860b0981b5242934d4d +size 3842209