commit 5e4d7956f1789f7bac6afa8db2f486ec6fbb5136 Author: ModelHub XC Date: Mon May 11 10:40:39 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/EXAONE-3.0-7.8B-Instruct-i1-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..465dd6f --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +EXAONE-3.0-7.8B-Instruct.i1-Q2_K.gguf 
filter=lfs diff=lfs merge=lfs -text +EXAONE-3.0-7.8B-Instruct.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +EXAONE-3.0-7.8B-Instruct.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +EXAONE-3.0-7.8B-Instruct.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +EXAONE-3.0-7.8B-Instruct.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +EXAONE-3.0-7.8B-Instruct.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +EXAONE-3.0-7.8B-Instruct.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +EXAONE-3.0-7.8B-Instruct.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +EXAONE-3.0-7.8B-Instruct.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +EXAONE-3.0-7.8B-Instruct.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +EXAONE-3.0-7.8B-Instruct.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +EXAONE-3.0-7.8B-Instruct.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +EXAONE-3.0-7.8B-Instruct.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +EXAONE-3.0-7.8B-Instruct.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +EXAONE-3.0-7.8B-Instruct.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +EXAONE-3.0-7.8B-Instruct.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +EXAONE-3.0-7.8B-Instruct.i1-Q4_0_4_4.gguf filter=lfs diff=lfs merge=lfs -text +EXAONE-3.0-7.8B-Instruct.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +EXAONE-3.0-7.8B-Instruct.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +EXAONE-3.0-7.8B-Instruct.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +EXAONE-3.0-7.8B-Instruct.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +EXAONE-3.0-7.8B-Instruct.i1-Q4_0_4_8.gguf filter=lfs diff=lfs merge=lfs -text +EXAONE-3.0-7.8B-Instruct.i1-Q4_0_8_8.gguf filter=lfs diff=lfs merge=lfs -text +EXAONE-3.0-7.8B-Instruct.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/EXAONE-3.0-7.8B-Instruct.i1-IQ1_M.gguf b/EXAONE-3.0-7.8B-Instruct.i1-IQ1_M.gguf new file mode 100644 index 0000000..b9dfc79 --- /dev/null +++ 
b/EXAONE-3.0-7.8B-Instruct.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36fddac459dfb47fa9ff7fe19cd153a325d515a44c4dd0d8378a2a285aa398d1 +size 2050775328 diff --git a/EXAONE-3.0-7.8B-Instruct.i1-IQ1_S.gguf b/EXAONE-3.0-7.8B-Instruct.i1-IQ1_S.gguf new file mode 100644 index 0000000..833abcb --- /dev/null +++ b/EXAONE-3.0-7.8B-Instruct.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d9afa5273d78203ac1cdbeb5e850688cac6facab411f808852893d1dff09c5c +size 1908431136 diff --git a/EXAONE-3.0-7.8B-Instruct.i1-IQ2_M.gguf b/EXAONE-3.0-7.8B-Instruct.i1-IQ2_M.gguf new file mode 100644 index 0000000..52915c0 --- /dev/null +++ b/EXAONE-3.0-7.8B-Instruct.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dac286523c8838bee303c157331c1304bc55ab6b3ccbe4affebb165219784016 +size 2826328352 diff --git a/EXAONE-3.0-7.8B-Instruct.i1-IQ2_S.gguf b/EXAONE-3.0-7.8B-Instruct.i1-IQ2_S.gguf new file mode 100644 index 0000000..c6d7fae --- /dev/null +++ b/EXAONE-3.0-7.8B-Instruct.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39c0666489dc9f6169f198dcba83ddf3869466289b311348012df268e0310a06 +size 2636536096 diff --git a/EXAONE-3.0-7.8B-Instruct.i1-IQ2_XS.gguf b/EXAONE-3.0-7.8B-Instruct.i1-IQ2_XS.gguf new file mode 100644 index 0000000..e8e3202 --- /dev/null +++ b/EXAONE-3.0-7.8B-Instruct.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:933f6e43fbbfa7e38337dc662f805e32009599c5144a965d84ac5ce51cd36092 +size 2494585120 diff --git a/EXAONE-3.0-7.8B-Instruct.i1-IQ2_XXS.gguf b/EXAONE-3.0-7.8B-Instruct.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..a7adca4 --- /dev/null +++ b/EXAONE-3.0-7.8B-Instruct.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55c9a2b4ee18fb8014f91e30f9f5d7d0a02def71664ee0e1188a1b32cba48eb2 +size 2288015648 diff --git 
a/EXAONE-3.0-7.8B-Instruct.i1-IQ3_M.gguf b/EXAONE-3.0-7.8B-Instruct.i1-IQ3_M.gguf new file mode 100644 index 0000000..5161af1 --- /dev/null +++ b/EXAONE-3.0-7.8B-Instruct.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:316b126b9b4398467bd2ba88ca05889f814580b998358b116ec4c599fca5c9a2 +size 3648805152 diff --git a/EXAONE-3.0-7.8B-Instruct.i1-IQ3_S.gguf b/EXAONE-3.0-7.8B-Instruct.i1-IQ3_S.gguf new file mode 100644 index 0000000..033422d --- /dev/null +++ b/EXAONE-3.0-7.8B-Instruct.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51ae849c0df1b62b02b9bc633faf5a0c24a00c44eb0acafae67fb17da841161d +size 3546306848 diff --git a/EXAONE-3.0-7.8B-Instruct.i1-IQ3_XS.gguf b/EXAONE-3.0-7.8B-Instruct.i1-IQ3_XS.gguf new file mode 100644 index 0000000..3b707ab --- /dev/null +++ b/EXAONE-3.0-7.8B-Instruct.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cc5d9cdae7eb8f9bf6ec83861824b6ad8f25918809ce7152a2662be032bff7d +size 3382728992 diff --git a/EXAONE-3.0-7.8B-Instruct.i1-IQ3_XXS.gguf b/EXAONE-3.0-7.8B-Instruct.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..57af55c --- /dev/null +++ b/EXAONE-3.0-7.8B-Instruct.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3650f00a2beae08d7b45acbfb062f2e37854746409c131fbbcab438870b9821d +size 3152959776 diff --git a/EXAONE-3.0-7.8B-Instruct.i1-IQ4_XS.gguf b/EXAONE-3.0-7.8B-Instruct.i1-IQ4_XS.gguf new file mode 100644 index 0000000..8f3c18d --- /dev/null +++ b/EXAONE-3.0-7.8B-Instruct.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0d6f03a7b402cd7ee200c24db65f32169bd433dd060fabba1006ecdf05c4709 +size 4300888352 diff --git a/EXAONE-3.0-7.8B-Instruct.i1-Q2_K.gguf b/EXAONE-3.0-7.8B-Instruct.i1-Q2_K.gguf new file mode 100644 index 0000000..bcc6c55 --- /dev/null +++ b/EXAONE-3.0-7.8B-Instruct.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:231a2c9d2345ed7fef2cab3583087ab0146d1d03fd8f94ad30f2e4a66cbb3a27 +size 3053869344 diff --git a/EXAONE-3.0-7.8B-Instruct.i1-Q3_K_L.gguf b/EXAONE-3.0-7.8B-Instruct.i1-Q3_K_L.gguf new file mode 100644 index 0000000..5c40d0f --- /dev/null +++ b/EXAONE-3.0-7.8B-Instruct.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e558a492fa517b1a9a02144d4f8eeacc9ba792242bf3fc5b970c11295841fbd +size 4185938208 diff --git a/EXAONE-3.0-7.8B-Instruct.i1-Q3_K_M.gguf b/EXAONE-3.0-7.8B-Instruct.i1-Q3_K_M.gguf new file mode 100644 index 0000000..75951a7 --- /dev/null +++ b/EXAONE-3.0-7.8B-Instruct.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9f24fa8e9b8cd5a1d10eae5ad8d5e1ef117c147725ae33dc90092c54e705db1 +size 3882899744 diff --git a/EXAONE-3.0-7.8B-Instruct.i1-Q3_K_S.gguf b/EXAONE-3.0-7.8B-Instruct.i1-Q3_K_S.gguf new file mode 100644 index 0000000..f778686 --- /dev/null +++ b/EXAONE-3.0-7.8B-Instruct.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d2fe34f5b874e7ab641d88e0b47b78d94390b0943ffb3ab6e93d3e3899ec419 +size 3528481056 diff --git a/EXAONE-3.0-7.8B-Instruct.i1-Q4_0.gguf b/EXAONE-3.0-7.8B-Instruct.i1-Q4_0.gguf new file mode 100644 index 0000000..d4c835c --- /dev/null +++ b/EXAONE-3.0-7.8B-Instruct.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccb32e05f1f5cb15b919db0e2e9897fe936da1da5904ca3c713f637e3e49c987 +size 4525807904 diff --git a/EXAONE-3.0-7.8B-Instruct.i1-Q4_0_4_4.gguf b/EXAONE-3.0-7.8B-Instruct.i1-Q4_0_4_4.gguf new file mode 100644 index 0000000..3facb0c --- /dev/null +++ b/EXAONE-3.0-7.8B-Instruct.i1-Q4_0_4_4.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e928a09452dd0d926683797a648c873902ebefa56e46bd502e13611fd26b120b +size 4511127840 diff --git a/EXAONE-3.0-7.8B-Instruct.i1-Q4_0_4_8.gguf b/EXAONE-3.0-7.8B-Instruct.i1-Q4_0_4_8.gguf new 
file mode 100644 index 0000000..28e959c --- /dev/null +++ b/EXAONE-3.0-7.8B-Instruct.i1-Q4_0_4_8.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90c7d86f628fee47ae05f084dcfadc19ad1e145b7147887b8e553e9cac6404e2 +size 4511127840 diff --git a/EXAONE-3.0-7.8B-Instruct.i1-Q4_0_8_8.gguf b/EXAONE-3.0-7.8B-Instruct.i1-Q4_0_8_8.gguf new file mode 100644 index 0000000..d160f35 --- /dev/null +++ b/EXAONE-3.0-7.8B-Instruct.i1-Q4_0_8_8.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3437a4a57c8bb12b99627ec95c18dd44d12c7a73596bdc3e9e3568910a39e5ff +size 4511127840 diff --git a/EXAONE-3.0-7.8B-Instruct.i1-Q4_K_M.gguf b/EXAONE-3.0-7.8B-Instruct.i1-Q4_K_M.gguf new file mode 100644 index 0000000..2714847 --- /dev/null +++ b/EXAONE-3.0-7.8B-Instruct.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1e3dcb8fe069bb38e68ccdfb1651eb4f94fd68f0c8272645de6c41a8191acc3 +size 4770650400 diff --git a/EXAONE-3.0-7.8B-Instruct.i1-Q4_K_S.gguf b/EXAONE-3.0-7.8B-Instruct.i1-Q4_K_S.gguf new file mode 100644 index 0000000..3e9e1c3 --- /dev/null +++ b/EXAONE-3.0-7.8B-Instruct.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:876abed8741f5e07e6b5ad396260128c6a3ebd4ccfadaa2d08d9544a1442a605 +size 4542585120 diff --git a/EXAONE-3.0-7.8B-Instruct.i1-Q5_K_M.gguf b/EXAONE-3.0-7.8B-Instruct.i1-Q5_K_M.gguf new file mode 100644 index 0000000..55ac515 --- /dev/null +++ b/EXAONE-3.0-7.8B-Instruct.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:590f49b50a0e79da89a937331f5106ba41d18e4a425b5202886837770a5114b8 +size 5569665312 diff --git a/EXAONE-3.0-7.8B-Instruct.i1-Q5_K_S.gguf b/EXAONE-3.0-7.8B-Instruct.i1-Q5_K_S.gguf new file mode 100644 index 0000000..9906e87 --- /dev/null +++ b/EXAONE-3.0-7.8B-Instruct.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:8b805b8f09faace3f2da2cba0b51971897846954fbf33a09cc250eb2f9385b68 +size 5435971872 diff --git a/EXAONE-3.0-7.8B-Instruct.i1-Q6_K.gguf b/EXAONE-3.0-7.8B-Instruct.i1-Q6_K.gguf new file mode 100644 index 0000000..e3c544f --- /dev/null +++ b/EXAONE-3.0-7.8B-Instruct.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02de1168296cd0860b042afb7cb10bd72adfd17a24cf056a5debf6cc6177d664 +size 6418618656 diff --git a/README.md b/README.md new file mode 100644 index 0000000..6a98c88 --- /dev/null +++ b/README.md @@ -0,0 +1,82 @@ +--- +base_model: LGAI-EXAONE/EXAONE-3.0-7.8B-Instruct +language: +- en +- ko +library_name: transformers +license: other +license_link: LICENSE +license_name: exaone +quantized_by: mradermacher +tags: +- lg-ai +- exaone +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/LGAI-EXAONE/EXAONE-3.0-7.8B-Instruct + + +static quants are available at https://huggingface.co/mradermacher/EXAONE-3.0-7.8B-Instruct-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. 
IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/EXAONE-3.0-7.8B-Instruct-i1-GGUF/resolve/main/EXAONE-3.0-7.8B-Instruct.i1-IQ1_S.gguf) | i1-IQ1_S | 2.0 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/EXAONE-3.0-7.8B-Instruct-i1-GGUF/resolve/main/EXAONE-3.0-7.8B-Instruct.i1-IQ1_M.gguf) | i1-IQ1_M | 2.2 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/EXAONE-3.0-7.8B-Instruct-i1-GGUF/resolve/main/EXAONE-3.0-7.8B-Instruct.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 2.4 | | +| [GGUF](https://huggingface.co/mradermacher/EXAONE-3.0-7.8B-Instruct-i1-GGUF/resolve/main/EXAONE-3.0-7.8B-Instruct.i1-IQ2_XS.gguf) | i1-IQ2_XS | 2.6 | | +| [GGUF](https://huggingface.co/mradermacher/EXAONE-3.0-7.8B-Instruct-i1-GGUF/resolve/main/EXAONE-3.0-7.8B-Instruct.i1-IQ2_S.gguf) | i1-IQ2_S | 2.7 | | +| [GGUF](https://huggingface.co/mradermacher/EXAONE-3.0-7.8B-Instruct-i1-GGUF/resolve/main/EXAONE-3.0-7.8B-Instruct.i1-IQ2_M.gguf) | i1-IQ2_M | 2.9 | | +| [GGUF](https://huggingface.co/mradermacher/EXAONE-3.0-7.8B-Instruct-i1-GGUF/resolve/main/EXAONE-3.0-7.8B-Instruct.i1-Q2_K.gguf) | i1-Q2_K | 3.2 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/EXAONE-3.0-7.8B-Instruct-i1-GGUF/resolve/main/EXAONE-3.0-7.8B-Instruct.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 3.3 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/EXAONE-3.0-7.8B-Instruct-i1-GGUF/resolve/main/EXAONE-3.0-7.8B-Instruct.i1-IQ3_XS.gguf) | i1-IQ3_XS | 3.5 | | +| [GGUF](https://huggingface.co/mradermacher/EXAONE-3.0-7.8B-Instruct-i1-GGUF/resolve/main/EXAONE-3.0-7.8B-Instruct.i1-Q3_K_S.gguf) | i1-Q3_K_S | 3.6 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/EXAONE-3.0-7.8B-Instruct-i1-GGUF/resolve/main/EXAONE-3.0-7.8B-Instruct.i1-IQ3_S.gguf) | i1-IQ3_S | 3.6 | beats Q3_K* | +| 
[GGUF](https://huggingface.co/mradermacher/EXAONE-3.0-7.8B-Instruct-i1-GGUF/resolve/main/EXAONE-3.0-7.8B-Instruct.i1-IQ3_M.gguf) | i1-IQ3_M | 3.7 | | +| [GGUF](https://huggingface.co/mradermacher/EXAONE-3.0-7.8B-Instruct-i1-GGUF/resolve/main/EXAONE-3.0-7.8B-Instruct.i1-Q3_K_M.gguf) | i1-Q3_K_M | 4.0 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/EXAONE-3.0-7.8B-Instruct-i1-GGUF/resolve/main/EXAONE-3.0-7.8B-Instruct.i1-Q3_K_L.gguf) | i1-Q3_K_L | 4.3 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/EXAONE-3.0-7.8B-Instruct-i1-GGUF/resolve/main/EXAONE-3.0-7.8B-Instruct.i1-IQ4_XS.gguf) | i1-IQ4_XS | 4.4 | | +| [GGUF](https://huggingface.co/mradermacher/EXAONE-3.0-7.8B-Instruct-i1-GGUF/resolve/main/EXAONE-3.0-7.8B-Instruct.i1-Q4_0_4_4.gguf) | i1-Q4_0_4_4 | 4.6 | fast on arm, low quality | +| [GGUF](https://huggingface.co/mradermacher/EXAONE-3.0-7.8B-Instruct-i1-GGUF/resolve/main/EXAONE-3.0-7.8B-Instruct.i1-Q4_0_4_8.gguf) | i1-Q4_0_4_8 | 4.6 | fast on arm+i8mm, low quality | +| [GGUF](https://huggingface.co/mradermacher/EXAONE-3.0-7.8B-Instruct-i1-GGUF/resolve/main/EXAONE-3.0-7.8B-Instruct.i1-Q4_0_8_8.gguf) | i1-Q4_0_8_8 | 4.6 | fast on arm+sve, low quality | +| [GGUF](https://huggingface.co/mradermacher/EXAONE-3.0-7.8B-Instruct-i1-GGUF/resolve/main/EXAONE-3.0-7.8B-Instruct.i1-Q4_0.gguf) | i1-Q4_0 | 4.6 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/EXAONE-3.0-7.8B-Instruct-i1-GGUF/resolve/main/EXAONE-3.0-7.8B-Instruct.i1-Q4_K_S.gguf) | i1-Q4_K_S | 4.6 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/EXAONE-3.0-7.8B-Instruct-i1-GGUF/resolve/main/EXAONE-3.0-7.8B-Instruct.i1-Q4_K_M.gguf) | i1-Q4_K_M | 4.9 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/EXAONE-3.0-7.8B-Instruct-i1-GGUF/resolve/main/EXAONE-3.0-7.8B-Instruct.i1-Q5_K_S.gguf) | i1-Q5_K_S | 5.5 | | +| 
[GGUF](https://huggingface.co/mradermacher/EXAONE-3.0-7.8B-Instruct-i1-GGUF/resolve/main/EXAONE-3.0-7.8B-Instruct.i1-Q5_K_M.gguf) | i1-Q5_K_M | 5.7 | | +| [GGUF](https://huggingface.co/mradermacher/EXAONE-3.0-7.8B-Instruct-i1-GGUF/resolve/main/EXAONE-3.0-7.8B-Instruct.i1-Q6_K.gguf) | i1-Q6_K | 6.5 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for answers to +common questions, or to request that another model be quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and for providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..7d545af --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df5d275df0b062c3319edbfb370f6ceecddb6c19d453dceb09c9ef23accffd7e +size 4988157