commit 5fba688a2b7b22aa5a0e4d96ea4490f5bbaae0f0 Author: ModelHub XC Date: Sat May 9 06:44:47 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/EZO2.5-gemma-3-12b-it-Preview-i1-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..abaafe6 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text 
+EZO2.5-gemma-3-12b-it-Preview.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +EZO2.5-gemma-3-12b-it-Preview.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +EZO2.5-gemma-3-12b-it-Preview.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +EZO2.5-gemma-3-12b-it-Preview.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +EZO2.5-gemma-3-12b-it-Preview.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +EZO2.5-gemma-3-12b-it-Preview.i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +EZO2.5-gemma-3-12b-it-Preview.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +EZO2.5-gemma-3-12b-it-Preview.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +EZO2.5-gemma-3-12b-it-Preview.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +EZO2.5-gemma-3-12b-it-Preview.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +EZO2.5-gemma-3-12b-it-Preview.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +EZO2.5-gemma-3-12b-it-Preview.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +EZO2.5-gemma-3-12b-it-Preview.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +EZO2.5-gemma-3-12b-it-Preview.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +EZO2.5-gemma-3-12b-it-Preview.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +EZO2.5-gemma-3-12b-it-Preview.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +EZO2.5-gemma-3-12b-it-Preview.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +EZO2.5-gemma-3-12b-it-Preview.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +EZO2.5-gemma-3-12b-it-Preview.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +EZO2.5-gemma-3-12b-it-Preview.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +EZO2.5-gemma-3-12b-it-Preview.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +EZO2.5-gemma-3-12b-it-Preview.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +EZO2.5-gemma-3-12b-it-Preview.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +EZO2.5-gemma-3-12b-it-Preview.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text diff --git 
a/EZO2.5-gemma-3-12b-it-Preview.i1-IQ1_M.gguf b/EZO2.5-gemma-3-12b-it-Preview.i1-IQ1_M.gguf new file mode 100644 index 0000000..d7cdd9d --- /dev/null +++ b/EZO2.5-gemma-3-12b-it-Preview.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23fbaba2aa5a76216a8fe37ecaa86f494ce4b76e6f0aa998f4a3c88a684ba41d +size 3164728608 diff --git a/EZO2.5-gemma-3-12b-it-Preview.i1-IQ1_S.gguf b/EZO2.5-gemma-3-12b-it-Preview.i1-IQ1_S.gguf new file mode 100644 index 0000000..229fd05 --- /dev/null +++ b/EZO2.5-gemma-3-12b-it-Preview.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebbcdad7c38b337fccc31a54037703d42b2274826b98a3f85a9c23a35a7f718b +size 2947415328 diff --git a/EZO2.5-gemma-3-12b-it-Preview.i1-IQ2_M.gguf b/EZO2.5-gemma-3-12b-it-Preview.i1-IQ2_M.gguf new file mode 100644 index 0000000..42ab004 --- /dev/null +++ b/EZO2.5-gemma-3-12b-it-Preview.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e09c57f0289c3ebcdbd57a91dcd6a32c96890623e230540da19cdc2ad635facd +size 4310461728 diff --git a/EZO2.5-gemma-3-12b-it-Preview.i1-IQ2_S.gguf b/EZO2.5-gemma-3-12b-it-Preview.i1-IQ2_S.gguf new file mode 100644 index 0000000..19b514f --- /dev/null +++ b/EZO2.5-gemma-3-12b-it-Preview.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbbe02849710af5541492449f412ecd7636c41f95086e92ab615bc205403257b +size 4020710688 diff --git a/EZO2.5-gemma-3-12b-it-Preview.i1-IQ2_XS.gguf b/EZO2.5-gemma-3-12b-it-Preview.i1-IQ2_XS.gguf new file mode 100644 index 0000000..8712107 --- /dev/null +++ b/EZO2.5-gemma-3-12b-it-Preview.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:182fdc38c4fc7cc2930ba94b3e0f2feb98a6cd33a199c0d5cb14931caaab109e +size 3840261408 diff --git a/EZO2.5-gemma-3-12b-it-Preview.i1-IQ2_XXS.gguf b/EZO2.5-gemma-3-12b-it-Preview.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..5d7a67a --- /dev/null +++ 
b/EZO2.5-gemma-3-12b-it-Preview.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6938f7f355346046ab596cf971159bab033ede63a037455bf487318fe1347591 +size 3526917408 diff --git a/EZO2.5-gemma-3-12b-it-Preview.i1-IQ3_M.gguf b/EZO2.5-gemma-3-12b-it-Preview.i1-IQ3_M.gguf new file mode 100644 index 0000000..f0f296f --- /dev/null +++ b/EZO2.5-gemma-3-12b-it-Preview.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89803bc1cbcf47158758b91485f2150230deef210f0890dcfcd959d0b7a12c86 +size 5655723168 diff --git a/EZO2.5-gemma-3-12b-it-Preview.i1-IQ3_S.gguf b/EZO2.5-gemma-3-12b-it-Preview.i1-IQ3_S.gguf new file mode 100644 index 0000000..be47a68 --- /dev/null +++ b/EZO2.5-gemma-3-12b-it-Preview.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48c4079a9dd55b3ebd8d156096b360451187c7c2009dfdc4b8839c135cbc825b +size 5458316448 diff --git a/EZO2.5-gemma-3-12b-it-Preview.i1-IQ3_XS.gguf b/EZO2.5-gemma-3-12b-it-Preview.i1-IQ3_XS.gguf new file mode 100644 index 0000000..0663bac --- /dev/null +++ b/EZO2.5-gemma-3-12b-it-Preview.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a4078f06b434431d1586105a927d26839d9291b3ddc5ae74a2abd6add084715 +size 5206166688 diff --git a/EZO2.5-gemma-3-12b-it-Preview.i1-IQ3_XXS.gguf b/EZO2.5-gemma-3-12b-it-Preview.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..611683e --- /dev/null +++ b/EZO2.5-gemma-3-12b-it-Preview.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90be99b2679337965623bbfd7dbecfc59b2128b47b376cedee8e512cc71f507c +size 4784901408 diff --git a/EZO2.5-gemma-3-12b-it-Preview.i1-IQ4_NL.gguf b/EZO2.5-gemma-3-12b-it-Preview.i1-IQ4_NL.gguf new file mode 100644 index 0000000..d017536 --- /dev/null +++ b/EZO2.5-gemma-3-12b-it-Preview.i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:faab3e1d1102f1fc7389fe0cd2c5e314bbc0239c5fc391f2843b36ab24546fc4 +size 6887165088 diff --git a/EZO2.5-gemma-3-12b-it-Preview.i1-IQ4_XS.gguf b/EZO2.5-gemma-3-12b-it-Preview.i1-IQ4_XS.gguf new file mode 100644 index 0000000..4ea5327 --- /dev/null +++ b/EZO2.5-gemma-3-12b-it-Preview.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10a342849fb2c626391487d862f9bb035338567243380358a288e23adf3e437a +size 6550965408 diff --git a/EZO2.5-gemma-3-12b-it-Preview.i1-Q2_K.gguf b/EZO2.5-gemma-3-12b-it-Preview.i1-Q2_K.gguf new file mode 100644 index 0000000..fa06e8e --- /dev/null +++ b/EZO2.5-gemma-3-12b-it-Preview.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2c4ff347e876a2295a59f7ffe4a5a582392e0f6270e20bea214075454812b59 +size 4768222368 diff --git a/EZO2.5-gemma-3-12b-it-Preview.i1-Q2_K_S.gguf b/EZO2.5-gemma-3-12b-it-Preview.i1-Q2_K_S.gguf new file mode 100644 index 0000000..1a03644 --- /dev/null +++ b/EZO2.5-gemma-3-12b-it-Preview.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:541a31f7f102ea8458d12cd33c93cfda218ee461acc375eb0d8ceda924dfd471 +size 4448611488 diff --git a/EZO2.5-gemma-3-12b-it-Preview.i1-Q3_K_L.gguf b/EZO2.5-gemma-3-12b-it-Preview.i1-Q3_K_L.gguf new file mode 100644 index 0000000..92be568 --- /dev/null +++ b/EZO2.5-gemma-3-12b-it-Preview.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e58983fe50ed1a22573163646f32326a420d8de5f55259ba5a02365a2f3475b +size 6480186528 diff --git a/EZO2.5-gemma-3-12b-it-Preview.i1-Q3_K_M.gguf b/EZO2.5-gemma-3-12b-it-Preview.i1-Q3_K_M.gguf new file mode 100644 index 0000000..8fdf639 --- /dev/null +++ b/EZO2.5-gemma-3-12b-it-Preview.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:719cffae1ad67c92721d3273a4a881644823222a5a11a1cb717bb4cc7f3fa1d3 +size 6008818848 diff --git a/EZO2.5-gemma-3-12b-it-Preview.i1-Q3_K_S.gguf 
b/EZO2.5-gemma-3-12b-it-Preview.i1-Q3_K_S.gguf new file mode 100644 index 0000000..75825e7 --- /dev/null +++ b/EZO2.5-gemma-3-12b-it-Preview.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5791c419bf8fe46160bb75ce838c8fb639ee099ff0dc965e8bcc884a02f8918e +size 5458316448 diff --git a/EZO2.5-gemma-3-12b-it-Preview.i1-Q4_0.gguf b/EZO2.5-gemma-3-12b-it-Preview.i1-Q4_0.gguf new file mode 100644 index 0000000..37fec74 --- /dev/null +++ b/EZO2.5-gemma-3-12b-it-Preview.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fc6f6c873a8d2cada48e00d161be05c1ad5cc9c84fbc393dcea05cb9363f7ca +size 6909283488 diff --git a/EZO2.5-gemma-3-12b-it-Preview.i1-Q4_1.gguf b/EZO2.5-gemma-3-12b-it-Preview.i1-Q4_1.gguf new file mode 100644 index 0000000..a1f7640 --- /dev/null +++ b/EZO2.5-gemma-3-12b-it-Preview.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3618a34a69f29607806a9ffe4b5f04ead80e6a490d473ee288fa388796ea0b7 +size 7559564448 diff --git a/EZO2.5-gemma-3-12b-it-Preview.i1-Q4_K_M.gguf b/EZO2.5-gemma-3-12b-it-Preview.i1-Q4_K_M.gguf new file mode 100644 index 0000000..c5d5bce --- /dev/null +++ b/EZO2.5-gemma-3-12b-it-Preview.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c27e95e7238383fef81a2de3ae262adf67ba01dc7896592637607a903a3eab4 +size 7300779168 diff --git a/EZO2.5-gemma-3-12b-it-Preview.i1-Q4_K_S.gguf b/EZO2.5-gemma-3-12b-it-Preview.i1-Q4_K_S.gguf new file mode 100644 index 0000000..79f31cf --- /dev/null +++ b/EZO2.5-gemma-3-12b-it-Preview.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b2db7152402822fd4b4c53605a0717660fa705f0a877e25300750fa10a6863f +size 6935334048 diff --git a/EZO2.5-gemma-3-12b-it-Preview.i1-Q5_K_M.gguf b/EZO2.5-gemma-3-12b-it-Preview.i1-Q5_K_M.gguf new file mode 100644 index 0000000..6507261 --- /dev/null +++ b/EZO2.5-gemma-3-12b-it-Preview.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ 
+version https://git-lfs.github.com/spec/v1 +oid sha256:532b3e1fb57eea9a73394bb2479d1da05c615ac00e62ff829201ce87d0db434b +size 8445037728 diff --git a/EZO2.5-gemma-3-12b-it-Preview.i1-Q5_K_S.gguf b/EZO2.5-gemma-3-12b-it-Preview.i1-Q5_K_S.gguf new file mode 100644 index 0000000..b8aae92 --- /dev/null +++ b/EZO2.5-gemma-3-12b-it-Preview.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4a42d7f03ad7c934aef0de8bd4bef49c595b8761fe3fd813742aed3dfb33bfc +size 8231963808 diff --git a/EZO2.5-gemma-3-12b-it-Preview.i1-Q6_K.gguf b/EZO2.5-gemma-3-12b-it-Preview.i1-Q6_K.gguf new file mode 100644 index 0000000..bd4e2e8 --- /dev/null +++ b/EZO2.5-gemma-3-12b-it-Preview.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b7420652f7cffc5033d68cc3416d215278682812efd3f4a4641b495a012e2cc +size 9660812448 diff --git a/README.md b/README.md new file mode 100644 index 0000000..528b4c3 --- /dev/null +++ b/README.md @@ -0,0 +1,87 @@ +--- +base_model: AXCXEPT/EZO2.5-gemma-3-12b-it-Preview +language: +- ja +library_name: transformers +license: gemma +mradermacher: + readme_rev: 1 +quantized_by: mradermacher +tags: +- gemma-3 +- japanese +- text-generation +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/AXCXEPT/EZO2.5-gemma-3-12b-it-Preview + + + +***For a convenient overview and download list, visit our [model page for this model](https://hf.tst.eu/model#EZO2.5-gemma-3-12b-it-Preview-i1-GGUF).*** + +static quants are available at https://huggingface.co/mradermacher/EZO2.5-gemma-3-12b-it-Preview-GGUF + +**This is a vision model - mmproj files (if any) will be in the [static repository](https://huggingface.co/mradermacher/EZO2.5-gemma-3-12b-it-Preview-GGUF).** +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. 
+ +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similarly sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/EZO2.5-gemma-3-12b-it-Preview-i1-GGUF/resolve/main/EZO2.5-gemma-3-12b-it-Preview.i1-IQ1_S.gguf) | i1-IQ1_S | 3.0 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/EZO2.5-gemma-3-12b-it-Preview-i1-GGUF/resolve/main/EZO2.5-gemma-3-12b-it-Preview.i1-IQ1_M.gguf) | i1-IQ1_M | 3.3 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/EZO2.5-gemma-3-12b-it-Preview-i1-GGUF/resolve/main/EZO2.5-gemma-3-12b-it-Preview.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 3.6 | | +| [GGUF](https://huggingface.co/mradermacher/EZO2.5-gemma-3-12b-it-Preview-i1-GGUF/resolve/main/EZO2.5-gemma-3-12b-it-Preview.i1-IQ2_XS.gguf) | i1-IQ2_XS | 3.9 | | +| [GGUF](https://huggingface.co/mradermacher/EZO2.5-gemma-3-12b-it-Preview-i1-GGUF/resolve/main/EZO2.5-gemma-3-12b-it-Preview.i1-IQ2_S.gguf) | i1-IQ2_S | 4.1 | | +| [GGUF](https://huggingface.co/mradermacher/EZO2.5-gemma-3-12b-it-Preview-i1-GGUF/resolve/main/EZO2.5-gemma-3-12b-it-Preview.i1-IQ2_M.gguf) | i1-IQ2_M | 4.4 | | +| [GGUF](https://huggingface.co/mradermacher/EZO2.5-gemma-3-12b-it-Preview-i1-GGUF/resolve/main/EZO2.5-gemma-3-12b-it-Preview.i1-Q2_K_S.gguf) | i1-Q2_K_S | 4.5 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/EZO2.5-gemma-3-12b-it-Preview-i1-GGUF/resolve/main/EZO2.5-gemma-3-12b-it-Preview.i1-Q2_K.gguf) | i1-Q2_K | 4.9 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/EZO2.5-gemma-3-12b-it-Preview-i1-GGUF/resolve/main/EZO2.5-gemma-3-12b-it-Preview.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 4.9 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/EZO2.5-gemma-3-12b-it-Preview-i1-GGUF/resolve/main/EZO2.5-gemma-3-12b-it-Preview.i1-IQ3_XS.gguf) | i1-IQ3_XS | 5.3 | | +| 
[GGUF](https://huggingface.co/mradermacher/EZO2.5-gemma-3-12b-it-Preview-i1-GGUF/resolve/main/EZO2.5-gemma-3-12b-it-Preview.i1-IQ3_S.gguf) | i1-IQ3_S | 5.6 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/EZO2.5-gemma-3-12b-it-Preview-i1-GGUF/resolve/main/EZO2.5-gemma-3-12b-it-Preview.i1-Q3_K_S.gguf) | i1-Q3_K_S | 5.6 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/EZO2.5-gemma-3-12b-it-Preview-i1-GGUF/resolve/main/EZO2.5-gemma-3-12b-it-Preview.i1-IQ3_M.gguf) | i1-IQ3_M | 5.8 | | +| [GGUF](https://huggingface.co/mradermacher/EZO2.5-gemma-3-12b-it-Preview-i1-GGUF/resolve/main/EZO2.5-gemma-3-12b-it-Preview.i1-Q3_K_M.gguf) | i1-Q3_K_M | 6.1 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/EZO2.5-gemma-3-12b-it-Preview-i1-GGUF/resolve/main/EZO2.5-gemma-3-12b-it-Preview.i1-Q3_K_L.gguf) | i1-Q3_K_L | 6.6 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/EZO2.5-gemma-3-12b-it-Preview-i1-GGUF/resolve/main/EZO2.5-gemma-3-12b-it-Preview.i1-IQ4_XS.gguf) | i1-IQ4_XS | 6.7 | | +| [GGUF](https://huggingface.co/mradermacher/EZO2.5-gemma-3-12b-it-Preview-i1-GGUF/resolve/main/EZO2.5-gemma-3-12b-it-Preview.i1-IQ4_NL.gguf) | i1-IQ4_NL | 7.0 | prefer IQ4_XS | +| [GGUF](https://huggingface.co/mradermacher/EZO2.5-gemma-3-12b-it-Preview-i1-GGUF/resolve/main/EZO2.5-gemma-3-12b-it-Preview.i1-Q4_0.gguf) | i1-Q4_0 | 7.0 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/EZO2.5-gemma-3-12b-it-Preview-i1-GGUF/resolve/main/EZO2.5-gemma-3-12b-it-Preview.i1-Q4_K_S.gguf) | i1-Q4_K_S | 7.0 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/EZO2.5-gemma-3-12b-it-Preview-i1-GGUF/resolve/main/EZO2.5-gemma-3-12b-it-Preview.i1-Q4_K_M.gguf) | i1-Q4_K_M | 7.4 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/EZO2.5-gemma-3-12b-it-Preview-i1-GGUF/resolve/main/EZO2.5-gemma-3-12b-it-Preview.i1-Q4_1.gguf) | i1-Q4_1 | 7.7 | | +| 
[GGUF](https://huggingface.co/mradermacher/EZO2.5-gemma-3-12b-it-Preview-i1-GGUF/resolve/main/EZO2.5-gemma-3-12b-it-Preview.i1-Q5_K_S.gguf) | i1-Q5_K_S | 8.3 | | +| [GGUF](https://huggingface.co/mradermacher/EZO2.5-gemma-3-12b-it-Preview-i1-GGUF/resolve/main/EZO2.5-gemma-3-12b-it-Preview.i1-Q5_K_M.gguf) | i1-Q5_K_M | 8.5 | | +| [GGUF](https://huggingface.co/mradermacher/EZO2.5-gemma-3-12b-it-Preview-i1-GGUF/resolve/main/EZO2.5-gemma-3-12b-it-Preview.i1-Q6_K.gguf) | i1-Q6_K | 9.8 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for answers to +questions you might have, or to request that another model be quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..93e011f --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29d629ef2591f20022bf3f59c7ff01b716996550020b4c13d15258d8b933d16a +size 7433101