commit 071606067f9baa3b65efe952f4c58c7df3c8050d Author: ModelHub XC Date: Sat May 9 02:00:59 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/EraX-VL-2B-V1.5-i1-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..f5b697f --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +EraX-VL-2B-V1.5.i1-IQ1_M.gguf filter=lfs diff=lfs 
merge=lfs -text +EraX-VL-2B-V1.5.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +EraX-VL-2B-V1.5.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +EraX-VL-2B-V1.5.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +EraX-VL-2B-V1.5.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +EraX-VL-2B-V1.5.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +EraX-VL-2B-V1.5.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +EraX-VL-2B-V1.5.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text +EraX-VL-2B-V1.5.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +EraX-VL-2B-V1.5.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +EraX-VL-2B-V1.5.i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +EraX-VL-2B-V1.5.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +EraX-VL-2B-V1.5.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +EraX-VL-2B-V1.5.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +EraX-VL-2B-V1.5.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +EraX-VL-2B-V1.5.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +EraX-VL-2B-V1.5.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +EraX-VL-2B-V1.5.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +EraX-VL-2B-V1.5.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +EraX-VL-2B-V1.5.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +EraX-VL-2B-V1.5.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +EraX-VL-2B-V1.5.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +EraX-VL-2B-V1.5.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +EraX-VL-2B-V1.5.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/EraX-VL-2B-V1.5.i1-IQ1_M.gguf b/EraX-VL-2B-V1.5.i1-IQ1_M.gguf new file mode 100644 index 0000000..9fc7c6b --- /dev/null +++ b/EraX-VL-2B-V1.5.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93568eb20124eaa8dc7b7ce98c1e0d7183af1f75968b952de9a90ce5acdd9349 +size 464460544 diff --git a/EraX-VL-2B-V1.5.i1-IQ1_S.gguf b/EraX-VL-2B-V1.5.i1-IQ1_S.gguf new file mode 100644 index 
0000000..5e98e53 --- /dev/null +++ b/EraX-VL-2B-V1.5.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ad0ac3988ee3dc455ece457846eaae5e498c16e1abf8f1ac282a33de42e06f1 +size 436526848 diff --git a/EraX-VL-2B-V1.5.i1-IQ2_M.gguf b/EraX-VL-2B-V1.5.i1-IQ2_M.gguf new file mode 100644 index 0000000..3c43aef --- /dev/null +++ b/EraX-VL-2B-V1.5.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8635e4a32e3ddc974a4adbfb454f913de7e19a5b2a4be9b9dc97076853dc760 +size 601053952 diff --git a/EraX-VL-2B-V1.5.i1-IQ2_S.gguf b/EraX-VL-2B-V1.5.i1-IQ2_S.gguf new file mode 100644 index 0000000..b974725 --- /dev/null +++ b/EraX-VL-2B-V1.5.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf6e94778ef99eac751b22366c5a67877aa39826abf6c80b4ef421f6f80350dc +size 563809024 diff --git a/EraX-VL-2B-V1.5.i1-IQ2_XS.gguf b/EraX-VL-2B-V1.5.i1-IQ2_XS.gguf new file mode 100644 index 0000000..5330218 --- /dev/null +++ b/EraX-VL-2B-V1.5.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64a25c67b46e3da5201df3d7fd880f88a83c050a393c988e3ab0417725608e5b +size 550326016 diff --git a/EraX-VL-2B-V1.5.i1-IQ2_XXS.gguf b/EraX-VL-2B-V1.5.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..7e842d0 --- /dev/null +++ b/EraX-VL-2B-V1.5.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0d8cf2f2d3c4920ece99e883d01c7e706bab79720d3203d490c97e499bea82b +size 511016704 diff --git a/EraX-VL-2B-V1.5.i1-IQ3_M.gguf b/EraX-VL-2B-V1.5.i1-IQ3_M.gguf new file mode 100644 index 0000000..a729d77 --- /dev/null +++ b/EraX-VL-2B-V1.5.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68e9325ca7c9b88b018b06a56c9d8b74d92e05bf66d3793f745415c7af048378 +size 776663296 diff --git a/EraX-VL-2B-V1.5.i1-IQ3_S.gguf b/EraX-VL-2B-V1.5.i1-IQ3_S.gguf new file mode 100644 index 0000000..c04ac0f --- /dev/null +++ 
b/EraX-VL-2B-V1.5.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2321f3281867ffa942c1084d85977febc6f10508f169efeac45d7ab66e310514 +size 762406144 diff --git a/EraX-VL-2B-V1.5.i1-IQ3_XS.gguf b/EraX-VL-2B-V1.5.i1-IQ3_XS.gguf new file mode 100644 index 0000000..a3948d2 --- /dev/null +++ b/EraX-VL-2B-V1.5.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ef3ccc093524f36ae2ad86726459aaf97790396501e604b4db37a5ca7fcfd7d +size 731698432 diff --git a/EraX-VL-2B-V1.5.i1-IQ3_XXS.gguf b/EraX-VL-2B-V1.5.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..39f6070 --- /dev/null +++ b/EraX-VL-2B-V1.5.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89a9796a5e4c12f45fc9deb024a17022e2f2fc633ec9f5f4241c1bc760c7079d +size 668791552 diff --git a/EraX-VL-2B-V1.5.i1-IQ4_NL.gguf b/EraX-VL-2B-V1.5.i1-IQ4_NL.gguf new file mode 100644 index 0000000..8cca1c9 --- /dev/null +++ b/EraX-VL-2B-V1.5.i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c34aefeafa6b3cdc76c724a924ceec6077877be836270a4b2be2582520f55037 +size 936330496 diff --git a/EraX-VL-2B-V1.5.i1-IQ4_XS.gguf b/EraX-VL-2B-V1.5.i1-IQ4_XS.gguf new file mode 100644 index 0000000..b46d561 --- /dev/null +++ b/EraX-VL-2B-V1.5.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff906ebdf4018c22ac17e80dd44a391a89e69f80166203f763c00d6ca382e04a +size 895730944 diff --git a/EraX-VL-2B-V1.5.i1-Q2_K.gguf b/EraX-VL-2B-V1.5.i1-Q2_K.gguf new file mode 100644 index 0000000..668328b --- /dev/null +++ b/EraX-VL-2B-V1.5.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:199844833ec076103da0b298ae16a19ac878565cfa2e320885bf8f86e64bebf2 +size 676304128 diff --git a/EraX-VL-2B-V1.5.i1-Q2_K_S.gguf b/EraX-VL-2B-V1.5.i1-Q2_K_S.gguf new file mode 100644 index 0000000..a15173c --- /dev/null +++ b/EraX-VL-2B-V1.5.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ 
+version https://git-lfs.github.com/spec/v1 +oid sha256:8ee7c42634c7757984eadfc1d08d9b838377c33a5ca338466e2f16a7f5fe0bca +size 640134400 diff --git a/EraX-VL-2B-V1.5.i1-Q3_K_L.gguf b/EraX-VL-2B-V1.5.i1-Q3_K_L.gguf new file mode 100644 index 0000000..4b11e2a --- /dev/null +++ b/EraX-VL-2B-V1.5.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:908b806a72d08e010d9934da8d6180ce772f7fc32181793d86764b307366ac60 +size 880162048 diff --git a/EraX-VL-2B-V1.5.i1-Q3_K_M.gguf b/EraX-VL-2B-V1.5.i1-Q3_K_M.gguf new file mode 100644 index 0000000..b7b9b49 --- /dev/null +++ b/EraX-VL-2B-V1.5.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aee09130e7f0d51b42086494ba50a3ad53f5f464c03e2ca0ef24642d40239b85 +size 824177920 diff --git a/EraX-VL-2B-V1.5.i1-Q3_K_S.gguf b/EraX-VL-2B-V1.5.i1-Q3_K_S.gguf new file mode 100644 index 0000000..1541170 --- /dev/null +++ b/EraX-VL-2B-V1.5.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ae51d688ccbfa2062aa38732452a65b42c06edb794fed5bef96ee239b0bff42 +size 760943872 diff --git a/EraX-VL-2B-V1.5.i1-Q4_0.gguf b/EraX-VL-2B-V1.5.i1-Q4_0.gguf new file mode 100644 index 0000000..a4f37a8 --- /dev/null +++ b/EraX-VL-2B-V1.5.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:409ee6e1cb4e9e32bc6f5cfa4940dff37ead613169d4d8d1c73cdff97929dc7c +size 937534720 diff --git a/EraX-VL-2B-V1.5.i1-Q4_1.gguf b/EraX-VL-2B-V1.5.i1-Q4_1.gguf new file mode 100644 index 0000000..658cbd2 --- /dev/null +++ b/EraX-VL-2B-V1.5.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6246c6336796eff20ce6853ea7d9d0a9b06b559a86b01533afd69ee6f9a41f77 +size 1016841472 diff --git a/EraX-VL-2B-V1.5.i1-Q4_K_M.gguf b/EraX-VL-2B-V1.5.i1-Q4_K_M.gguf new file mode 100644 index 0000000..ec0d6b2 --- /dev/null +++ b/EraX-VL-2B-V1.5.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:529d05a75024e43fd7f13783b200329c97c3353dbcb0be4e15a78a2c5f3eba68 +size 986047744 diff --git a/EraX-VL-2B-V1.5.i1-Q4_K_S.gguf b/EraX-VL-2B-V1.5.i1-Q4_K_S.gguf new file mode 100644 index 0000000..828e650 --- /dev/null +++ b/EraX-VL-2B-V1.5.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:035bc4f72a94c011e8c77a26de2aa4c4683d46cbcf367ca8b939e2e8cb74bc07 +size 940311808 diff --git a/EraX-VL-2B-V1.5.i1-Q5_K_M.gguf b/EraX-VL-2B-V1.5.i1-Q5_K_M.gguf new file mode 100644 index 0000000..8bb2a3b --- /dev/null +++ b/EraX-VL-2B-V1.5.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91251b8eb1e368a673cfdae776e4b18d2b829f18245877345bec3daca0ee8e86 +size 1125049600 diff --git a/EraX-VL-2B-V1.5.i1-Q5_K_S.gguf b/EraX-VL-2B-V1.5.i1-Q5_K_S.gguf new file mode 100644 index 0000000..b5d7eb3 --- /dev/null +++ b/EraX-VL-2B-V1.5.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee7d2cd0557dcfa8dd5959a605a7f747453442d1a8e315503f129409c64c6264 +size 1098728704 diff --git a/EraX-VL-2B-V1.5.i1-Q6_K.gguf b/EraX-VL-2B-V1.5.i1-Q6_K.gguf new file mode 100644 index 0000000..ab83805 --- /dev/null +++ b/EraX-VL-2B-V1.5.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ded8e01c3283f4e03fb57246f42a2ed21f3c6d2ecf7897dcb42851ccdf93031 +size 1272739072 diff --git a/README.md b/README.md new file mode 100644 index 0000000..2dc5aee --- /dev/null +++ b/README.md @@ -0,0 +1,95 @@ +--- +base_model: erax-ai/EraX-VL-2B-V1.5 +language: +- vi +- en +- zh +library_name: transformers +license: apache-2.0 +mradermacher: + readme_rev: 1 +quantized_by: mradermacher +tags: +- erax +- multimodal +- erax-vl-2B +- insurance +- ocr +- vietnamese +- bcg +- image-to-text +- image-text-to-text +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/erax-ai/EraX-VL-2B-V1.5 + + + +***For a convenient overview and download list, visit our [model page for 
this model](https://hf.tst.eu/model#EraX-VL-2B-V1.5-i1-GGUF).*** + +Static quants are available at https://huggingface.co/mradermacher/EraX-VL-2B-V1.5-GGUF + +**This is a vision model - mmproj files (if any) will be in the [static repository](https://huggingface.co/mradermacher/EraX-VL-2B-V1.5-GGUF).** +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable to similarly sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/EraX-VL-2B-V1.5-i1-GGUF/resolve/main/EraX-VL-2B-V1.5.i1-IQ1_S.gguf) | i1-IQ1_S | 0.5 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/EraX-VL-2B-V1.5-i1-GGUF/resolve/main/EraX-VL-2B-V1.5.i1-IQ1_M.gguf) | i1-IQ1_M | 0.6 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/EraX-VL-2B-V1.5-i1-GGUF/resolve/main/EraX-VL-2B-V1.5.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 0.6 | | +| [GGUF](https://huggingface.co/mradermacher/EraX-VL-2B-V1.5-i1-GGUF/resolve/main/EraX-VL-2B-V1.5.i1-IQ2_XS.gguf) | i1-IQ2_XS | 0.7 | | +| [GGUF](https://huggingface.co/mradermacher/EraX-VL-2B-V1.5-i1-GGUF/resolve/main/EraX-VL-2B-V1.5.i1-IQ2_S.gguf) | i1-IQ2_S | 0.7 | | +| [GGUF](https://huggingface.co/mradermacher/EraX-VL-2B-V1.5-i1-GGUF/resolve/main/EraX-VL-2B-V1.5.i1-IQ2_M.gguf) | i1-IQ2_M | 0.7 | | +| [GGUF](https://huggingface.co/mradermacher/EraX-VL-2B-V1.5-i1-GGUF/resolve/main/EraX-VL-2B-V1.5.i1-Q2_K_S.gguf) | i1-Q2_K_S | 0.7 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/EraX-VL-2B-V1.5-i1-GGUF/resolve/main/EraX-VL-2B-V1.5.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 0.8 | lower quality | +| 
[GGUF](https://huggingface.co/mradermacher/EraX-VL-2B-V1.5-i1-GGUF/resolve/main/EraX-VL-2B-V1.5.i1-Q2_K.gguf) | i1-Q2_K | 0.8 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/EraX-VL-2B-V1.5-i1-GGUF/resolve/main/EraX-VL-2B-V1.5.i1-IQ3_XS.gguf) | i1-IQ3_XS | 0.8 | | +| [GGUF](https://huggingface.co/mradermacher/EraX-VL-2B-V1.5-i1-GGUF/resolve/main/EraX-VL-2B-V1.5.i1-Q3_K_S.gguf) | i1-Q3_K_S | 0.9 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/EraX-VL-2B-V1.5-i1-GGUF/resolve/main/EraX-VL-2B-V1.5.i1-IQ3_S.gguf) | i1-IQ3_S | 0.9 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/EraX-VL-2B-V1.5-i1-GGUF/resolve/main/EraX-VL-2B-V1.5.i1-IQ3_M.gguf) | i1-IQ3_M | 0.9 | | +| [GGUF](https://huggingface.co/mradermacher/EraX-VL-2B-V1.5-i1-GGUF/resolve/main/EraX-VL-2B-V1.5.i1-Q3_K_M.gguf) | i1-Q3_K_M | 0.9 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/EraX-VL-2B-V1.5-i1-GGUF/resolve/main/EraX-VL-2B-V1.5.i1-Q3_K_L.gguf) | i1-Q3_K_L | 1.0 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/EraX-VL-2B-V1.5-i1-GGUF/resolve/main/EraX-VL-2B-V1.5.i1-IQ4_XS.gguf) | i1-IQ4_XS | 1.0 | | +| [GGUF](https://huggingface.co/mradermacher/EraX-VL-2B-V1.5-i1-GGUF/resolve/main/EraX-VL-2B-V1.5.i1-IQ4_NL.gguf) | i1-IQ4_NL | 1.0 | prefer IQ4_XS | +| [GGUF](https://huggingface.co/mradermacher/EraX-VL-2B-V1.5-i1-GGUF/resolve/main/EraX-VL-2B-V1.5.i1-Q4_0.gguf) | i1-Q4_0 | 1.0 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/EraX-VL-2B-V1.5-i1-GGUF/resolve/main/EraX-VL-2B-V1.5.i1-Q4_K_S.gguf) | i1-Q4_K_S | 1.0 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/EraX-VL-2B-V1.5-i1-GGUF/resolve/main/EraX-VL-2B-V1.5.i1-Q4_K_M.gguf) | i1-Q4_K_M | 1.1 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/EraX-VL-2B-V1.5-i1-GGUF/resolve/main/EraX-VL-2B-V1.5.i1-Q4_1.gguf) | i1-Q4_1 | 1.1 | | +| 
[GGUF](https://huggingface.co/mradermacher/EraX-VL-2B-V1.5-i1-GGUF/resolve/main/EraX-VL-2B-V1.5.i1-Q5_K_S.gguf) | i1-Q5_K_S | 1.2 | | +| [GGUF](https://huggingface.co/mradermacher/EraX-VL-2B-V1.5-i1-GGUF/resolve/main/EraX-VL-2B-V1.5.i1-Q5_K_M.gguf) | i1-Q5_K_M | 1.2 | | +| [GGUF](https://huggingface.co/mradermacher/EraX-VL-2B-V1.5-i1-GGUF/resolve/main/EraX-VL-2B-V1.5.i1-Q6_K.gguf) | i1-Q6_K | 1.4 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for answers to +questions you might have, or to request that another model be quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..9eda7c6 --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d01248c1e7a59b2f488102f6096206798a1c0588fc184f85f621e5bfd256c287 +size 2042201