commit 0dff27dcd61719b7f0a54f8db064a8d3198f242d Author: ModelHub XC Date: Thu Apr 30 18:25:20 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/HelpingAI-Lite-2x1B-i1-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..47ff168 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +HelpingAI-Lite-2x1B.i1-IQ1_M.gguf filter=lfs 
diff=lfs merge=lfs -text +HelpingAI-Lite-2x1B.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI-Lite-2x1B.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI-Lite-2x1B.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI-Lite-2x1B.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI-Lite-2x1B.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI-Lite-2x1B.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI-Lite-2x1B.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI-Lite-2x1B.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI-Lite-2x1B.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI-Lite-2x1B.i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI-Lite-2x1B.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI-Lite-2x1B.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI-Lite-2x1B.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI-Lite-2x1B.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI-Lite-2x1B.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI-Lite-2x1B.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI-Lite-2x1B.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI-Lite-2x1B.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI-Lite-2x1B.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI-Lite-2x1B.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI-Lite-2x1B.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI-Lite-2x1B.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI-Lite-2x1B.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/HelpingAI-Lite-2x1B.i1-IQ1_M.gguf b/HelpingAI-Lite-2x1B.i1-IQ1_M.gguf new file mode 100644 index 0000000..02ecab9 --- /dev/null +++ b/HelpingAI-Lite-2x1B.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc78f828491645b32d9b45bf20ed4b88fac12f74c9d83e31babf2976d5d34d92 +size 
459115360 diff --git a/HelpingAI-Lite-2x1B.i1-IQ1_S.gguf b/HelpingAI-Lite-2x1B.i1-IQ1_S.gguf new file mode 100644 index 0000000..86328ff --- /dev/null +++ b/HelpingAI-Lite-2x1B.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c08f3fb7ca47a39fcb38af9bd6a57f488c704e677c78c9d0e27cc9616f833a6 +size 422079328 diff --git a/HelpingAI-Lite-2x1B.i1-IQ2_M.gguf b/HelpingAI-Lite-2x1B.i1-IQ2_M.gguf new file mode 100644 index 0000000..c0ffae0 --- /dev/null +++ b/HelpingAI-Lite-2x1B.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc92da9c468f59f08dce17d6c997935456b11b763296b99d54ad48f5f68a7bf4 +size 646806368 diff --git a/HelpingAI-Lite-2x1B.i1-IQ2_S.gguf b/HelpingAI-Lite-2x1B.i1-IQ2_S.gguf new file mode 100644 index 0000000..1e08009 --- /dev/null +++ b/HelpingAI-Lite-2x1B.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:720dc422cdf1fda9013b5d31e281bdc5e6c410797af27c3faea176286e905975 +size 597424992 diff --git a/HelpingAI-Lite-2x1B.i1-IQ2_XS.gguf b/HelpingAI-Lite-2x1B.i1-IQ2_XS.gguf new file mode 100644 index 0000000..d780dfe --- /dev/null +++ b/HelpingAI-Lite-2x1B.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:848bf294d92a98740aa555c4eeca57122e4ae723157e1c496d4508af507cbe26 +size 573107040 diff --git a/HelpingAI-Lite-2x1B.i1-IQ2_XXS.gguf b/HelpingAI-Lite-2x1B.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..7eaabb2 --- /dev/null +++ b/HelpingAI-Lite-2x1B.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8473778a712204109aef000558042dfda4f1b1da8b94b7c4342d2efb08601594 +size 520842080 diff --git a/HelpingAI-Lite-2x1B.i1-IQ3_M.gguf b/HelpingAI-Lite-2x1B.i1-IQ3_M.gguf new file mode 100644 index 0000000..8e4c035 --- /dev/null +++ b/HelpingAI-Lite-2x1B.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:06b28a9a9671709357a7897d227f06b0eb376b6c742ebb3bf39e141c1c9ca131 +size 846728032 diff --git a/HelpingAI-Lite-2x1B.i1-IQ3_S.gguf b/HelpingAI-Lite-2x1B.i1-IQ3_S.gguf new file mode 100644 index 0000000..d18c8c6 --- /dev/null +++ b/HelpingAI-Lite-2x1B.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dc73eeb216e632053ad1aeff65c12d006f73830ea0439013801e5b38d549d11 +size 828345184 diff --git a/HelpingAI-Lite-2x1B.i1-IQ3_XS.gguf b/HelpingAI-Lite-2x1B.i1-IQ3_XS.gguf new file mode 100644 index 0000000..622d383 --- /dev/null +++ b/HelpingAI-Lite-2x1B.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f18360beb2e1e00f877696e5c80699739f1bb1168241423d21f02753d100e008 +size 786713440 diff --git a/HelpingAI-Lite-2x1B.i1-IQ3_XXS.gguf b/HelpingAI-Lite-2x1B.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..8c22e62 --- /dev/null +++ b/HelpingAI-Lite-2x1B.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a058df9ee22b25f423fb65b6e0fc1f5edb05209cde8f99cb2fe78816324a9f3 +size 736918368 diff --git a/HelpingAI-Lite-2x1B.i1-IQ4_NL.gguf b/HelpingAI-Lite-2x1B.i1-IQ4_NL.gguf new file mode 100644 index 0000000..f6eda03 --- /dev/null +++ b/HelpingAI-Lite-2x1B.i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9af8a20aead9082e76dbfb522ce48497feb272ba379fab44e0dd5201d6aff65a +size 1066744672 diff --git a/HelpingAI-Lite-2x1B.i1-IQ4_XS.gguf b/HelpingAI-Lite-2x1B.i1-IQ4_XS.gguf new file mode 100644 index 0000000..cd301dd --- /dev/null +++ b/HelpingAI-Lite-2x1B.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a06c1972381a0766ef563b0299524b3ae618e59eccad872669666f19d65dd3b0 +size 1010989920 diff --git a/HelpingAI-Lite-2x1B.i1-Q2_K.gguf b/HelpingAI-Lite-2x1B.i1-Q2_K.gguf new file mode 100644 index 0000000..5909c91 --- /dev/null +++ b/HelpingAI-Lite-2x1B.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:81a7b4d39d51a88d490267100b1b7521a3c3bbee68afe7d64c5e2317dfef44dd +size 708057952 diff --git a/HelpingAI-Lite-2x1B.i1-Q2_K_S.gguf b/HelpingAI-Lite-2x1B.i1-Q2_K_S.gguf new file mode 100644 index 0000000..2f9cb3e --- /dev/null +++ b/HelpingAI-Lite-2x1B.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8e9611300caa0b1e36abb9ad0bac8893e6685619ab37d5a9d34c6a5a4afe243 +size 657955680 diff --git a/HelpingAI-Lite-2x1B.i1-Q3_K_L.gguf b/HelpingAI-Lite-2x1B.i1-Q3_K_L.gguf new file mode 100644 index 0000000..606df81 --- /dev/null +++ b/HelpingAI-Lite-2x1B.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74bd1d090cfee33e35ea9dd878b7ab6008871ebf4f9f2a3d52e3471d030f11ef +size 984419168 diff --git a/HelpingAI-Lite-2x1B.i1-Q3_K_M.gguf b/HelpingAI-Lite-2x1B.i1-Q3_K_M.gguf new file mode 100644 index 0000000..70c91a6 --- /dev/null +++ b/HelpingAI-Lite-2x1B.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6be5eafcef76ef7d59ac137bffc65d3939125567d137e6c60e265c6441a3ede +size 911018848 diff --git a/HelpingAI-Lite-2x1B.i1-Q3_K_S.gguf b/HelpingAI-Lite-2x1B.i1-Q3_K_S.gguf new file mode 100644 index 0000000..2c67b52 --- /dev/null +++ b/HelpingAI-Lite-2x1B.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4aab9c0df92ce7d27195d472503f60fe8e8e1e1929b1b1dd9e71d0d0bfbe1241 +size 826813280 diff --git a/HelpingAI-Lite-2x1B.i1-Q4_0.gguf b/HelpingAI-Lite-2x1B.i1-Q4_0.gguf new file mode 100644 index 0000000..a0a5425 --- /dev/null +++ b/HelpingAI-Lite-2x1B.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78ddea15e2150e6ac23125e2c8c84351103628adb2058e2578751d4c27a4d6ba +size 1068186464 diff --git a/HelpingAI-Lite-2x1B.i1-Q4_1.gguf b/HelpingAI-Lite-2x1B.i1-Q4_1.gguf new file mode 100644 index 0000000..063556c --- /dev/null +++ b/HelpingAI-Lite-2x1B.i1-Q4_1.gguf @@ -0,0 +1,3 
@@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c5802c3be6f49de90d850c90869625e149cc7f825b2975ee439c8fdf8626efb +size 1177533280 diff --git a/HelpingAI-Lite-2x1B.i1-Q4_K_M.gguf b/HelpingAI-Lite-2x1B.i1-Q4_K_M.gguf new file mode 100644 index 0000000..35d3b1b --- /dev/null +++ b/HelpingAI-Lite-2x1B.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53545808bcd9a54c360dc3304162f6b9d56355c97be837b05a647186d5b783eb +size 1126128480 diff --git a/HelpingAI-Lite-2x1B.i1-Q4_K_S.gguf b/HelpingAI-Lite-2x1B.i1-Q4_K_S.gguf new file mode 100644 index 0000000..23b3f5d --- /dev/null +++ b/HelpingAI-Lite-2x1B.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba35e94ebb857e2cd450890318cb73b229b1d220dac8f70be45229ee3c1328da +size 1071332192 diff --git a/HelpingAI-Lite-2x1B.i1-Q5_K_M.gguf b/HelpingAI-Lite-2x1B.i1-Q5_K_M.gguf new file mode 100644 index 0000000..16f5106 --- /dev/null +++ b/HelpingAI-Lite-2x1B.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da44ad30cadedfcdf9d0a12033d2e843e809b59ca3fcf4199db630d07af497ba +size 1321098080 diff --git a/HelpingAI-Lite-2x1B.i1-Q5_K_S.gguf b/HelpingAI-Lite-2x1B.i1-Q5_K_S.gguf new file mode 100644 index 0000000..031c289 --- /dev/null +++ b/HelpingAI-Lite-2x1B.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39cd6a0d2dd915035a5fa3efa72cd7b35e3b397d124a6f86f4a5078c17850a9f +size 1289763680 diff --git a/HelpingAI-Lite-2x1B.i1-Q6_K.gguf b/HelpingAI-Lite-2x1B.i1-Q6_K.gguf new file mode 100644 index 0000000..54ee3b5 --- /dev/null +++ b/HelpingAI-Lite-2x1B.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7d858a5910fd1a5198ba9858b89235ff032dbca8682ea7ddd07affdbc169f5f +size 1528253280 diff --git a/README.md b/README.md new file mode 100644 index 0000000..6afedea --- /dev/null +++ b/README.md @@ -0,0 +1,85 @@ +--- +base_model: OEvortex/HelpingAI-Lite-2x1B 
+language: +- en +library_name: transformers +license: other +license_link: https://huggingface.co/OEvortex/vortex-3b/raw/main/LICENSE.md +license_name: hsul +quantized_by: mradermacher +tags: +- HelpingAI +- coder +- lite +- Fine-tuned +- moe +- nlp +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/OEvortex/HelpingAI-Lite-2x1B + + +static quants are available at https://huggingface.co/mradermacher/HelpingAI-Lite-2x1B-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable to similarly sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/HelpingAI-Lite-2x1B-i1-GGUF/resolve/main/HelpingAI-Lite-2x1B.i1-IQ1_S.gguf) | i1-IQ1_S | 0.5 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI-Lite-2x1B-i1-GGUF/resolve/main/HelpingAI-Lite-2x1B.i1-IQ1_M.gguf) | i1-IQ1_M | 0.6 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI-Lite-2x1B-i1-GGUF/resolve/main/HelpingAI-Lite-2x1B.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 0.6 | | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI-Lite-2x1B-i1-GGUF/resolve/main/HelpingAI-Lite-2x1B.i1-IQ2_XS.gguf) | i1-IQ2_XS | 0.7 | | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI-Lite-2x1B-i1-GGUF/resolve/main/HelpingAI-Lite-2x1B.i1-IQ2_S.gguf) | i1-IQ2_S | 0.7 | | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI-Lite-2x1B-i1-GGUF/resolve/main/HelpingAI-Lite-2x1B.i1-IQ2_M.gguf) | i1-IQ2_M | 0.7 | | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI-Lite-2x1B-i1-GGUF/resolve/main/HelpingAI-Lite-2x1B.i1-Q2_K_S.gguf) | i1-Q2_K_S | 0.8 | very low quality | +|
[GGUF](https://huggingface.co/mradermacher/HelpingAI-Lite-2x1B-i1-GGUF/resolve/main/HelpingAI-Lite-2x1B.i1-Q2_K.gguf) | i1-Q2_K | 0.8 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI-Lite-2x1B-i1-GGUF/resolve/main/HelpingAI-Lite-2x1B.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 0.8 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI-Lite-2x1B-i1-GGUF/resolve/main/HelpingAI-Lite-2x1B.i1-IQ3_XS.gguf) | i1-IQ3_XS | 0.9 | | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI-Lite-2x1B-i1-GGUF/resolve/main/HelpingAI-Lite-2x1B.i1-Q3_K_S.gguf) | i1-Q3_K_S | 0.9 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI-Lite-2x1B-i1-GGUF/resolve/main/HelpingAI-Lite-2x1B.i1-IQ3_S.gguf) | i1-IQ3_S | 0.9 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI-Lite-2x1B-i1-GGUF/resolve/main/HelpingAI-Lite-2x1B.i1-IQ3_M.gguf) | i1-IQ3_M | 0.9 | | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI-Lite-2x1B-i1-GGUF/resolve/main/HelpingAI-Lite-2x1B.i1-Q3_K_M.gguf) | i1-Q3_K_M | 1.0 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI-Lite-2x1B-i1-GGUF/resolve/main/HelpingAI-Lite-2x1B.i1-Q3_K_L.gguf) | i1-Q3_K_L | 1.1 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI-Lite-2x1B-i1-GGUF/resolve/main/HelpingAI-Lite-2x1B.i1-IQ4_XS.gguf) | i1-IQ4_XS | 1.1 | | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI-Lite-2x1B-i1-GGUF/resolve/main/HelpingAI-Lite-2x1B.i1-IQ4_NL.gguf) | i1-IQ4_NL | 1.2 | prefer IQ4_XS | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI-Lite-2x1B-i1-GGUF/resolve/main/HelpingAI-Lite-2x1B.i1-Q4_0.gguf) | i1-Q4_0 | 1.2 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI-Lite-2x1B-i1-GGUF/resolve/main/HelpingAI-Lite-2x1B.i1-Q4_K_S.gguf) | i1-Q4_K_S | 1.2 | optimal size/speed/quality | +| 
[GGUF](https://huggingface.co/mradermacher/HelpingAI-Lite-2x1B-i1-GGUF/resolve/main/HelpingAI-Lite-2x1B.i1-Q4_K_M.gguf) | i1-Q4_K_M | 1.2 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI-Lite-2x1B-i1-GGUF/resolve/main/HelpingAI-Lite-2x1B.i1-Q4_1.gguf) | i1-Q4_1 | 1.3 | | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI-Lite-2x1B-i1-GGUF/resolve/main/HelpingAI-Lite-2x1B.i1-Q5_K_S.gguf) | i1-Q5_K_S | 1.4 | | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI-Lite-2x1B-i1-GGUF/resolve/main/HelpingAI-Lite-2x1B.i1-Q5_K_M.gguf) | i1-Q5_K_M | 1.4 | | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI-Lite-2x1B-i1-GGUF/resolve/main/HelpingAI-Lite-2x1B.i1-Q6_K.gguf) | i1-Q6_K | 1.6 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for answers to +questions you might have, or if you want another model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..25df532 --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e75e60a1c6181f7e10d7561eece7fa2e398ded41271913135f9a5d7c1b1a7c31 +size 2619495