commit f2481c007cb3ad287ce5d811e93671efe0d0e8bb Author: ModelHub XC Date: Tue May 12 07:11:30 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/HelpingAI2.5-2B-i1-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..b74e788 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,61 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +HelpingAI2.5-2B.i1-Q2_K.gguf filter=lfs diff=lfs 
merge=lfs -text +HelpingAI2.5-2B.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI2.5-2B.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI2.5-2B.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI2.5-2B.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI2.5-2B.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI2.5-2B.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI2.5-2B.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI2.5-2B.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI2.5-2B.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI2.5-2B.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI2.5-2B.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI2.5-2B.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI2.5-2B.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI2.5-2B.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI2.5-2B.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI2.5-2B.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI2.5-2B.i1-Q4_0_4_4.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI2.5-2B.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI2.5-2B.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI2.5-2B.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI2.5-2B.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI2.5-2B.i1-Q4_0_4_8.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI2.5-2B.i1-Q4_0_8_8.gguf filter=lfs diff=lfs merge=lfs -text +HelpingAI2.5-2B.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/HelpingAI2.5-2B.i1-IQ1_M.gguf b/HelpingAI2.5-2B.i1-IQ1_M.gguf new file mode 100644 index 0000000..5878b66 --- /dev/null +++ b/HelpingAI2.5-2B.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f7be1ca87a5f0d0492f7730b332b3d2807a392ad3876661b5abd99051e45bb1 +size 444159904 diff --git 
a/HelpingAI2.5-2B.i1-IQ1_S.gguf b/HelpingAI2.5-2B.i1-IQ1_S.gguf new file mode 100644 index 0000000..4d8b81f --- /dev/null +++ b/HelpingAI2.5-2B.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac05b0c1283e352fb12c57d3525a2b0c61a32ed3a795483796f5389f45b5fdbb +size 412309408 diff --git a/HelpingAI2.5-2B.i1-IQ2_M.gguf b/HelpingAI2.5-2B.i1-IQ2_M.gguf new file mode 100644 index 0000000..1e354ff --- /dev/null +++ b/HelpingAI2.5-2B.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e3d8a6c453828f38396f85692ddf40a6e464c46f9ef3402c28ebd4fd0a59001 +size 614815648 diff --git a/HelpingAI2.5-2B.i1-IQ2_S.gguf b/HelpingAI2.5-2B.i1-IQ2_S.gguf new file mode 100644 index 0000000..3c6b30d --- /dev/null +++ b/HelpingAI2.5-2B.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c88208b46f3df46031eae252bcad3b84f2a72cd3427eb42fff44a889bc556df +size 572348320 diff --git a/HelpingAI2.5-2B.i1-IQ2_XS.gguf b/HelpingAI2.5-2B.i1-IQ2_XS.gguf new file mode 100644 index 0000000..a94051b --- /dev/null +++ b/HelpingAI2.5-2B.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ac83940dd0ffcd1c482b1e30414f4772dd2ff1aa1e61dfb8b120748c85153f2 +size 542857120 diff --git a/HelpingAI2.5-2B.i1-IQ2_XXS.gguf b/HelpingAI2.5-2B.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..c1dd68b --- /dev/null +++ b/HelpingAI2.5-2B.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df1ed89c9cb8a51a9b12ee83ca4fcbba9fdec47c4d0e3b38a34b57622b32f8b5 +size 497244064 diff --git a/HelpingAI2.5-2B.i1-IQ3_M.gguf b/HelpingAI2.5-2B.i1-IQ3_M.gguf new file mode 100644 index 0000000..65368eb --- /dev/null +++ b/HelpingAI2.5-2B.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f50230b8ae1910457a73dc3c578adb36ec4491f3eb61face57d086b195c2c1a +size 810244000 diff --git a/HelpingAI2.5-2B.i1-IQ3_S.gguf 
b/HelpingAI2.5-2B.i1-IQ3_S.gguf new file mode 100644 index 0000000..6c9285d --- /dev/null +++ b/HelpingAI2.5-2B.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9977f980a23e8f4156dcde1320bde528797a008eb225dcf3bc487b0d951c252c +size 776820640 diff --git a/HelpingAI2.5-2B.i1-IQ3_XS.gguf b/HelpingAI2.5-2B.i1-IQ3_XS.gguf new file mode 100644 index 0000000..56552df --- /dev/null +++ b/HelpingAI2.5-2B.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c65737e910320f35a9c03f3880707669ae3fd407f40adfdb749adc8c6f9985e6 +size 739071904 diff --git a/HelpingAI2.5-2B.i1-IQ3_XXS.gguf b/HelpingAI2.5-2B.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..a177bba --- /dev/null +++ b/HelpingAI2.5-2B.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce3baeeec1b13cb3749512ed66d8b2482844b901dba444fa1883cda3725963a6 +size 680089504 diff --git a/HelpingAI2.5-2B.i1-IQ4_XS.gguf b/HelpingAI2.5-2B.i1-IQ4_XS.gguf new file mode 100644 index 0000000..c8b61b5 --- /dev/null +++ b/HelpingAI2.5-2B.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:228a94e6d3355029dceffb78e516f86d912b7556590453a91f497bbe17ddc949 +size 940398496 diff --git a/HelpingAI2.5-2B.i1-Q2_K.gguf b/HelpingAI2.5-2B.i1-Q2_K.gguf new file mode 100644 index 0000000..ac582c6 --- /dev/null +++ b/HelpingAI2.5-2B.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:328eddd5e13f80dd8fe289f1522c53a005cf15ef46d4570a367312b0cdaab722 +size 674584480 diff --git a/HelpingAI2.5-2B.i1-Q2_K_S.gguf b/HelpingAI2.5-2B.i1-Q2_K_S.gguf new file mode 100644 index 0000000..c20ec5c --- /dev/null +++ b/HelpingAI2.5-2B.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fbbafaddb643a1020a7e08f4c74a562e377b4338b7f9c42086451f0fae98c4c +size 625039264 diff --git a/HelpingAI2.5-2B.i1-Q3_K_L.gguf b/HelpingAI2.5-2B.i1-Q3_K_L.gguf new file mode 100644 
index 0000000..3114363 --- /dev/null +++ b/HelpingAI2.5-2B.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3a80299182013a5bd7741953e3141b9a10bb9e04254f781eb3b352916f223cb +size 932534176 diff --git a/HelpingAI2.5-2B.i1-Q3_K_M.gguf b/HelpingAI2.5-2B.i1-Q3_K_M.gguf new file mode 100644 index 0000000..da58872 --- /dev/null +++ b/HelpingAI2.5-2B.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e145714bf1112db93fab5160d812b6c266b3dbd351a2f47306fb46859905057d +size 860182432 diff --git a/HelpingAI2.5-2B.i1-Q3_K_S.gguf b/HelpingAI2.5-2B.i1-Q3_K_S.gguf new file mode 100644 index 0000000..142df20 --- /dev/null +++ b/HelpingAI2.5-2B.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40923b5e2503bd7676ed70c39e99ed2b09e7a716c5d7aab56b3f00f26c518dbf +size 776820640 diff --git a/HelpingAI2.5-2B.i1-Q4_0.gguf b/HelpingAI2.5-2B.i1-Q4_0.gguf new file mode 100644 index 0000000..b762668 --- /dev/null +++ b/HelpingAI2.5-2B.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f8db33b0e705a87d8d807c95e181421fc8870c83790767290ec268797a357e6 +size 993875872 diff --git a/HelpingAI2.5-2B.i1-Q4_0_4_4.gguf b/HelpingAI2.5-2B.i1-Q4_0_4_4.gguf new file mode 100644 index 0000000..8152289 --- /dev/null +++ b/HelpingAI2.5-2B.i1-Q4_0_4_4.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:465b8f982825d5ac627256357ed722a9bb14ab1ed49cab8be22595271cb7f952 +size 990730144 diff --git a/HelpingAI2.5-2B.i1-Q4_0_4_8.gguf b/HelpingAI2.5-2B.i1-Q4_0_4_8.gguf new file mode 100644 index 0000000..96d5df5 --- /dev/null +++ b/HelpingAI2.5-2B.i1-Q4_0_4_8.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4ef5572826a705004937cb066842ea3ec5c93da5f5ebc7bc327a3bf2e04744d +size 990730144 diff --git a/HelpingAI2.5-2B.i1-Q4_0_8_8.gguf b/HelpingAI2.5-2B.i1-Q4_0_8_8.gguf new file mode 100644 index 0000000..6506cb7 --- /dev/null 
+++ b/HelpingAI2.5-2B.i1-Q4_0_8_8.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3085a6a1cc8537cd480a9154205841c324c4d6bb423240fb66de06238f180d7a +size 990730144 diff --git a/HelpingAI2.5-2B.i1-Q4_K_M.gguf b/HelpingAI2.5-2B.i1-Q4_K_M.gguf new file mode 100644 index 0000000..5f8ef9b --- /dev/null +++ b/HelpingAI2.5-2B.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64701330340ff1cac67193f538c85f64438528de8457cb6b19559b3c795f5de9 +size 1055610784 diff --git a/HelpingAI2.5-2B.i1-Q4_K_S.gguf b/HelpingAI2.5-2B.i1-Q4_K_S.gguf new file mode 100644 index 0000000..6b29356 --- /dev/null +++ b/HelpingAI2.5-2B.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a627dda809122922cddda145acf5993d649fb51d07627f27644aa492e993cdc0 +size 999118752 diff --git a/HelpingAI2.5-2B.i1-Q5_K_M.gguf b/HelpingAI2.5-2B.i1-Q5_K_M.gguf new file mode 100644 index 0000000..f3db9a7 --- /dev/null +++ b/HelpingAI2.5-2B.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d038b29391f01642d377d34ac67f70c0a8f2a3c98b7f91714e5da8c35b096a85 +size 1225480096 diff --git a/HelpingAI2.5-2B.i1-Q5_K_S.gguf b/HelpingAI2.5-2B.i1-Q5_K_S.gguf new file mode 100644 index 0000000..306fe47 --- /dev/null +++ b/HelpingAI2.5-2B.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8629f49e2a5c82432e29791fe0bbffdba537549a080e8856db153daf987622f0 +size 1192056736 diff --git a/HelpingAI2.5-2B.i1-Q6_K.gguf b/HelpingAI2.5-2B.i1-Q6_K.gguf new file mode 100644 index 0000000..070706c --- /dev/null +++ b/HelpingAI2.5-2B.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d817ba76935113f8efe12613fa2d2f53d35605be3d3cdcf0d281224b0346edcc +size 1405966240 diff --git a/README.md b/README.md new file mode 100644 index 0000000..1323696 --- /dev/null +++ b/README.md @@ -0,0 +1,85 @@ +--- +base_model: HelpingAI/HelpingAI2.5-2B +language: +- 
en +library_name: transformers +license: other +license_link: https://huggingface.co/OEvortex/HelpingAI2.5-2B/blob/main/LICENSE.md +license_name: helpingai +quantized_by: mradermacher +tags: +- HelpingAI +- Emotionally-Intelligent +- EQ-focused +- Conversational +- SLM +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/HelpingAI/HelpingAI2.5-2B + + +static quants are available at https://huggingface.co/mradermacher/HelpingAI2.5-2B-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similar-sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/HelpingAI2.5-2B-i1-GGUF/resolve/main/HelpingAI2.5-2B.i1-IQ1_S.gguf) | i1-IQ1_S | 0.5 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI2.5-2B-i1-GGUF/resolve/main/HelpingAI2.5-2B.i1-IQ1_M.gguf) | i1-IQ1_M | 0.5 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI2.5-2B-i1-GGUF/resolve/main/HelpingAI2.5-2B.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 0.6 | | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI2.5-2B-i1-GGUF/resolve/main/HelpingAI2.5-2B.i1-IQ2_XS.gguf) | i1-IQ2_XS | 0.6 | | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI2.5-2B-i1-GGUF/resolve/main/HelpingAI2.5-2B.i1-IQ2_S.gguf) | i1-IQ2_S | 0.7 | | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI2.5-2B-i1-GGUF/resolve/main/HelpingAI2.5-2B.i1-IQ2_M.gguf) | i1-IQ2_M | 0.7 | | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI2.5-2B-i1-GGUF/resolve/main/HelpingAI2.5-2B.i1-Q2_K_S.gguf) | i1-Q2_K_S | 0.7 | very low quality | +| 
[GGUF](https://huggingface.co/mradermacher/HelpingAI2.5-2B-i1-GGUF/resolve/main/HelpingAI2.5-2B.i1-Q2_K.gguf) | i1-Q2_K | 0.8 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI2.5-2B-i1-GGUF/resolve/main/HelpingAI2.5-2B.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 0.8 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI2.5-2B-i1-GGUF/resolve/main/HelpingAI2.5-2B.i1-IQ3_XS.gguf) | i1-IQ3_XS | 0.8 | | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI2.5-2B-i1-GGUF/resolve/main/HelpingAI2.5-2B.i1-IQ3_S.gguf) | i1-IQ3_S | 0.9 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI2.5-2B-i1-GGUF/resolve/main/HelpingAI2.5-2B.i1-Q3_K_S.gguf) | i1-Q3_K_S | 0.9 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI2.5-2B-i1-GGUF/resolve/main/HelpingAI2.5-2B.i1-IQ3_M.gguf) | i1-IQ3_M | 0.9 | | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI2.5-2B-i1-GGUF/resolve/main/HelpingAI2.5-2B.i1-Q3_K_M.gguf) | i1-Q3_K_M | 1.0 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI2.5-2B-i1-GGUF/resolve/main/HelpingAI2.5-2B.i1-Q3_K_L.gguf) | i1-Q3_K_L | 1.0 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI2.5-2B-i1-GGUF/resolve/main/HelpingAI2.5-2B.i1-IQ4_XS.gguf) | i1-IQ4_XS | 1.0 | | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI2.5-2B-i1-GGUF/resolve/main/HelpingAI2.5-2B.i1-Q4_0_4_4.gguf) | i1-Q4_0_4_4 | 1.1 | fast on arm, low quality | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI2.5-2B-i1-GGUF/resolve/main/HelpingAI2.5-2B.i1-Q4_0_4_8.gguf) | i1-Q4_0_4_8 | 1.1 | fast on arm+i8mm, low quality | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI2.5-2B-i1-GGUF/resolve/main/HelpingAI2.5-2B.i1-Q4_0_8_8.gguf) | i1-Q4_0_8_8 | 1.1 | fast on arm+sve, low quality | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI2.5-2B-i1-GGUF/resolve/main/HelpingAI2.5-2B.i1-Q4_0.gguf) | i1-Q4_0 | 1.1 | fast, low quality | 
+| [GGUF](https://huggingface.co/mradermacher/HelpingAI2.5-2B-i1-GGUF/resolve/main/HelpingAI2.5-2B.i1-Q4_K_S.gguf) | i1-Q4_K_S | 1.1 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI2.5-2B-i1-GGUF/resolve/main/HelpingAI2.5-2B.i1-Q4_K_M.gguf) | i1-Q4_K_M | 1.2 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI2.5-2B-i1-GGUF/resolve/main/HelpingAI2.5-2B.i1-Q5_K_S.gguf) | i1-Q5_K_S | 1.3 | | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI2.5-2B-i1-GGUF/resolve/main/HelpingAI2.5-2B.i1-Q5_K_M.gguf) | i1-Q5_K_M | 1.3 | | +| [GGUF](https://huggingface.co/mradermacher/HelpingAI2.5-2B-i1-GGUF/resolve/main/HelpingAI2.5-2B.i1-Q6_K.gguf) | i1-Q6_K | 1.5 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..f68c9f3 --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a19a4f67c63e4c0d3f1a699b1d3dbfd8ef9d3cfd1d2c0d35d78cd973129cd19e +size 1971637