commit d09a2f88e39d123dc64770bdde67e2fdbda789a3 Author: ModelHub XC Date: Tue Apr 21 10:15:27 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/bloomz-1b1-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..4d79fc9 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,47 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +bloomz-1b1.IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +bloomz-1b1.Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +bloomz-1b1.Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +bloomz-1b1.Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +bloomz-1b1.Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +bloomz-1b1.Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +bloomz-1b1.Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +bloomz-1b1.Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +bloomz-1b1.Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +bloomz-1b1.Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +bloomz-1b1.Q8_0.gguf filter=lfs diff=lfs merge=lfs -text +bloomz-1b1.f16.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..53432a9 --- /dev/null +++ b/README.md @@ -0,0 +1,111 @@ +--- +base_model: bigscience/bloomz-1b1 +datasets: +- bigscience/xP3 +language: +- ak +- ar +- as +- bm +- bn +- ca +- code +- en +- es +- eu +- fon +- fr +- gu +- hi +- id +- ig +- ki +- kn +- lg +- ln +- ml +- mr +- ne +- nso +- ny +- or +- pa +- pt +- rn +- rw +- sn +- st +- sw +- ta +- te +- tn +- ts +- tum +- tw +- ur +- vi +- wo +- xh +- yo +- zh +- zu +library_name: transformers +license: bigscience-bloom-rail-1.0 +quantized_by: mradermacher +--- +## About + + + + + + +static quants of https://huggingface.co/bigscience/bloomz-1b1 + + +weighted/imatrix quants are available at https://huggingface.co/mradermacher/bloomz-1b1-i1-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/bloomz-1b1-GGUF/resolve/main/bloomz-1b1.Q2_K.gguf) | Q2_K | 0.8 | | +| [GGUF](https://huggingface.co/mradermacher/bloomz-1b1-GGUF/resolve/main/bloomz-1b1.Q3_K_S.gguf) | Q3_K_S | 0.9 | | +| [GGUF](https://huggingface.co/mradermacher/bloomz-1b1-GGUF/resolve/main/bloomz-1b1.Q3_K_M.gguf) | Q3_K_M | 0.9 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/bloomz-1b1-GGUF/resolve/main/bloomz-1b1.Q3_K_L.gguf) | Q3_K_L | 1.0 | | +| [GGUF](https://huggingface.co/mradermacher/bloomz-1b1-GGUF/resolve/main/bloomz-1b1.IQ4_XS.gguf) | IQ4_XS | 1.0 | | +| [GGUF](https://huggingface.co/mradermacher/bloomz-1b1-GGUF/resolve/main/bloomz-1b1.Q4_K_S.gguf) | Q4_K_S | 1.0 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/bloomz-1b1-GGUF/resolve/main/bloomz-1b1.Q4_K_M.gguf) | Q4_K_M | 1.1 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/bloomz-1b1-GGUF/resolve/main/bloomz-1b1.Q5_K_S.gguf) | Q5_K_S | 1.2 | | +| [GGUF](https://huggingface.co/mradermacher/bloomz-1b1-GGUF/resolve/main/bloomz-1b1.Q5_K_M.gguf) | Q5_K_M | 1.2 | | +| [GGUF](https://huggingface.co/mradermacher/bloomz-1b1-GGUF/resolve/main/bloomz-1b1.Q6_K.gguf) | Q6_K | 1.3 | very good quality | +| [GGUF](https://huggingface.co/mradermacher/bloomz-1b1-GGUF/resolve/main/bloomz-1b1.Q8_0.gguf) | Q8_0 | 1.7 | fast, best quality | +| [GGUF](https://huggingface.co/mradermacher/bloomz-1b1-GGUF/resolve/main/bloomz-1b1.f16.gguf) | f16 | 3.0 | 16 bpw, overkill | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. + + diff --git a/bloomz-1b1.IQ4_XS.gguf b/bloomz-1b1.IQ4_XS.gguf new file mode 100644 index 0000000..e537120 --- /dev/null +++ b/bloomz-1b1.IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79df3894c1492d464bfd7fb80d883084ceb1aaf473cdf76dfaf7645ba8de6f9b +size 900787712 diff --git a/bloomz-1b1.Q2_K.gguf b/bloomz-1b1.Q2_K.gguf new file mode 100644 index 0000000..b9bf520 --- /dev/null +++ b/bloomz-1b1.Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99f751af5b5dd6b66bd18c3a6456fa9da268cb2ba24a880151c9df0d54d3704c +size 708824576 diff --git a/bloomz-1b1.Q3_K_L.gguf b/bloomz-1b1.Q3_K_L.gguf new file mode 100644 index 0000000..bd416d3 --- /dev/null +++ b/bloomz-1b1.Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:716245bb6db67649c6d0037c7547498a72c7652582b0d4518cf356624db2b5fb +size 883768832 diff --git a/bloomz-1b1.Q3_K_M.gguf b/bloomz-1b1.Q3_K_M.gguf new file mode 100644 index 0000000..aa471e8 --- /dev/null +++ b/bloomz-1b1.Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53c9bc41f2aa60e002bc4fd6b73f1637c66b07359634fe0d5ae698a2067e0759 +size 849559040 diff --git a/bloomz-1b1.Q3_K_S.gguf b/bloomz-1b1.Q3_K_S.gguf new file mode 100644 index 0000000..0a82673 --- /dev/null +++ b/bloomz-1b1.Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae3ac45235cf79a70a26560cb991b93b0a8f0dd9ab2b83f84200485d7198d63e +size 788217344 diff --git a/bloomz-1b1.Q4_K_M.gguf b/bloomz-1b1.Q4_K_M.gguf new file mode 100644 index 0000000..e41c72f --- /dev/null +++ b/bloomz-1b1.Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c76e4d9d6b8d243497502e4bf345da887ce870631c5bc54e5c6942bb01d3603 +size 980069888 diff --git a/bloomz-1b1.Q4_K_S.gguf b/bloomz-1b1.Q4_K_S.gguf new file mode 100644 index 0000000..02d7268 --- /dev/null +++ b/bloomz-1b1.Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcdfe1c8e6961a78c813c615db718cd9fa7523ae421fd45f351a22588d6289a3 +size 933178880 diff --git a/bloomz-1b1.Q5_K_M.gguf b/bloomz-1b1.Q5_K_M.gguf new file mode 100644 index 0000000..35239ae --- /dev/null +++ b/bloomz-1b1.Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a124930bb0a48ab7f9c5331b548d40e516a1ace72f0f1ce502c2a51fd64e1ae +size 1100344832 diff --git a/bloomz-1b1.Q5_K_S.gguf b/bloomz-1b1.Q5_K_S.gguf new file mode 100644 index 0000000..c118ad0 --- /dev/null +++ b/bloomz-1b1.Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b8a56261c94423a0d642bffeb4dce3ca3ced7b15749748cf60d46fe0726786c +size 1062743552 diff --git a/bloomz-1b1.Q6_K.gguf b/bloomz-1b1.Q6_K.gguf new file mode 100644 index 0000000..e1e97f8 --- /dev/null +++ b/bloomz-1b1.Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45739ef82250b8d5e84e0dc19713a085c760b1e5416009b0ef68422c545691ac +size 1204166144 diff --git a/bloomz-1b1.Q8_0.gguf b/bloomz-1b1.Q8_0.gguf new file mode 100644 index 0000000..75ebe63 --- /dev/null +++ b/bloomz-1b1.Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c82551cfc8e342c5438bd5e9b16d4c38813dd587d3471419c5fb88418a5a07df +size 1555381760 diff --git a/bloomz-1b1.f16.gguf b/bloomz-1b1.f16.gguf new file mode 100644 index 0000000..bf2eab4 --- /dev/null +++ b/bloomz-1b1.f16.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14dfadef8675ad0d2caaea302f1ca30cc1f72a3316063dabadc0fc853a04ce22 +size 2914926080