commit a01855df6285a41f893e9de21fbfb381e3cf1ea4 Author: ModelHub XC Date: Tue May 5 08:57:41 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/bonsai-2b-i1-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..7abe5d2 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +bonsai-2b.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text 
+bonsai-2b.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +bonsai-2b.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +bonsai-2b.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +bonsai-2b.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +bonsai-2b.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +bonsai-2b.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +bonsai-2b.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text +bonsai-2b.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +bonsai-2b.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +bonsai-2b.i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +bonsai-2b.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +bonsai-2b.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +bonsai-2b.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +bonsai-2b.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +bonsai-2b.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +bonsai-2b.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +bonsai-2b.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +bonsai-2b.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +bonsai-2b.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +bonsai-2b.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +bonsai-2b.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +bonsai-2b.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +bonsai-2b.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..1f6551d --- /dev/null +++ b/README.md @@ -0,0 +1,80 @@ +--- +base_model: Sakalti/bonsai-2b +language: +- en +- ja +library_name: transformers +license: gemma +quantized_by: mradermacher +tags: +- mergekit +- merge +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/Sakalti/bonsai-2b + + +static quants are available at https://huggingface.co/mradermacher/bonsai-2b-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's 
+READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similarly sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/bonsai-2b-i1-GGUF/resolve/main/bonsai-2b.i1-IQ1_S.gguf) | i1-IQ1_S | 0.9 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/bonsai-2b-i1-GGUF/resolve/main/bonsai-2b.i1-IQ1_M.gguf) | i1-IQ1_M | 1.0 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/bonsai-2b-i1-GGUF/resolve/main/bonsai-2b.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 1.0 | | +| [GGUF](https://huggingface.co/mradermacher/bonsai-2b-i1-GGUF/resolve/main/bonsai-2b.i1-IQ2_XS.gguf) | i1-IQ2_XS | 1.1 | | +| [GGUF](https://huggingface.co/mradermacher/bonsai-2b-i1-GGUF/resolve/main/bonsai-2b.i1-IQ2_S.gguf) | i1-IQ2_S | 1.1 | | +| [GGUF](https://huggingface.co/mradermacher/bonsai-2b-i1-GGUF/resolve/main/bonsai-2b.i1-IQ2_M.gguf) | i1-IQ2_M | 1.2 | | +| [GGUF](https://huggingface.co/mradermacher/bonsai-2b-i1-GGUF/resolve/main/bonsai-2b.i1-Q2_K_S.gguf) | i1-Q2_K_S | 1.3 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/bonsai-2b-i1-GGUF/resolve/main/bonsai-2b.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 1.3 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/bonsai-2b-i1-GGUF/resolve/main/bonsai-2b.i1-Q2_K.gguf) | i1-Q2_K | 1.3 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/bonsai-2b-i1-GGUF/resolve/main/bonsai-2b.i1-IQ3_XS.gguf) | i1-IQ3_XS | 1.4 | | +| [GGUF](https://huggingface.co/mradermacher/bonsai-2b-i1-GGUF/resolve/main/bonsai-2b.i1-IQ3_S.gguf) | i1-IQ3_S | 1.5 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/bonsai-2b-i1-GGUF/resolve/main/bonsai-2b.i1-Q3_K_S.gguf) | i1-Q3_K_S | 1.5 | IQ3_XS probably better | +| 
[GGUF](https://huggingface.co/mradermacher/bonsai-2b-i1-GGUF/resolve/main/bonsai-2b.i1-IQ3_M.gguf) | i1-IQ3_M | 1.5 | | +| [GGUF](https://huggingface.co/mradermacher/bonsai-2b-i1-GGUF/resolve/main/bonsai-2b.i1-Q3_K_M.gguf) | i1-Q3_K_M | 1.6 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/bonsai-2b-i1-GGUF/resolve/main/bonsai-2b.i1-Q3_K_L.gguf) | i1-Q3_K_L | 1.7 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/bonsai-2b-i1-GGUF/resolve/main/bonsai-2b.i1-IQ4_XS.gguf) | i1-IQ4_XS | 1.7 | | +| [GGUF](https://huggingface.co/mradermacher/bonsai-2b-i1-GGUF/resolve/main/bonsai-2b.i1-IQ4_NL.gguf) | i1-IQ4_NL | 1.7 | prefer IQ4_XS | +| [GGUF](https://huggingface.co/mradermacher/bonsai-2b-i1-GGUF/resolve/main/bonsai-2b.i1-Q4_0.gguf) | i1-Q4_0 | 1.7 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/bonsai-2b-i1-GGUF/resolve/main/bonsai-2b.i1-Q4_K_S.gguf) | i1-Q4_K_S | 1.7 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/bonsai-2b-i1-GGUF/resolve/main/bonsai-2b.i1-Q4_K_M.gguf) | i1-Q4_K_M | 1.8 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/bonsai-2b-i1-GGUF/resolve/main/bonsai-2b.i1-Q4_1.gguf) | i1-Q4_1 | 1.9 | | +| [GGUF](https://huggingface.co/mradermacher/bonsai-2b-i1-GGUF/resolve/main/bonsai-2b.i1-Q5_K_S.gguf) | i1-Q5_K_S | 2.0 | | +| [GGUF](https://huggingface.co/mradermacher/bonsai-2b-i1-GGUF/resolve/main/bonsai-2b.i1-Q5_K_M.gguf) | i1-Q5_K_M | 2.0 | | +| [GGUF](https://huggingface.co/mradermacher/bonsai-2b-i1-GGUF/resolve/main/bonsai-2b.i1-Q6_K.gguf) | i1-Q6_K | 2.3 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See 
https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/bonsai-2b.i1-IQ1_M.gguf b/bonsai-2b.i1-IQ1_M.gguf new file mode 100644 index 0000000..7fa2952 --- /dev/null +++ b/bonsai-2b.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0a60e5ab1330c4f3e0aa6fb775626bd4cecc29b2b6922314df1bd1700707dec +size 873798400 diff --git a/bonsai-2b.i1-IQ1_S.gguf b/bonsai-2b.i1-IQ1_S.gguf new file mode 100644 index 0000000..4423dbd --- /dev/null +++ b/bonsai-2b.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:577c9efa0feec4b3ea0fd33e45a8da6313b260954fe3a85bb6b9ae19f3558ca4 +size 832160512 diff --git a/bonsai-2b.i1-IQ2_M.gguf b/bonsai-2b.i1-IQ2_M.gguf new file mode 100644 index 0000000..1934aae --- /dev/null +++ b/bonsai-2b.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2e4efc352a332155b69cbd79e71091270757b252cd31ee7bdad464bc392706f +size 1088015104 diff --git a/bonsai-2b.i1-IQ2_S.gguf b/bonsai-2b.i1-IQ2_S.gguf new file mode 100644 index 0000000..a9355b1 --- /dev/null +++ b/bonsai-2b.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5911760becaec65f39f4bd3d14d6bcfa3a26a85a2480835e31e497f9700768b5 +size 1032497920 diff --git a/bonsai-2b.i1-IQ2_XS.gguf b/bonsai-2b.i1-IQ2_XS.gguf new file mode 100644 index 0000000..96ec97e --- /dev/null +++ b/bonsai-2b.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:882e232e0cf5bc4af8af7862cc3cd8c45c124f996feaa6f59565249cb01ba249 +size 1002545920 diff --git a/bonsai-2b.i1-IQ2_XXS.gguf b/bonsai-2b.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..410ce8f --- /dev/null +++ b/bonsai-2b.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5310cbaef8ba978956d7f1e2394cc56fb4507e2b3f81b4711a77e10e595517e6 +size 943194880 diff --git a/bonsai-2b.i1-IQ3_M.gguf b/bonsai-2b.i1-IQ3_M.gguf new file mode 100644 index 0000000..a826da3 --- /dev/null +++ b/bonsai-2b.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86d0225141af61e9c9dd20052eaa957b4a1ad645256c65a3260db79f4974b939 +size 1393562368 diff --git a/bonsai-2b.i1-IQ3_S.gguf b/bonsai-2b.i1-IQ3_S.gguf new file mode 100644 index 0000000..9f869af --- /dev/null +++ b/bonsai-2b.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1e28bbf96e1d53c391c0e907030eac949554af035efd106efbd17a2a79c4e9b +size 1360661248 diff --git a/bonsai-2b.i1-IQ3_XS.gguf b/bonsai-2b.i1-IQ3_XS.gguf new file mode 100644 index 0000000..fb58399 --- /dev/null +++ b/bonsai-2b.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:624d30b7903d80d55dcf65a2a201974892ab96e391fedfb0ad4392b2b09feb32 +size 1314212608 diff --git a/bonsai-2b.i1-IQ3_XXS.gguf b/bonsai-2b.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..cfefe41 --- /dev/null +++ b/bonsai-2b.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15dd29654e0ff48dd8c2a59aeb478a6f3a76be927224e28b8954675eb747f0ac +size 1181686528 diff --git a/bonsai-2b.i1-IQ4_NL.gguf b/bonsai-2b.i1-IQ4_NL.gguf new file mode 100644 index 0000000..57f7b7a --- /dev/null +++ b/bonsai-2b.i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98b184f06396b6e0d5e659f81007f29d6ed9b66579f200a4ee3ec2e895806fdb +size 1629510400 diff --git a/bonsai-2b.i1-IQ4_XS.gguf 
b/bonsai-2b.i1-IQ4_XS.gguf new file mode 100644 index 0000000..441276a --- /dev/null +++ b/bonsai-2b.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bb9b2c6d454b5337b792215db1f6cfbf36c636a4241255f640ca13515491487 +size 1566251776 diff --git a/bonsai-2b.i1-Q2_K.gguf b/bonsai-2b.i1-Q2_K.gguf new file mode 100644 index 0000000..9ed9636 --- /dev/null +++ b/bonsai-2b.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a659aeaa5f9318b4d2a7ed29a8f097b71fdd985e7c83ae036202cc0e5b5c8cd +size 1229830912 diff --git a/bonsai-2b.i1-Q2_K_S.gguf b/bonsai-2b.i1-Q2_K_S.gguf new file mode 100644 index 0000000..932c092 --- /dev/null +++ b/bonsai-2b.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:990c9eeeee7bf7559b4bc3261450de96379363ff865dd5573bd779d6114cf143 +size 1170000640 diff --git a/bonsai-2b.i1-Q3_K_L.gguf b/bonsai-2b.i1-Q3_K_L.gguf new file mode 100644 index 0000000..0d973b9 --- /dev/null +++ b/bonsai-2b.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db662cbe27aa30208f7481d0e62bdf2ce569c3ea8d2328950a8ac65074bb03ee +size 1550437120 diff --git a/bonsai-2b.i1-Q3_K_M.gguf b/bonsai-2b.i1-Q3_K_M.gguf new file mode 100644 index 0000000..46f79db --- /dev/null +++ b/bonsai-2b.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99f999de0771f8357793092236a497340bbf61c641ddbaf96b92dbcbd75a23c1 +size 1461668608 diff --git a/bonsai-2b.i1-Q3_K_S.gguf b/bonsai-2b.i1-Q3_K_S.gguf new file mode 100644 index 0000000..92ddf57 --- /dev/null +++ b/bonsai-2b.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a1b6fc2cc905c339b2c8d291ac9d4f76033ddd2c22e676f856cb2a618859d6b +size 1360661248 diff --git a/bonsai-2b.i1-Q4_0.gguf b/bonsai-2b.i1-Q4_0.gguf new file mode 100644 index 0000000..0dbfe16 --- /dev/null +++ b/bonsai-2b.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:f505989fa77771e2335cecebbfc846804cc5648a9a394afe6fa4860c5ced2d3b +size 1633491712 diff --git a/bonsai-2b.i1-Q4_1.gguf b/bonsai-2b.i1-Q4_1.gguf new file mode 100644 index 0000000..e89dd59 --- /dev/null +++ b/bonsai-2b.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c2493b87b57da0e3eef02c922ca38a801ea058daaa216fc88e3d70484a32776 +size 1756027648 diff --git a/bonsai-2b.i1-Q4_K_M.gguf b/bonsai-2b.i1-Q4_K_M.gguf new file mode 100644 index 0000000..58b0dc0 --- /dev/null +++ b/bonsai-2b.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb7a687afe5d346b3f658d5e82d3f2883bc7478a32dd6ed3b5349696a2e89b57 +size 1708583680 diff --git a/bonsai-2b.i1-Q4_K_S.gguf b/bonsai-2b.i1-Q4_K_S.gguf new file mode 100644 index 0000000..d1d8326 --- /dev/null +++ b/bonsai-2b.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fd6ca05659cf6770af25de1aaa4fca7bf5b06bcb4394e21df7e724777eb9585 +size 1638652672 diff --git a/bonsai-2b.i1-Q5_K_M.gguf b/bonsai-2b.i1-Q5_K_M.gguf new file mode 100644 index 0000000..6b44225 --- /dev/null +++ b/bonsai-2b.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:098c8cdb1bf01833c8181471a9f77cdddba924d07d34b350510a456359430a69 +size 1923279616 diff --git a/bonsai-2b.i1-Q5_K_S.gguf b/bonsai-2b.i1-Q5_K_S.gguf new file mode 100644 index 0000000..cb38e52 --- /dev/null +++ b/bonsai-2b.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:082565b6047d7fdd322c5c548689a16f8d1a119ae36c02ebe1e94166d942d636 +size 1882544896 diff --git a/bonsai-2b.i1-Q6_K.gguf b/bonsai-2b.i1-Q6_K.gguf new file mode 100644 index 0000000..9353ff3 --- /dev/null +++ b/bonsai-2b.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7aa2f0a2604662a2cb00bf03afe20629f9b32c95f786d5a38888213a8ddbe5b +size 2151394048 diff --git a/imatrix.dat 
b/imatrix.dat new file mode 100644 index 0000000..91d93e7 --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84107401f1637b12c2be0903a1d18dad4b69e06d88b349bd64514181a69b15fb +size 2375559