commit f90bb0913d72c6714a5eb1a680e88d8b741cf0b6 Author: ModelHub XC Date: Wed Apr 22 07:46:10 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/rhybus-llama3.2-1b-instruct-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..30144d0 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,47 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +rhybus-llama3.2-1b-instruct.IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text 
+rhybus-llama3.2-1b-instruct.Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +rhybus-llama3.2-1b-instruct.Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +rhybus-llama3.2-1b-instruct.Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +rhybus-llama3.2-1b-instruct.Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +rhybus-llama3.2-1b-instruct.Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +rhybus-llama3.2-1b-instruct.Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +rhybus-llama3.2-1b-instruct.Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +rhybus-llama3.2-1b-instruct.Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +rhybus-llama3.2-1b-instruct.Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +rhybus-llama3.2-1b-instruct.Q8_0.gguf filter=lfs diff=lfs merge=lfs -text +rhybus-llama3.2-1b-instruct.f16.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..9b595e5 --- /dev/null +++ b/README.md @@ -0,0 +1,71 @@ +--- +base_model: Vinod-IE/rhybus-llama3.2-1b-instruct +language: +- en +library_name: transformers +mradermacher: + readme_rev: 1 +quantized_by: mradermacher +--- +## About + + + + + + + + + +static quants of https://huggingface.co/Vinod-IE/rhybus-llama3.2-1b-instruct + + + +***For a convenient overview and download list, visit our [model page for this model](https://hf.tst.eu/model#rhybus-llama3.2-1b-instruct-GGUF).*** + +weighted/imatrix quants seem not to be available (by me) at this time. If they do not show up a week or so after the static ones, I have probably not planned for them. Feel free to request them by opening a Community Discussion. +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. 
IQ-quants are often preferable over similar-sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/rhybus-llama3.2-1b-instruct-GGUF/resolve/main/rhybus-llama3.2-1b-instruct.Q2_K.gguf) | Q2_K | 0.7 | | +| [GGUF](https://huggingface.co/mradermacher/rhybus-llama3.2-1b-instruct-GGUF/resolve/main/rhybus-llama3.2-1b-instruct.Q3_K_S.gguf) | Q3_K_S | 0.7 | | +| [GGUF](https://huggingface.co/mradermacher/rhybus-llama3.2-1b-instruct-GGUF/resolve/main/rhybus-llama3.2-1b-instruct.Q3_K_M.gguf) | Q3_K_M | 0.8 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/rhybus-llama3.2-1b-instruct-GGUF/resolve/main/rhybus-llama3.2-1b-instruct.Q3_K_L.gguf) | Q3_K_L | 0.8 | | +| [GGUF](https://huggingface.co/mradermacher/rhybus-llama3.2-1b-instruct-GGUF/resolve/main/rhybus-llama3.2-1b-instruct.IQ4_XS.gguf) | IQ4_XS | 0.8 | | +| [GGUF](https://huggingface.co/mradermacher/rhybus-llama3.2-1b-instruct-GGUF/resolve/main/rhybus-llama3.2-1b-instruct.Q4_K_S.gguf) | Q4_K_S | 0.9 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/rhybus-llama3.2-1b-instruct-GGUF/resolve/main/rhybus-llama3.2-1b-instruct.Q4_K_M.gguf) | Q4_K_M | 0.9 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/rhybus-llama3.2-1b-instruct-GGUF/resolve/main/rhybus-llama3.2-1b-instruct.Q5_K_S.gguf) | Q5_K_S | 1.0 | | +| [GGUF](https://huggingface.co/mradermacher/rhybus-llama3.2-1b-instruct-GGUF/resolve/main/rhybus-llama3.2-1b-instruct.Q5_K_M.gguf) | Q5_K_M | 1.0 | | +| [GGUF](https://huggingface.co/mradermacher/rhybus-llama3.2-1b-instruct-GGUF/resolve/main/rhybus-llama3.2-1b-instruct.Q6_K.gguf) | Q6_K | 1.1 | very good quality | +| [GGUF](https://huggingface.co/mradermacher/rhybus-llama3.2-1b-instruct-GGUF/resolve/main/rhybus-llama3.2-1b-instruct.Q8_0.gguf) | Q8_0 | 1.4 | fast, best quality | +| 
[GGUF](https://huggingface.co/mradermacher/rhybus-llama3.2-1b-instruct-GGUF/resolve/main/rhybus-llama3.2-1b-instruct.f16.gguf) | f16 | 2.6 | 16 bpw, overkill | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. + + diff --git a/rhybus-llama3.2-1b-instruct.IQ4_XS.gguf b/rhybus-llama3.2-1b-instruct.IQ4_XS.gguf new file mode 100644 index 0000000..6a4d490 --- /dev/null +++ b/rhybus-llama3.2-1b-instruct.IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c95b8bc68a8587844bfffca1a8dd15cee9ca09c07d22ef0da9712ee49193be2f +size 748384416 diff --git a/rhybus-llama3.2-1b-instruct.Q2_K.gguf b/rhybus-llama3.2-1b-instruct.Q2_K.gguf new file mode 100644 index 0000000..5fde0b2 --- /dev/null +++ b/rhybus-llama3.2-1b-instruct.Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7944984b0e303774d27c6fc755a674a1cab98db4fbde58bbc99336bb0e8f393e +size 580874400 diff --git a/rhybus-llama3.2-1b-instruct.Q3_K_L.gguf b/rhybus-llama3.2-1b-instruct.Q3_K_L.gguf new file mode 100644 index 0000000..a9f93ca --- /dev/null +++ b/rhybus-llama3.2-1b-instruct.Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77549ac3f04931bfd3ec2bb12df04630eaae1339a494c3584f3eb08486750ee9 +size 732524704 diff --git a/rhybus-llama3.2-1b-instruct.Q3_K_M.gguf b/rhybus-llama3.2-1b-instruct.Q3_K_M.gguf new file mode 100644 index 
0000000..b2f7031 --- /dev/null +++ b/rhybus-llama3.2-1b-instruct.Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a15160c1d4fd62f69b745ac1d2c09d761b316e0f53d083cf5dbffc5f6bac71d0 +size 690843808 diff --git a/rhybus-llama3.2-1b-instruct.Q3_K_S.gguf b/rhybus-llama3.2-1b-instruct.Q3_K_S.gguf new file mode 100644 index 0000000..6ad3938 --- /dev/null +++ b/rhybus-llama3.2-1b-instruct.Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b87f33fd9107c6f96452967e710820d1c47e8615fc23a6f4bd7b757249cedcbe +size 641691808 diff --git a/rhybus-llama3.2-1b-instruct.Q4_K_M.gguf b/rhybus-llama3.2-1b-instruct.Q4_K_M.gguf new file mode 100644 index 0000000..0b1c55c --- /dev/null +++ b/rhybus-llama3.2-1b-instruct.Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3dc08a23e9a4a86787a361d6fc138b185f144967de52be5ec356e5c4af44194 +size 807694496 diff --git a/rhybus-llama3.2-1b-instruct.Q4_K_S.gguf b/rhybus-llama3.2-1b-instruct.Q4_K_S.gguf new file mode 100644 index 0000000..4e08159 --- /dev/null +++ b/rhybus-llama3.2-1b-instruct.Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:518b27d57dac426a92535aeaa619373181d51fa35ac2023443e0ecc6c24d52a4 +size 775647392 diff --git a/rhybus-llama3.2-1b-instruct.Q5_K_M.gguf b/rhybus-llama3.2-1b-instruct.Q5_K_M.gguf new file mode 100644 index 0000000..5c60ca9 --- /dev/null +++ b/rhybus-llama3.2-1b-instruct.Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffdb326546214ff06f57448cd3ed7ceb56e647f4b93156c8eef0fb38f9080f61 +size 911503520 diff --git a/rhybus-llama3.2-1b-instruct.Q5_K_S.gguf b/rhybus-llama3.2-1b-instruct.Q5_K_S.gguf new file mode 100644 index 0000000..7aef10e --- /dev/null +++ b/rhybus-llama3.2-1b-instruct.Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7aac7ef9d08ad67b574269c8ee619edd244e95b0fb77bb21b3b0a4ca85c6f106 +size 892563616 diff 
--git a/rhybus-llama3.2-1b-instruct.Q6_K.gguf b/rhybus-llama3.2-1b-instruct.Q6_K.gguf new file mode 100644 index 0000000..91edc37 --- /dev/null +++ b/rhybus-llama3.2-1b-instruct.Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fc2ca2b509f6f1801442432498ebde83adabb1499c292b1817747be6c8182f6 +size 1021800608 diff --git a/rhybus-llama3.2-1b-instruct.Q8_0.gguf b/rhybus-llama3.2-1b-instruct.Q8_0.gguf new file mode 100644 index 0000000..20fc8d9 --- /dev/null +++ b/rhybus-llama3.2-1b-instruct.Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:728aa53f37cf36d5d7d365df29cee361cb1da07af2bb25da61c0ca10c8c1f81f +size 1321083040 diff --git a/rhybus-llama3.2-1b-instruct.f16.gguf b/rhybus-llama3.2-1b-instruct.f16.gguf new file mode 100644 index 0000000..aa06426 --- /dev/null +++ b/rhybus-llama3.2-1b-instruct.f16.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e6f30ced737fe4730f8506a11175356ba2b5056d8132e56316270debfe6330d +size 2479595680