commit 33ab03c7638b217127028392b5e6f0155aebaec1 Author: ModelHub XC Date: Wed May 20 20:16:17 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/Olmoe-0.5B-6B-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..aa209fa --- /dev/null +++ b/.gitattributes @@ -0,0 +1,47 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +Olmoe-0.5B-6B.Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +Olmoe-0.5B-6B.Q4_K_S.gguf filter=lfs diff=lfs 
merge=lfs -text +Olmoe-0.5B-6B.f16.gguf filter=lfs diff=lfs merge=lfs -text +Olmoe-0.5B-6B.Q8_0.gguf filter=lfs diff=lfs merge=lfs -text +Olmoe-0.5B-6B.Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +Olmoe-0.5B-6B.Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Olmoe-0.5B-6B.Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Olmoe-0.5B-6B.Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Olmoe-0.5B-6B.Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Olmoe-0.5B-6B.Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Olmoe-0.5B-6B.Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Olmoe-0.5B-6B.IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/Olmoe-0.5B-6B.IQ4_XS.gguf b/Olmoe-0.5B-6B.IQ4_XS.gguf new file mode 100644 index 0000000..7d00472 --- /dev/null +++ b/Olmoe-0.5B-6B.IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cea2302252e5582a29c0db478d0edb8b8377c1c2d4feb6693585ba7608dbb303 +size 4797933568 diff --git a/Olmoe-0.5B-6B.Q2_K.gguf b/Olmoe-0.5B-6B.Q2_K.gguf new file mode 100644 index 0000000..16a46a9 --- /dev/null +++ b/Olmoe-0.5B-6B.Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:648f675901dce319fa69423f89ec2b78e99124355db5933349dd9e1a853e2efa +size 3269515264 diff --git a/Olmoe-0.5B-6B.Q3_K_L.gguf b/Olmoe-0.5B-6B.Q3_K_L.gguf new file mode 100644 index 0000000..ca5eccf --- /dev/null +++ b/Olmoe-0.5B-6B.Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e5b596d9bd2441e46ba35c0795b82bd5216ff2333490a55a2b4107f6de64199 +size 4615110656 diff --git a/Olmoe-0.5B-6B.Q3_K_M.gguf b/Olmoe-0.5B-6B.Q3_K_M.gguf new file mode 100644 index 0000000..f9d9c65 --- /dev/null +++ b/Olmoe-0.5B-6B.Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e95b2745be584b05b4859933be58133588e468b2c919a7d6d24a314ac1fcad19 +size 4251779072 diff --git a/Olmoe-0.5B-6B.Q3_K_S.gguf b/Olmoe-0.5B-6B.Q3_K_S.gguf new file mode 100644 index 0000000..1768a29 --- 
/dev/null +++ b/Olmoe-0.5B-6B.Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c08c99eb9161810fdb4b11a68e48ee39c2345b721e0bc40acf2056d962898f19 +size 3863576576 diff --git a/Olmoe-0.5B-6B.Q4_K_M.gguf b/Olmoe-0.5B-6B.Q4_K_M.gguf new file mode 100644 index 0000000..ce54b7c --- /dev/null +++ b/Olmoe-0.5B-6B.Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:394c89cc7247d125a7361f0041dd0e5a0a0bbd6e93b86173719e54edf3b6920b +size 5397940224 diff --git a/Olmoe-0.5B-6B.Q4_K_S.gguf b/Olmoe-0.5B-6B.Q4_K_S.gguf new file mode 100644 index 0000000..a8e768a --- /dev/null +++ b/Olmoe-0.5B-6B.Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac1093b750235d9e57f8afbb12f210145108bd11ebb6b4b28b0f7f031da65766 +size 5065066496 diff --git a/Olmoe-0.5B-6B.Q5_K_M.gguf b/Olmoe-0.5B-6B.Q5_K_M.gguf new file mode 100644 index 0000000..452e734 --- /dev/null +++ b/Olmoe-0.5B-6B.Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdfc05897d8f85a40cfd90e5c34b76f8a65deb9be8f152c4e8a2587e4a99a116 +size 6313904128 diff --git a/Olmoe-0.5B-6B.Q5_K_S.gguf b/Olmoe-0.5B-6B.Q5_K_S.gguf new file mode 100644 index 0000000..a50f43b --- /dev/null +++ b/Olmoe-0.5B-6B.Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fd25bc36c1b17874c91ba6b769a4ad963a3d1466bda375e7417566c24c3a6f9 +size 6123112448 diff --git a/Olmoe-0.5B-6B.Q6_K.gguf b/Olmoe-0.5B-6B.Q6_K.gguf new file mode 100644 index 0000000..067992e --- /dev/null +++ b/Olmoe-0.5B-6B.Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8884638a05f884947bfbd0973aacd4e7b409fed8ba818d4d51d0c0f910604cd +size 7287115776 diff --git a/Olmoe-0.5B-6B.Q8_0.gguf b/Olmoe-0.5B-6B.Q8_0.gguf new file mode 100644 index 0000000..aa2e63d --- /dev/null +++ b/Olmoe-0.5B-6B.Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:9689ca25a1192867998a040cc9cecc7917b1bbd79bcada533045d90d871cbd54 +size 9434660864 diff --git a/Olmoe-0.5B-6B.f16.gguf b/Olmoe-0.5B-6B.f16.gguf new file mode 100644 index 0000000..6f32243 --- /dev/null +++ b/Olmoe-0.5B-6B.f16.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f60439049f97662fb7b29d16be16e2fc139c324049c48d03ec0277b9554eff41 +size 17747738624 diff --git a/README.md b/README.md new file mode 100644 index 0000000..483ddc0 --- /dev/null +++ b/README.md @@ -0,0 +1,69 @@ +--- +base_model: motionlabs/Olmoe-0.5B-6B +language: +- en +library_name: transformers +mradermacher: + readme_rev: 1 +quantized_by: mradermacher +tags: [] +--- +## About + + + + + + +static quants of https://huggingface.co/motionlabs/Olmoe-0.5B-6B + + + +***For a convenient overview and download list, visit our [model page for this model](https://hf.tst.eu/model#Olmoe-0.5B-6B-GGUF).*** + +Weighted/imatrix quants do not appear to be available from me at this time. If they do not show up a week or so after the static ones, I have probably not planned for them. Feel free to request them by opening a Community Discussion. +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. 
IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/Olmoe-0.5B-6B-GGUF/resolve/main/Olmoe-0.5B-6B.Q2_K.gguf) | Q2_K | 3.4 | | +| [GGUF](https://huggingface.co/mradermacher/Olmoe-0.5B-6B-GGUF/resolve/main/Olmoe-0.5B-6B.Q3_K_S.gguf) | Q3_K_S | 4.0 | | +| [GGUF](https://huggingface.co/mradermacher/Olmoe-0.5B-6B-GGUF/resolve/main/Olmoe-0.5B-6B.Q3_K_M.gguf) | Q3_K_M | 4.4 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/Olmoe-0.5B-6B-GGUF/resolve/main/Olmoe-0.5B-6B.Q3_K_L.gguf) | Q3_K_L | 4.7 | | +| [GGUF](https://huggingface.co/mradermacher/Olmoe-0.5B-6B-GGUF/resolve/main/Olmoe-0.5B-6B.IQ4_XS.gguf) | IQ4_XS | 4.9 | | +| [GGUF](https://huggingface.co/mradermacher/Olmoe-0.5B-6B-GGUF/resolve/main/Olmoe-0.5B-6B.Q4_K_S.gguf) | Q4_K_S | 5.2 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/Olmoe-0.5B-6B-GGUF/resolve/main/Olmoe-0.5B-6B.Q4_K_M.gguf) | Q4_K_M | 5.5 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/Olmoe-0.5B-6B-GGUF/resolve/main/Olmoe-0.5B-6B.Q5_K_S.gguf) | Q5_K_S | 6.2 | | +| [GGUF](https://huggingface.co/mradermacher/Olmoe-0.5B-6B-GGUF/resolve/main/Olmoe-0.5B-6B.Q5_K_M.gguf) | Q5_K_M | 6.4 | | +| [GGUF](https://huggingface.co/mradermacher/Olmoe-0.5B-6B-GGUF/resolve/main/Olmoe-0.5B-6B.Q6_K.gguf) | Q6_K | 7.4 | very good quality | +| [GGUF](https://huggingface.co/mradermacher/Olmoe-0.5B-6B-GGUF/resolve/main/Olmoe-0.5B-6B.Q8_0.gguf) | Q8_0 | 9.5 | fast, best quality | +| [GGUF](https://huggingface.co/mradermacher/Olmoe-0.5B-6B-GGUF/resolve/main/Olmoe-0.5B-6B.f16.gguf) | f16 | 17.8 | 16 bpw, overkill | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: 
+https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for answers to +common questions, or to request that another model be quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. + +