From 63dba79fa0fd3ee1f00abb25ff46b3c1b9835b7a Mon Sep 17 00:00:00 2001
From: ModelHub XC
Date: Sat, 11 Apr 2026 06:34:56 +0800
Subject: [PATCH] Initialize project; model provided by the ModelHub XC community
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Model: mradermacher/Dolphin3.0-Qwen2.5-0.5B-GGUF
Source: Original Platform
---
 .gitattributes                      | 47 ++++++++++++++++
 Dolphin3.0-Qwen2.5-0.5B.IQ4_XS.gguf |  3 ++
 Dolphin3.0-Qwen2.5-0.5B.Q2_K.gguf   |  3 ++
 Dolphin3.0-Qwen2.5-0.5B.Q3_K_L.gguf |  3 ++
 Dolphin3.0-Qwen2.5-0.5B.Q3_K_M.gguf |  3 ++
 Dolphin3.0-Qwen2.5-0.5B.Q3_K_S.gguf |  3 ++
 Dolphin3.0-Qwen2.5-0.5B.Q4_K_M.gguf |  3 ++
 Dolphin3.0-Qwen2.5-0.5B.Q4_K_S.gguf |  3 ++
 Dolphin3.0-Qwen2.5-0.5B.Q5_K_M.gguf |  3 ++
 Dolphin3.0-Qwen2.5-0.5B.Q5_K_S.gguf |  3 ++
 Dolphin3.0-Qwen2.5-0.5B.Q6_K.gguf   |  3 ++
 Dolphin3.0-Qwen2.5-0.5B.Q8_0.gguf   |  3 ++
 Dolphin3.0-Qwen2.5-0.5B.f16.gguf    |  3 ++
 README.md                           | 84 +++++++++++++++++++++++++++++
 14 files changed, 167 insertions(+)
 create mode 100644 .gitattributes
 create mode 100644 Dolphin3.0-Qwen2.5-0.5B.IQ4_XS.gguf
 create mode 100644 Dolphin3.0-Qwen2.5-0.5B.Q2_K.gguf
 create mode 100644 Dolphin3.0-Qwen2.5-0.5B.Q3_K_L.gguf
 create mode 100644 Dolphin3.0-Qwen2.5-0.5B.Q3_K_M.gguf
 create mode 100644 Dolphin3.0-Qwen2.5-0.5B.Q3_K_S.gguf
 create mode 100644 Dolphin3.0-Qwen2.5-0.5B.Q4_K_M.gguf
 create mode 100644 Dolphin3.0-Qwen2.5-0.5B.Q4_K_S.gguf
 create mode 100644 Dolphin3.0-Qwen2.5-0.5B.Q5_K_M.gguf
 create mode 100644 Dolphin3.0-Qwen2.5-0.5B.Q5_K_S.gguf
 create mode 100644 Dolphin3.0-Qwen2.5-0.5B.Q6_K.gguf
 create mode 100644 Dolphin3.0-Qwen2.5-0.5B.Q8_0.gguf
 create mode 100644 Dolphin3.0-Qwen2.5-0.5B.f16.gguf
 create mode 100644 README.md

diff --git a/.gitattributes b/.gitattributes
new file mode 100644
index 0000000..2724689
--- /dev/null
+++ b/.gitattributes
@@ -0,0 +1,47 @@
+*.7z filter=lfs diff=lfs merge=lfs -text
+*.arrow filter=lfs diff=lfs merge=lfs -text
+*.bin filter=lfs diff=lfs merge=lfs -text
+*.bz2 filter=lfs diff=lfs merge=lfs -text
+*.ckpt filter=lfs diff=lfs merge=lfs -text
+*.ftz filter=lfs diff=lfs merge=lfs -text
+*.gz filter=lfs diff=lfs merge=lfs -text
+*.h5 filter=lfs diff=lfs merge=lfs -text
+*.joblib filter=lfs diff=lfs merge=lfs -text
+*.lfs.* filter=lfs diff=lfs merge=lfs -text
+*.mlmodel filter=lfs diff=lfs merge=lfs -text
+*.model filter=lfs diff=lfs merge=lfs -text
+*.msgpack filter=lfs diff=lfs merge=lfs -text
+*.npy filter=lfs diff=lfs merge=lfs -text
+*.npz filter=lfs diff=lfs merge=lfs -text
+*.onnx filter=lfs diff=lfs merge=lfs -text
+*.ot filter=lfs diff=lfs merge=lfs -text
+*.parquet filter=lfs diff=lfs merge=lfs -text
+*.pb filter=lfs diff=lfs merge=lfs -text
+*.pickle filter=lfs diff=lfs merge=lfs -text
+*.pkl filter=lfs diff=lfs merge=lfs -text
+*.pt filter=lfs diff=lfs merge=lfs -text
+*.pth filter=lfs diff=lfs merge=lfs -text
+*.rar filter=lfs diff=lfs merge=lfs -text
+*.safetensors filter=lfs diff=lfs merge=lfs -text
+saved_model/**/* filter=lfs diff=lfs merge=lfs -text
+*.tar.* filter=lfs diff=lfs merge=lfs -text
+*.tar filter=lfs diff=lfs merge=lfs -text
+*.tflite filter=lfs diff=lfs merge=lfs -text
+*.tgz filter=lfs diff=lfs merge=lfs -text
+*.wasm filter=lfs diff=lfs merge=lfs -text
+*.xz filter=lfs diff=lfs merge=lfs -text
+*.zip filter=lfs diff=lfs merge=lfs -text
+*.zst filter=lfs diff=lfs merge=lfs -text
+*tfevents* filter=lfs diff=lfs merge=lfs -text
+Dolphin3.0-Qwen2.5-0.5B.IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text
+Dolphin3.0-Qwen2.5-0.5B.Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
+Dolphin3.0-Qwen2.5-0.5B.Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
+Dolphin3.0-Qwen2.5-0.5B.Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
+Dolphin3.0-Qwen2.5-0.5B.Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
+Dolphin3.0-Qwen2.5-0.5B.Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
+Dolphin3.0-Qwen2.5-0.5B.Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
+Dolphin3.0-Qwen2.5-0.5B.Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
+Dolphin3.0-Qwen2.5-0.5B.Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
+Dolphin3.0-Qwen2.5-0.5B.Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
+Dolphin3.0-Qwen2.5-0.5B.Q8_0.gguf filter=lfs diff=lfs merge=lfs -text
+Dolphin3.0-Qwen2.5-0.5B.f16.gguf filter=lfs diff=lfs merge=lfs -text
diff --git a/Dolphin3.0-Qwen2.5-0.5B.IQ4_XS.gguf b/Dolphin3.0-Qwen2.5-0.5B.IQ4_XS.gguf
new file mode 100644
index 0000000..8fff166
--- /dev/null
+++ b/Dolphin3.0-Qwen2.5-0.5B.IQ4_XS.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:554872ad7c4214844826e682f5e6e3a67a58e3043ab6f949ce9b2215856cb37b
+size 351448576
diff --git a/Dolphin3.0-Qwen2.5-0.5B.Q2_K.gguf b/Dolphin3.0-Qwen2.5-0.5B.Q2_K.gguf
new file mode 100644
index 0000000..f9fdc5f
--- /dev/null
+++ b/Dolphin3.0-Qwen2.5-0.5B.Q2_K.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f848dfdce6c922548cb285ae66174a6cba0908d3bb07e0ea15a032ea32095f01
+size 338610688
diff --git a/Dolphin3.0-Qwen2.5-0.5B.Q3_K_L.gguf b/Dolphin3.0-Qwen2.5-0.5B.Q3_K_L.gguf
new file mode 100644
index 0000000..abf8423
--- /dev/null
+++ b/Dolphin3.0-Qwen2.5-0.5B.Q3_K_L.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:53a783a9783f8833a493047539f7710305d0fc9ce67c4c38bb302c5efb61177a
+size 369361408
diff --git a/Dolphin3.0-Qwen2.5-0.5B.Q3_K_M.gguf b/Dolphin3.0-Qwen2.5-0.5B.Q3_K_M.gguf
new file mode 100644
index 0000000..228a62d
--- /dev/null
+++ b/Dolphin3.0-Qwen2.5-0.5B.Q3_K_M.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b1b018f427a030d257b4872b32ea31ea698e15121d9b974350be5db46f8c0c14
+size 355469824
diff --git a/Dolphin3.0-Qwen2.5-0.5B.Q3_K_S.gguf b/Dolphin3.0-Qwen2.5-0.5B.Q3_K_S.gguf
new file mode 100644
index 0000000..495f6ca
--- /dev/null
+++ b/Dolphin3.0-Qwen2.5-0.5B.Q3_K_S.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0927eb7412b1061b57a34851173d326041d0e29d3502c8695d55196be3741672
+size 338266624
diff --git a/Dolphin3.0-Qwen2.5-0.5B.Q4_K_M.gguf b/Dolphin3.0-Qwen2.5-0.5B.Q4_K_M.gguf
new file mode 100644
index 0000000..7abd59e
--- /dev/null
+++ b/Dolphin3.0-Qwen2.5-0.5B.Q4_K_M.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7ad07c1d90d786b58ef47fded892de3b5ff7cdb88c8a53868d385d76e5d82e0b
+size 397811200
diff --git a/Dolphin3.0-Qwen2.5-0.5B.Q4_K_S.gguf b/Dolphin3.0-Qwen2.5-0.5B.Q4_K_S.gguf
new file mode 100644
index 0000000..5eab2fc
--- /dev/null
+++ b/Dolphin3.0-Qwen2.5-0.5B.Q4_K_S.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4b1e0283b8255db681408d4186684823f262b044bbe6594dadc04dfe50c401ea
+size 385475072
diff --git a/Dolphin3.0-Qwen2.5-0.5B.Q5_K_M.gguf b/Dolphin3.0-Qwen2.5-0.5B.Q5_K_M.gguf
new file mode 100644
index 0000000..080c156
--- /dev/null
+++ b/Dolphin3.0-Qwen2.5-0.5B.Q5_K_M.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c0a1f85bc474cde295854782ff04c875d915edcd06c684f16d14c033cf06016e
+size 420089344
diff --git a/Dolphin3.0-Qwen2.5-0.5B.Q5_K_S.gguf b/Dolphin3.0-Qwen2.5-0.5B.Q5_K_S.gguf
new file mode 100644
index 0000000..fa0ce22
--- /dev/null
+++ b/Dolphin3.0-Qwen2.5-0.5B.Q5_K_S.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a343c24941237c075e52c41af52e33c5dae96ea90e2cab8d4a9f3a8c8d32af90
+size 412713472
diff --git a/Dolphin3.0-Qwen2.5-0.5B.Q6_K.gguf b/Dolphin3.0-Qwen2.5-0.5B.Q6_K.gguf
new file mode 100644
index 0000000..39e4281
--- /dev/null
+++ b/Dolphin3.0-Qwen2.5-0.5B.Q6_K.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ea2129d40422fed3358e3030a5dbbb6fec40c193e4fbb73b99b86d550a08c3d1
+size 505739776
diff --git a/Dolphin3.0-Qwen2.5-0.5B.Q8_0.gguf b/Dolphin3.0-Qwen2.5-0.5B.Q8_0.gguf
new file mode 100644
index 0000000..294138a
--- /dev/null
+++ b/Dolphin3.0-Qwen2.5-0.5B.Q8_0.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:05c9520afda466ef227c6fab681e9551257ccc2f6e7ce88cd1b853e173a5a5cf
+size 531071488
diff --git a/Dolphin3.0-Qwen2.5-0.5B.f16.gguf b/Dolphin3.0-Qwen2.5-0.5B.f16.gguf
new file mode 100644
index 0000000..fde0944
--- /dev/null
+++ b/Dolphin3.0-Qwen2.5-0.5B.f16.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:17eccb7a5f341e7979a46ab4369b05fb18e547a5f2665671db264cb698ca6756
+size 994160128
diff --git a/README.md b/README.md
new file mode 100644
index 0000000..11fdd0d
--- /dev/null
+++ b/README.md
@@ -0,0 +1,84 @@
+---
+base_model: dphn/Dolphin3.0-Qwen2.5-0.5B
+datasets:
+- OpenCoder-LLM/opc-sft-stage1
+- OpenCoder-LLM/opc-sft-stage2
+- microsoft/orca-agentinstruct-1M-v1
+- microsoft/orca-math-word-problems-200k
+- NousResearch/hermes-function-calling-v1
+- AI-MO/NuminaMath-CoT
+- AI-MO/NuminaMath-TIR
+- allenai/tulu-3-sft-mixture
+- cognitivecomputations/dolphin-coder
+- HuggingFaceTB/smoltalk
+- cognitivecomputations/samantha-data
+- m-a-p/CodeFeedback-Filtered-Instruction
+- m-a-p/Code-Feedback
+language:
+- en
+library_name: transformers
+license: apache-2.0
+license_link: https://huggingface.co/Qwen/Qwen2.5-1.5B/blob/main/LICENSE
+mradermacher:
+  readme_rev: 1
+quantized_by: mradermacher
+---
+## About
+
+
+
+
+
+
+static quants of https://huggingface.co/dphn/Dolphin3.0-Qwen2.5-0.5B
+
+
+
+***For a convenient overview and download list, visit our [model page for this model](https://hf.tst.eu/model#Dolphin3.0-Qwen2.5-0.5B-GGUF).***
+
+weighted/imatrix quants are available at https://huggingface.co/mradermacher/Dolphin3.0-Qwen2.5-0.5B-i1-GGUF
+
+## Usage
+
+If you are unsure how to use GGUF files, refer to one of [TheBloke's
+READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for
+more details, including on how to concatenate multi-part files.
+
+## Provided Quants
+
+(sorted by size, not necessarily quality. IQ-quants are often preferable to similarly sized non-IQ quants)
+
+| Link | Type | Size/GB | Notes |
+|:-----|:-----|--------:|:------|
+| [GGUF](https://huggingface.co/mradermacher/Dolphin3.0-Qwen2.5-0.5B-GGUF/resolve/main/Dolphin3.0-Qwen2.5-0.5B.Q3_K_S.gguf) | Q3_K_S | 0.4 | |
+| [GGUF](https://huggingface.co/mradermacher/Dolphin3.0-Qwen2.5-0.5B-GGUF/resolve/main/Dolphin3.0-Qwen2.5-0.5B.Q2_K.gguf) | Q2_K | 0.4 | |
+| [GGUF](https://huggingface.co/mradermacher/Dolphin3.0-Qwen2.5-0.5B-GGUF/resolve/main/Dolphin3.0-Qwen2.5-0.5B.IQ4_XS.gguf) | IQ4_XS | 0.5 | |
+| [GGUF](https://huggingface.co/mradermacher/Dolphin3.0-Qwen2.5-0.5B-GGUF/resolve/main/Dolphin3.0-Qwen2.5-0.5B.Q3_K_M.gguf) | Q3_K_M | 0.5 | lower quality |
+| [GGUF](https://huggingface.co/mradermacher/Dolphin3.0-Qwen2.5-0.5B-GGUF/resolve/main/Dolphin3.0-Qwen2.5-0.5B.Q3_K_L.gguf) | Q3_K_L | 0.5 | |
+| [GGUF](https://huggingface.co/mradermacher/Dolphin3.0-Qwen2.5-0.5B-GGUF/resolve/main/Dolphin3.0-Qwen2.5-0.5B.Q4_K_S.gguf) | Q4_K_S | 0.5 | fast, recommended |
+| [GGUF](https://huggingface.co/mradermacher/Dolphin3.0-Qwen2.5-0.5B-GGUF/resolve/main/Dolphin3.0-Qwen2.5-0.5B.Q4_K_M.gguf) | Q4_K_M | 0.5 | fast, recommended |
+| [GGUF](https://huggingface.co/mradermacher/Dolphin3.0-Qwen2.5-0.5B-GGUF/resolve/main/Dolphin3.0-Qwen2.5-0.5B.Q5_K_S.gguf) | Q5_K_S | 0.5 | |
+| [GGUF](https://huggingface.co/mradermacher/Dolphin3.0-Qwen2.5-0.5B-GGUF/resolve/main/Dolphin3.0-Qwen2.5-0.5B.Q5_K_M.gguf) | Q5_K_M | 0.5 | |
+| [GGUF](https://huggingface.co/mradermacher/Dolphin3.0-Qwen2.5-0.5B-GGUF/resolve/main/Dolphin3.0-Qwen2.5-0.5B.Q6_K.gguf) | Q6_K | 0.6 | very good quality |
+| [GGUF](https://huggingface.co/mradermacher/Dolphin3.0-Qwen2.5-0.5B-GGUF/resolve/main/Dolphin3.0-Qwen2.5-0.5B.Q8_0.gguf) | Q8_0 | 0.6 | fast, best quality |
+| [GGUF](https://huggingface.co/mradermacher/Dolphin3.0-Qwen2.5-0.5B-GGUF/resolve/main/Dolphin3.0-Qwen2.5-0.5B.f16.gguf) | f16 | 1.1 | 16 bpw, overkill |
+
+Here is a handy graph by ikawrakow comparing some lower-quality quant
+types (lower is better):
+
+![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png)
+
+And here are Artefact2's thoughts on the matter:
+https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9
+
+## FAQ / Model Request
+
+See https://huggingface.co/mradermacher/model_requests for some answers to
+questions you might have and/or if you want some other model quantized.
+
+## Thanks
+
+I thank my company, [nethype GmbH](https://www.nethype.de/), for letting
+me use its servers and providing upgrades to my workstation to enable
+this work in my free time.
+
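
As a quick-start complement to the Usage section and the quant table in the README above, here is a minimal sketch of fetching one of the listed files and running it locally. It is not taken from the original card: the packages (`huggingface_hub`, `llama-cpp-python`), the choice of the Q4_K_M quant, and the prompt are assumptions made purely for illustration.

```python
# Minimal sketch: download one quant from this repo and run a short chat turn.
# Assumes `pip install huggingface_hub llama-cpp-python`; quant choice and prompt are illustrative.
from huggingface_hub import hf_hub_download
from llama_cpp import Llama

# Fetch the Q4_K_M file from the table above into the local Hugging Face cache.
model_path = hf_hub_download(
    repo_id="mradermacher/Dolphin3.0-Qwen2.5-0.5B-GGUF",
    filename="Dolphin3.0-Qwen2.5-0.5B.Q4_K_M.gguf",
)

# Load the GGUF with the llama.cpp Python bindings; a 0.5B model runs comfortably on CPU.
llm = Llama(model_path=model_path, n_ctx=4096, verbose=False)

# One chat-style completion; the Dolphin 3.0 models are instruction/chat tuned.
out = llm.create_chat_completion(
    messages=[{"role": "user", "content": "Write a one-line Python hello world."}],
    max_tokens=128,
)
print(out["choices"][0]["message"]["content"])
```

Any other file from the table can be substituted via the `filename` argument; the smaller quants trade quality for size as described in the notes column.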