commit 665ee208068af5e533e97a50d5a1024994fea05f Author: ModelHub XC Date: Sat Apr 11 08:10:56 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/QwQ-R1-Distill-1.5B-CoT-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..662c279 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,47 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +QwQ-R1-Distill-1.5B-CoT.IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text 
+QwQ-R1-Distill-1.5B-CoT.Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +QwQ-R1-Distill-1.5B-CoT.Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +QwQ-R1-Distill-1.5B-CoT.Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +QwQ-R1-Distill-1.5B-CoT.Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +QwQ-R1-Distill-1.5B-CoT.Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +QwQ-R1-Distill-1.5B-CoT.Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +QwQ-R1-Distill-1.5B-CoT.Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +QwQ-R1-Distill-1.5B-CoT.Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +QwQ-R1-Distill-1.5B-CoT.Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +QwQ-R1-Distill-1.5B-CoT.Q8_0.gguf filter=lfs diff=lfs merge=lfs -text +QwQ-R1-Distill-1.5B-CoT.f16.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/QwQ-R1-Distill-1.5B-CoT.IQ4_XS.gguf b/QwQ-R1-Distill-1.5B-CoT.IQ4_XS.gguf new file mode 100644 index 0000000..fe13a16 --- /dev/null +++ b/QwQ-R1-Distill-1.5B-CoT.IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8268f75fac51aa09e4a9ebff82d06d22b303e32ef814b0b61aa9c1a2ce35e6d9 +size 1026164448 diff --git a/QwQ-R1-Distill-1.5B-CoT.Q2_K.gguf b/QwQ-R1-Distill-1.5B-CoT.Q2_K.gguf new file mode 100644 index 0000000..62a5870 --- /dev/null +++ b/QwQ-R1-Distill-1.5B-CoT.Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e7242080267c23edd133eb2e80e87f3b83d34ed6df1458644e2b3e006c21786 +size 752882400 diff --git a/QwQ-R1-Distill-1.5B-CoT.Q3_K_L.gguf b/QwQ-R1-Distill-1.5B-CoT.Q3_K_L.gguf new file mode 100644 index 0000000..acd3ac0 --- /dev/null +++ b/QwQ-R1-Distill-1.5B-CoT.Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d063edc3f91d707f9efff7023664eff287225d0ee5bafd363a09b9ed80475997 +size 980442336 diff --git a/QwQ-R1-Distill-1.5B-CoT.Q3_K_M.gguf b/QwQ-R1-Distill-1.5B-CoT.Q3_K_M.gguf new file mode 100644 index 0000000..fa432e1 --- /dev/null +++ b/QwQ-R1-Distill-1.5B-CoT.Q3_K_M.gguf @@ 
-0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a1f48d3f58bb8d005b975ed273e992d4a697373c00906e8cd8e01bbafb0e171 +size 924458208 diff --git a/QwQ-R1-Distill-1.5B-CoT.Q3_K_S.gguf b/QwQ-R1-Distill-1.5B-CoT.Q3_K_S.gguf new file mode 100644 index 0000000..b5334df --- /dev/null +++ b/QwQ-R1-Distill-1.5B-CoT.Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fba3031043fa276d546273eb3f9ba7c2060f374d4b5eb607707a768863cca4e5 +size 861224160 diff --git a/QwQ-R1-Distill-1.5B-CoT.Q4_K_M.gguf b/QwQ-R1-Distill-1.5B-CoT.Q4_K_M.gguf new file mode 100644 index 0000000..3a6e68e --- /dev/null +++ b/QwQ-R1-Distill-1.5B-CoT.Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:414a79e8fcecad7a661d64e87becc15820bdac2f97f97a3605289eeefce31c8a +size 1117322976 diff --git a/QwQ-R1-Distill-1.5B-CoT.Q4_K_S.gguf b/QwQ-R1-Distill-1.5B-CoT.Q4_K_S.gguf new file mode 100644 index 0000000..151c9dd --- /dev/null +++ b/QwQ-R1-Distill-1.5B-CoT.Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d63a43aa4837eecd94fd74a33763b71d392ccf0e4238d152183ebb28dfbbcbd8 +size 1071587040 diff --git a/QwQ-R1-Distill-1.5B-CoT.Q5_K_M.gguf b/QwQ-R1-Distill-1.5B-CoT.Q5_K_M.gguf new file mode 100644 index 0000000..72b116f --- /dev/null +++ b/QwQ-R1-Distill-1.5B-CoT.Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:575f97fa5156fcfb3f878397f9d5aaf2347ce17b2575382c2e6f4354e0f7c326 +size 1285496544 diff --git a/QwQ-R1-Distill-1.5B-CoT.Q5_K_S.gguf b/QwQ-R1-Distill-1.5B-CoT.Q5_K_S.gguf new file mode 100644 index 0000000..3024854 --- /dev/null +++ b/QwQ-R1-Distill-1.5B-CoT.Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc8c0b51e14af32014aeaeb63fa2fc1ff3f161bb2ac90fd4f2c79cd83698e318 +size 1259175648 diff --git a/QwQ-R1-Distill-1.5B-CoT.Q6_K.gguf b/QwQ-R1-Distill-1.5B-CoT.Q6_K.gguf new file mode 100644 index 0000000..d6bb2e7 --- /dev/null +++ 
b/QwQ-R1-Distill-1.5B-CoT.Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48e0cb2c8c80022f7d5030412b5ba1e24913dcf62ebc0baf035d4b9f904d95e8 +size 1464180960 diff --git a/QwQ-R1-Distill-1.5B-CoT.Q8_0.gguf b/QwQ-R1-Distill-1.5B-CoT.Q8_0.gguf new file mode 100644 index 0000000..7fab0f8 --- /dev/null +++ b/QwQ-R1-Distill-1.5B-CoT.Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae6cc7cd2301c3bb8169355de9ff8c05430976317f9735ac9f718ec5cd5c95cc +size 1894534368 diff --git a/QwQ-R1-Distill-1.5B-CoT.f16.gguf b/QwQ-R1-Distill-1.5B-CoT.f16.gguf new file mode 100644 index 0000000..432f009 --- /dev/null +++ b/QwQ-R1-Distill-1.5B-CoT.f16.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ef7fa3c12ff19dcad8d1ef2f87a12190b44021336e2f98cc5bf92905cb5c2dd +size 3560418528 diff --git a/README.md b/README.md new file mode 100644 index 0000000..dab888a --- /dev/null +++ b/README.md @@ -0,0 +1,77 @@ +--- +base_model: prithivMLmods/QwQ-R1-Distill-1.5B-CoT +datasets: +- AI-MO/NuminaMath-CoT +- prithivMLmods/Math-Solve +- amphora/QwQ-LongCoT-130K +- prithivMLmods/Deepthink-Reasoning +- NovaSky-AI/Sky-T1_data_17k +language: +- en +library_name: transformers +license: apache-2.0 +quantized_by: mradermacher +tags: +- QwQ +- Distill +- R1 +- Deepseek +- Qwen2.5 +- text-generation-inference +--- +## About + + + + + + +static quants of https://huggingface.co/prithivMLmods/QwQ-R1-Distill-1.5B-CoT + + +weighted/imatrix quants are available at https://huggingface.co/mradermacher/QwQ-R1-Distill-1.5B-CoT-i1-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. 
IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/QwQ-R1-Distill-1.5B-CoT-GGUF/resolve/main/QwQ-R1-Distill-1.5B-CoT.Q2_K.gguf) | Q2_K | 0.9 | | +| [GGUF](https://huggingface.co/mradermacher/QwQ-R1-Distill-1.5B-CoT-GGUF/resolve/main/QwQ-R1-Distill-1.5B-CoT.Q3_K_S.gguf) | Q3_K_S | 1.0 | | +| [GGUF](https://huggingface.co/mradermacher/QwQ-R1-Distill-1.5B-CoT-GGUF/resolve/main/QwQ-R1-Distill-1.5B-CoT.Q3_K_M.gguf) | Q3_K_M | 1.0 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/QwQ-R1-Distill-1.5B-CoT-GGUF/resolve/main/QwQ-R1-Distill-1.5B-CoT.Q3_K_L.gguf) | Q3_K_L | 1.1 | | +| [GGUF](https://huggingface.co/mradermacher/QwQ-R1-Distill-1.5B-CoT-GGUF/resolve/main/QwQ-R1-Distill-1.5B-CoT.IQ4_XS.gguf) | IQ4_XS | 1.1 | | +| [GGUF](https://huggingface.co/mradermacher/QwQ-R1-Distill-1.5B-CoT-GGUF/resolve/main/QwQ-R1-Distill-1.5B-CoT.Q4_K_S.gguf) | Q4_K_S | 1.2 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/QwQ-R1-Distill-1.5B-CoT-GGUF/resolve/main/QwQ-R1-Distill-1.5B-CoT.Q4_K_M.gguf) | Q4_K_M | 1.2 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/QwQ-R1-Distill-1.5B-CoT-GGUF/resolve/main/QwQ-R1-Distill-1.5B-CoT.Q5_K_S.gguf) | Q5_K_S | 1.4 | | +| [GGUF](https://huggingface.co/mradermacher/QwQ-R1-Distill-1.5B-CoT-GGUF/resolve/main/QwQ-R1-Distill-1.5B-CoT.Q5_K_M.gguf) | Q5_K_M | 1.4 | | +| [GGUF](https://huggingface.co/mradermacher/QwQ-R1-Distill-1.5B-CoT-GGUF/resolve/main/QwQ-R1-Distill-1.5B-CoT.Q6_K.gguf) | Q6_K | 1.6 | very good quality | +| [GGUF](https://huggingface.co/mradermacher/QwQ-R1-Distill-1.5B-CoT-GGUF/resolve/main/QwQ-R1-Distill-1.5B-CoT.Q8_0.gguf) | Q8_0 | 2.0 | fast, best quality | +| [GGUF](https://huggingface.co/mradermacher/QwQ-R1-Distill-1.5B-CoT-GGUF/resolve/main/QwQ-R1-Distill-1.5B-CoT.f16.gguf) | f16 | 3.7 | 16 bpw, overkill | + +Here is a handy graph by ikawrakow comparing 
some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for answers to +questions you might have, or to request that another model be quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. + +