commit 78b6f6c64cc4334580832e499ab2cf198a360ba0 Author: ModelHub XC Date: Thu Apr 9 14:15:20 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/LLDS-A-GRPO-Qwen2.5-3B-Ins-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..3e1fe34 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,47 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +LLDS-A-GRPO-Qwen2.5-3B-Ins.IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text 
+LLDS-A-GRPO-Qwen2.5-3B-Ins.Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +LLDS-A-GRPO-Qwen2.5-3B-Ins.Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +LLDS-A-GRPO-Qwen2.5-3B-Ins.Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +LLDS-A-GRPO-Qwen2.5-3B-Ins.Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +LLDS-A-GRPO-Qwen2.5-3B-Ins.Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +LLDS-A-GRPO-Qwen2.5-3B-Ins.Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +LLDS-A-GRPO-Qwen2.5-3B-Ins.Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +LLDS-A-GRPO-Qwen2.5-3B-Ins.Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +LLDS-A-GRPO-Qwen2.5-3B-Ins.Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +LLDS-A-GRPO-Qwen2.5-3B-Ins.Q8_0.gguf filter=lfs diff=lfs merge=lfs -text +LLDS-A-GRPO-Qwen2.5-3B-Ins.f16.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/LLDS-A-GRPO-Qwen2.5-3B-Ins.IQ4_XS.gguf b/LLDS-A-GRPO-Qwen2.5-3B-Ins.IQ4_XS.gguf new file mode 100644 index 0000000..fa32a23 --- /dev/null +++ b/LLDS-A-GRPO-Qwen2.5-3B-Ins.IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cdcca52f4e4d3ad647cb1ad3bbeb508aa143c1dea5e0e98e8bed2696a269603 +size 1918492064 diff --git a/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q2_K.gguf b/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q2_K.gguf new file mode 100644 index 0000000..d91d2eb --- /dev/null +++ b/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb2dfac7062224381b97315876593dd61127b1f5f8ae8982df08119620ad3f21 +size 1376857504 diff --git a/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q3_K_L.gguf b/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q3_K_L.gguf new file mode 100644 index 0000000..db7e5d0 --- /dev/null +++ b/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1e64a85d70c170e925ce949c478c6194e7f4565295f820cd4840d1d660f18ce +size 1841096096 diff --git a/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q3_K_M.gguf b/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q3_K_M.gguf new file mode 100644 index 
0000000..53eabf9 --- /dev/null +++ b/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b666f364b296bd7916e7bac19ca29aabae88c305a3c088c5dd3e43a7e9e31c80 +size 1724179872 diff --git a/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q3_K_S.gguf b/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q3_K_S.gguf new file mode 100644 index 0000000..cc36594 --- /dev/null +++ b/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d64e5b595b824c3a71df3769ec5825cc3e7b28cb97aa73b27ba092f6a2be9f1 +size 1588061600 diff --git a/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q4_K_M.gguf b/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q4_K_M.gguf new file mode 100644 index 0000000..80cf18e --- /dev/null +++ b/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cf7a5c1dd912f6348517456a554f31045c0209aef24312c1d61ba02765329d4 +size 2104933792 diff --git a/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q4_K_S.gguf b/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q4_K_S.gguf new file mode 100644 index 0000000..b6b1f67 --- /dev/null +++ b/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8399508c5fc358407d7d18c757b7b149bfe60430d60c0d608f96f791499adba0 +size 2009415072 diff --git a/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q5_K_M.gguf b/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q5_K_M.gguf new file mode 100644 index 0000000..35094e7 --- /dev/null +++ b/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:505a03a45a4133d95f1b5d8fe27816a2a1d7a3aac718610e7601d1d31dedaf05 +size 2438741408 diff --git a/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q5_K_S.gguf b/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q5_K_S.gguf new file mode 100644 index 0000000..8c1c8ef --- /dev/null +++ b/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:626dcdc3dd0d4b0e95fc1381b8c78df541c6dbe015743d04b8f6350c8fefa1b1 +size 2383592864 diff --git 
a/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q6_K.gguf b/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q6_K.gguf new file mode 100644 index 0000000..facaf49 --- /dev/null +++ b/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3319b15e6183ec646572782098248b0cddfbbd4b4e556c2ef8a3eb2e19ce5faa +size 2793412000 diff --git a/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q8_0.gguf b/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q8_0.gguf new file mode 100644 index 0000000..86dcf07 --- /dev/null +++ b/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c309d3ed782dfc69d61d5d389a36984fd2249df5f244d74586ae4db7f18e3493 +size 3616089504 diff --git a/LLDS-A-GRPO-Qwen2.5-3B-Ins.f16.gguf b/LLDS-A-GRPO-Qwen2.5-3B-Ins.f16.gguf new file mode 100644 index 0000000..411ae05 --- /dev/null +++ b/LLDS-A-GRPO-Qwen2.5-3B-Ins.f16.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf7cba1de5158cef86d7957b7f425241c5ed80152057288efc0cf641a739fca6 +size 6800647584 diff --git a/README.md b/README.md new file mode 100644 index 0000000..65954d1 --- /dev/null +++ b/README.md @@ -0,0 +1,75 @@ +--- +base_model: SEGAgentRL/LLDS-A-GRPO-Qwen2.5-3B-Ins +language: +- en +library_name: transformers +license: apache-2.0 +mradermacher: + readme_rev: 1 +quantized_by: mradermacher +tags: +- Search +- QuestionAnswering +--- +## About + + + + + + + + + +static quants of https://huggingface.co/SEGAgentRL/LLDS-A-GRPO-Qwen2.5-3B-Ins + + + +***For a convenient overview and download list, visit our [model page for this model](https://hf.tst.eu/model#LLDS-A-GRPO-Qwen2.5-3B-Ins-GGUF).*** + +weighted/imatrix quants are available at https://huggingface.co/mradermacher/LLDS-A-GRPO-Qwen2.5-3B-Ins-i1-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. 
+ +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similarly sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/LLDS-A-GRPO-Qwen2.5-3B-Ins-GGUF/resolve/main/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q2_K.gguf) | Q2_K | 1.5 | | +| [GGUF](https://huggingface.co/mradermacher/LLDS-A-GRPO-Qwen2.5-3B-Ins-GGUF/resolve/main/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q3_K_S.gguf) | Q3_K_S | 1.7 | | +| [GGUF](https://huggingface.co/mradermacher/LLDS-A-GRPO-Qwen2.5-3B-Ins-GGUF/resolve/main/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q3_K_M.gguf) | Q3_K_M | 1.8 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/LLDS-A-GRPO-Qwen2.5-3B-Ins-GGUF/resolve/main/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q3_K_L.gguf) | Q3_K_L | 1.9 | | +| [GGUF](https://huggingface.co/mradermacher/LLDS-A-GRPO-Qwen2.5-3B-Ins-GGUF/resolve/main/LLDS-A-GRPO-Qwen2.5-3B-Ins.IQ4_XS.gguf) | IQ4_XS | 2.0 | | +| [GGUF](https://huggingface.co/mradermacher/LLDS-A-GRPO-Qwen2.5-3B-Ins-GGUF/resolve/main/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q4_K_S.gguf) | Q4_K_S | 2.1 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/LLDS-A-GRPO-Qwen2.5-3B-Ins-GGUF/resolve/main/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q4_K_M.gguf) | Q4_K_M | 2.2 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/LLDS-A-GRPO-Qwen2.5-3B-Ins-GGUF/resolve/main/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q5_K_S.gguf) | Q5_K_S | 2.5 | | +| [GGUF](https://huggingface.co/mradermacher/LLDS-A-GRPO-Qwen2.5-3B-Ins-GGUF/resolve/main/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q5_K_M.gguf) | Q5_K_M | 2.5 | | +| [GGUF](https://huggingface.co/mradermacher/LLDS-A-GRPO-Qwen2.5-3B-Ins-GGUF/resolve/main/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q6_K.gguf) | Q6_K | 2.9 | very good quality | +| [GGUF](https://huggingface.co/mradermacher/LLDS-A-GRPO-Qwen2.5-3B-Ins-GGUF/resolve/main/LLDS-A-GRPO-Qwen2.5-3B-Ins.Q8_0.gguf) | Q8_0 | 3.7 | fast, best quality | +| 
[GGUF](https://huggingface.co/mradermacher/LLDS-A-GRPO-Qwen2.5-3B-Ins-GGUF/resolve/main/LLDS-A-GRPO-Qwen2.5-3B-Ins.f16.gguf) | f16 | 6.9 | 16 bpw, overkill | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for answers to +questions you might have, or if you want another model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. + +