commit 5de2f0e8e48cb88e51c848ca10611c2ebec6b19d Author: ModelHub XC Date: Sun May 3 04:00:33 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/Cogito-R1-i1-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..7a47e5c --- /dev/null +++ b/.gitattributes @@ -0,0 +1,59 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +Cogito-R1.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +Cogito-R1.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +Cogito-R1.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Cogito-R1.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Cogito-R1.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Cogito-R1.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Cogito-R1.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +Cogito-R1.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +Cogito-R1.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +Cogito-R1.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Cogito-R1.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +Cogito-R1.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Cogito-R1.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Cogito-R1.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Cogito-R1.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +Cogito-R1.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Cogito-R1.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +Cogito-R1.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +Cogito-R1.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Cogito-R1.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +Cogito-R1.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +Cogito-R1.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +Cogito-R1.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/Cogito-R1.i1-IQ1_M.gguf b/Cogito-R1.i1-IQ1_M.gguf new file mode 100644 index 0000000..6232885 --- /dev/null +++ b/Cogito-R1.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:424228387102c12e8e0f4a63e86613894212d92a2a1828a678afe9001683f32f +size 7932162688 diff --git a/Cogito-R1.i1-IQ1_S.gguf b/Cogito-R1.i1-IQ1_S.gguf new file mode 100644 index 0000000..966a15a --- /dev/null +++ b/Cogito-R1.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20a0e5711da6e69a8fad5ffc82f2aa7b54dd05fe9d0a75bcceef0aed5479bb4f +size 7274508928 diff --git a/Cogito-R1.i1-IQ2_M.gguf b/Cogito-R1.i1-IQ2_M.gguf new file mode 100644 index 0000000..0a291e0 --- /dev/null +++ b/Cogito-R1.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82b01b80f1f98454f0de265fb109aafc41840a5932727dea9861235a9c97e25d +size 11264443008 diff --git a/Cogito-R1.i1-IQ2_S.gguf b/Cogito-R1.i1-IQ2_S.gguf new file mode 100644 index 0000000..08eb693 --- /dev/null +++ b/Cogito-R1.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a68d5d619bfef6ad1a78d6ccafc2e770f27c07efb007b2060fec776800a7a6db +size 10387571328 diff --git a/Cogito-R1.i1-IQ2_XS.gguf b/Cogito-R1.i1-IQ2_XS.gguf new file mode 100644 index 0000000..21593c0 --- /dev/null +++ b/Cogito-R1.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4fbbfb6f72b4075de328b4a52c3ec212b739f02b0ff1b85be47769b80902d52 +size 9957552768 diff --git a/Cogito-R1.i1-IQ2_XXS.gguf b/Cogito-R1.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..47cd8b8 --- /dev/null +++ b/Cogito-R1.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad58d05b262e1d0c5d5f222145617d9539a7125b122f9718854ea0a44f613f5b +size 9028252288 diff --git a/Cogito-R1.i1-IQ3_M.gguf b/Cogito-R1.i1-IQ3_M.gguf new file mode 100644 index 0000000..a16395f --- /dev/null +++ b/Cogito-R1.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bee9df0090b09f42b13ded3132a3b76e10eb43aebbfb828735be4e9af6c843cb +size 14810124928 diff --git a/Cogito-R1.i1-IQ3_S.gguf b/Cogito-R1.i1-IQ3_S.gguf new file mode 100644 index 0000000..1f9198d --- /dev/null +++ b/Cogito-R1.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6970444ea7f5a7808662db4cb380e9305520c34be8ac70474cab8710b4e379f3 +size 14436897408 diff --git a/Cogito-R1.i1-IQ3_XS.gguf b/Cogito-R1.i1-IQ3_XS.gguf new file mode 100644 index 0000000..f89c66a --- /dev/null +++ b/Cogito-R1.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2aacda903d860901cff5a6d4e4a5077767707403cd72a90cf5033762fe21f36c +size 13705515648 diff --git a/Cogito-R1.i1-IQ3_XXS.gguf b/Cogito-R1.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..5a79174 --- /dev/null +++ b/Cogito-R1.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c134f0f46bd4cca9058d6031b2319e963063f663c03e4ebfebd3620e114348f6 +size 12839273088 diff --git a/Cogito-R1.i1-IQ4_XS.gguf b/Cogito-R1.i1-IQ4_XS.gguf new file mode 100644 index 0000000..baa7545 --- /dev/null +++ b/Cogito-R1.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0131d231a564d009e51714db3f382468bbbda3ea9b2ed582415523ee9e70ae5 +size 17693155968 diff --git a/Cogito-R1.i1-Q2_K.gguf b/Cogito-R1.i1-Q2_K.gguf new file mode 100644 index 0000000..931c5b8 --- /dev/null +++ b/Cogito-R1.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d8ba67a939851b0d4d26bf2da6d7b2b272239003982fba4a67d7d0b35899a2a +size 12313100928 diff --git a/Cogito-R1.i1-Q2_K_S.gguf b/Cogito-R1.i1-Q2_K_S.gguf new file mode 100644 index 0000000..b4077ed --- /dev/null +++ b/Cogito-R1.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3f609fb4e674fce23e6b1ddec2334245d662178f34132d6e207f4307e2335b7 +size 11488002688 diff --git a/Cogito-R1.i1-Q3_K_L.gguf b/Cogito-R1.i1-Q3_K_L.gguf new file mode 100644 index 0000000..523bc1c --- /dev/null +++ b/Cogito-R1.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3843557f12c2c595e61847be580da92038ac0f206ea2cbf3f36fe2167f3c1ac +size 17247081088 diff --git a/Cogito-R1.i1-Q3_K_M.gguf b/Cogito-R1.i1-Q3_K_M.gguf new file mode 100644 index 0000000..dc955d1 --- /dev/null +++ b/Cogito-R1.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cb6ce4671c3d750bd0cacd388ba8a6bf5cdaf8142af032934de123bc3f2e7fd +size 15935050368 diff --git a/Cogito-R1.i1-Q3_K_S.gguf b/Cogito-R1.i1-Q3_K_S.gguf new file mode 100644 index 0000000..530d890 --- /dev/null +++ b/Cogito-R1.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5df05fa719b7a742bb534de2271d1142d386ffd919906197264d4e5e7be53cb +size 14392332928 diff --git a/Cogito-R1.i1-Q4_0.gguf b/Cogito-R1.i1-Q4_0.gguf new file mode 100644 index 0000000..fbb8855 --- /dev/null +++ b/Cogito-R1.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a93f3c93c1c9e324cff63d4e1e54ad8cd927498a3e35460fc7a10be472f8695e +size 18711011968 diff --git a/Cogito-R1.i1-Q4_1.gguf b/Cogito-R1.i1-Q4_1.gguf new file mode 100644 index 0000000..c430609 --- /dev/null +++ b/Cogito-R1.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95e6d45c384d9487ac76343c8a2069e8b466c85f038b557250b6fcbf1b5b07dd +size 20639244928 diff --git a/Cogito-R1.i1-Q4_K_M.gguf b/Cogito-R1.i1-Q4_K_M.gguf new file mode 100644 index 0000000..8c4f79a --- /dev/null +++ b/Cogito-R1.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da395317d8817a0337a3a121b2e2ad7b11ca21ca0896412384303dae03ba5a66 +size 19851338368 diff --git a/Cogito-R1.i1-Q4_K_S.gguf b/Cogito-R1.i1-Q4_K_S.gguf new file mode 100644 index 0000000..72730dd --- /dev/null +++ b/Cogito-R1.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e40cf3f8b21bf52a817e6e29852ddd332b3606aea47eae9df0328e0364fce81c +size 18784412288 diff --git a/Cogito-R1.i1-Q5_K_M.gguf b/Cogito-R1.i1-Q5_K_M.gguf new file mode 100644 index 0000000..1a7e089 --- /dev/null +++ b/Cogito-R1.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:997a735b41c5defb7b62af296fec7ac3e7ff1988e1f527afafb4016ad3455821 +size 23262159488 diff --git a/Cogito-R1.i1-Q5_K_S.gguf b/Cogito-R1.i1-Q5_K_S.gguf new file mode 100644 index 0000000..299d933 --- /dev/null +++ b/Cogito-R1.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fbf5c74ef3a135efb989c2de97c532204c58f8a2ee9a588c35aeb52c20118a1 +size 22638256768 diff --git a/Cogito-R1.i1-Q6_K.gguf b/Cogito-R1.i1-Q6_K.gguf new file mode 100644 index 0000000..03cd219 --- /dev/null +++ b/Cogito-R1.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5f7e16e27f6d7fc06144f69490589b7bd8f0d17efb7954ee3210a1d843eaf9d +size 26886156928 diff --git a/README.md b/README.md new file mode 100644 index 0000000..c4405a6 --- /dev/null +++ b/README.md @@ -0,0 +1,92 @@ +--- +base_model: Daemontatox/Cogito-R1 +datasets: +- PrimeIntellect/NuminaMath-QwQ-CoT-5M +- AI-MO/NuminaMath-CoT +- simplescaling/s1K +- cognitivecomputations/dolphin-r1 +- openai/gsm8k +- bespokelabs/Bespoke-Stratos-17k +language: +- en +library_name: transformers +license: apache-2.0 +quantized_by: mradermacher +tags: +- text-generation-inference +- transformers +- unsloth +- qwen2 +- trl +- reasoning +- Chain-of-Thought +- Reinforcement Learning +- GRPO +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/Daemontatox/Cogito-R1 + + +static quants are available at https://huggingface.co/mradermacher/Cogito-R1-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/Cogito-R1-i1-GGUF/resolve/main/Cogito-R1.i1-IQ1_S.gguf) | i1-IQ1_S | 7.4 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/Cogito-R1-i1-GGUF/resolve/main/Cogito-R1.i1-IQ1_M.gguf) | i1-IQ1_M | 8.0 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/Cogito-R1-i1-GGUF/resolve/main/Cogito-R1.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 9.1 | | +| [GGUF](https://huggingface.co/mradermacher/Cogito-R1-i1-GGUF/resolve/main/Cogito-R1.i1-IQ2_XS.gguf) | i1-IQ2_XS | 10.1 | | +| [GGUF](https://huggingface.co/mradermacher/Cogito-R1-i1-GGUF/resolve/main/Cogito-R1.i1-IQ2_S.gguf) | i1-IQ2_S | 10.5 | | +| [GGUF](https://huggingface.co/mradermacher/Cogito-R1-i1-GGUF/resolve/main/Cogito-R1.i1-IQ2_M.gguf) | i1-IQ2_M | 11.4 | | +| [GGUF](https://huggingface.co/mradermacher/Cogito-R1-i1-GGUF/resolve/main/Cogito-R1.i1-Q2_K_S.gguf) | i1-Q2_K_S | 11.6 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/Cogito-R1-i1-GGUF/resolve/main/Cogito-R1.i1-Q2_K.gguf) | i1-Q2_K | 12.4 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/Cogito-R1-i1-GGUF/resolve/main/Cogito-R1.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 12.9 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/Cogito-R1-i1-GGUF/resolve/main/Cogito-R1.i1-IQ3_XS.gguf) | i1-IQ3_XS | 13.8 | | +| [GGUF](https://huggingface.co/mradermacher/Cogito-R1-i1-GGUF/resolve/main/Cogito-R1.i1-Q3_K_S.gguf) | i1-Q3_K_S | 14.5 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/Cogito-R1-i1-GGUF/resolve/main/Cogito-R1.i1-IQ3_S.gguf) | i1-IQ3_S | 14.5 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/Cogito-R1-i1-GGUF/resolve/main/Cogito-R1.i1-IQ3_M.gguf) | i1-IQ3_M | 14.9 | | +| [GGUF](https://huggingface.co/mradermacher/Cogito-R1-i1-GGUF/resolve/main/Cogito-R1.i1-Q3_K_M.gguf) | i1-Q3_K_M | 16.0 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/Cogito-R1-i1-GGUF/resolve/main/Cogito-R1.i1-Q3_K_L.gguf) | i1-Q3_K_L | 17.3 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/Cogito-R1-i1-GGUF/resolve/main/Cogito-R1.i1-IQ4_XS.gguf) | i1-IQ4_XS | 17.8 | | +| [GGUF](https://huggingface.co/mradermacher/Cogito-R1-i1-GGUF/resolve/main/Cogito-R1.i1-Q4_0.gguf) | i1-Q4_0 | 18.8 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/Cogito-R1-i1-GGUF/resolve/main/Cogito-R1.i1-Q4_K_S.gguf) | i1-Q4_K_S | 18.9 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/Cogito-R1-i1-GGUF/resolve/main/Cogito-R1.i1-Q4_K_M.gguf) | i1-Q4_K_M | 20.0 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/Cogito-R1-i1-GGUF/resolve/main/Cogito-R1.i1-Q4_1.gguf) | i1-Q4_1 | 20.7 | | +| [GGUF](https://huggingface.co/mradermacher/Cogito-R1-i1-GGUF/resolve/main/Cogito-R1.i1-Q5_K_S.gguf) | i1-Q5_K_S | 22.7 | | +| [GGUF](https://huggingface.co/mradermacher/Cogito-R1-i1-GGUF/resolve/main/Cogito-R1.i1-Q5_K_M.gguf) | i1-Q5_K_M | 23.4 | | +| [GGUF](https://huggingface.co/mradermacher/Cogito-R1-i1-GGUF/resolve/main/Cogito-R1.i1-Q6_K.gguf) | i1-Q6_K | 27.0 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..29b66d0 --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc74a326d0ea74f4cc1301dfe7465178fc18f1d705dfddfb930704b26bd0c016 +size 14957085