From 04ecabe2603316687daa8f76b90d018615f960ed Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Fri, 19 Jun 2026 12:23:12 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: prithivMLmods/SmolLM2-Rethink-135M-GGUF Source: Original Platform --- .gitattributes | 47 ++++++++++++++++++++++++++++++++ README.md | 45 ++++++++++++++++++++++++++++++ SmolLM2-Rethink-135M.BF16.gguf | 3 ++ SmolLM2-Rethink-135M.F16.gguf | 3 ++ SmolLM2-Rethink-135M.F32.gguf | 3 ++ SmolLM2-Rethink-135M.Q2_K.gguf | 3 ++ SmolLM2-Rethink-135M.Q3_K_L.gguf | 3 ++ SmolLM2-Rethink-135M.Q3_K_M.gguf | 3 ++ SmolLM2-Rethink-135M.Q3_K_S.gguf | 3 ++ SmolLM2-Rethink-135M.Q4_K_M.gguf | 3 ++ SmolLM2-Rethink-135M.Q4_K_S.gguf | 3 ++ SmolLM2-Rethink-135M.Q5_K_M.gguf | 3 ++ SmolLM2-Rethink-135M.Q5_K_S.gguf | 3 ++ SmolLM2-Rethink-135M.Q6_K.gguf | 3 ++ SmolLM2-Rethink-135M.Q8_0.gguf | 3 ++ config.json | 3 ++ configuration.json | 1 + 17 files changed, 135 insertions(+) create mode 100644 .gitattributes create mode 100644 README.md create mode 100644 SmolLM2-Rethink-135M.BF16.gguf create mode 100644 SmolLM2-Rethink-135M.F16.gguf create mode 100644 SmolLM2-Rethink-135M.F32.gguf create mode 100644 SmolLM2-Rethink-135M.Q2_K.gguf create mode 100644 SmolLM2-Rethink-135M.Q3_K_L.gguf create mode 100644 SmolLM2-Rethink-135M.Q3_K_M.gguf create mode 100644 SmolLM2-Rethink-135M.Q3_K_S.gguf create mode 100644 SmolLM2-Rethink-135M.Q4_K_M.gguf create mode 100644 SmolLM2-Rethink-135M.Q4_K_S.gguf create mode 100644 SmolLM2-Rethink-135M.Q5_K_M.gguf create mode 100644 SmolLM2-Rethink-135M.Q5_K_S.gguf create mode 100644 SmolLM2-Rethink-135M.Q6_K.gguf create mode 100644 SmolLM2-Rethink-135M.Q8_0.gguf create mode 100644 config.json create mode 100644 configuration.json diff --git a/.gitattributes 
b/.gitattributes new file mode 100644 index 0000000..53d7257 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,47 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bin.* filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zstandard filter=lfs diff=lfs merge=lfs -text +*.tfevents* filter=lfs diff=lfs merge=lfs -text +*.db* filter=lfs diff=lfs merge=lfs -text +*.ark* filter=lfs diff=lfs merge=lfs -text +**/*ckpt*data* filter=lfs diff=lfs merge=lfs -text +**/*ckpt*.meta filter=lfs diff=lfs merge=lfs -text +**/*ckpt*.index filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.gguf* filter=lfs diff=lfs merge=lfs -text +*.ggml filter=lfs diff=lfs merge=lfs -text +*.llamafile* filter=lfs diff=lfs merge=lfs -text +*.pt2 filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs 
merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text \ No newline at end of file diff --git a/README.md b/README.md new file mode 100644 index 0000000..e51cb72 --- /dev/null +++ b/README.md @@ -0,0 +1,45 @@ +--- +license: apache-2.0 +language: +- en +base_model: +- prithivMLmods/SmolLM2-Rethink-135M +pipeline_tag: text-generation +library_name: transformers +tags: +- text-generation-inference +- trl +--- +# **SmolLM2-Rethink-135M-GGUF** + +> SmolLM2-Rethink-135M is an experimental lightweight model trained on the Celestia3-DeepSeek-R1-0528 reasoning dataset. Based on the SmolLM2-135M-Instruct architecture, this model is specifically optimized for reasoning, structured outputs, and efficient small-scale deployment. Despite its compact size (135M parameters), it demonstrates strong capabilities in logical deduction, conversational coherence, and lightweight inference tasks. 
+ +## Model Files + +| File Name | Size | Type | Description | +|-----------|------|------|-------------| +| SmolLM2-Rethink-135M.Q2_K.gguf | 88.2 MB | Model | Q2_K quantized model (smallest) | +| SmolLM2-Rethink-135M.Q3_K_S.gguf | 88.2 MB | Model | Q3_K_S quantized model | +| SmolLM2-Rethink-135M.Q3_K_M.gguf | 93.5 MB | Model | Q3_K_M quantized model | +| SmolLM2-Rethink-135M.Q3_K_L.gguf | 97.5 MB | Model | Q3_K_L quantized model | +| SmolLM2-Rethink-135M.Q4_K_S.gguf | 102 MB | Model | Q4_K_S quantized model | +| SmolLM2-Rethink-135M.Q4_K_M.gguf | 105 MB | Model | Q4_K_M quantized model | +| SmolLM2-Rethink-135M.Q5_K_S.gguf | 110 MB | Model | Q5_K_S quantized model | +| SmolLM2-Rethink-135M.Q5_K_M.gguf | 112 MB | Model | Q5_K_M quantized model | +| SmolLM2-Rethink-135M.Q6_K.gguf | 138 MB | Model | Q6_K quantized model | +| SmolLM2-Rethink-135M.Q8_0.gguf | 145 MB | Model | Q8_0 quantized model | +| SmolLM2-Rethink-135M.BF16.gguf | 271 MB | Model | BF16 precision model | +| SmolLM2-Rethink-135M.F16.gguf | 271 MB | Model | F16 precision model | +| SmolLM2-Rethink-135M.F32.gguf | 540 MB | Model | F32 full precision model (largest) | +| .gitattributes | 2.4 kB | Config | Git LFS configuration | +| config.json | 29 Bytes | Config | Model configuration | +| README.md | 31 Bytes | Documentation | Repository documentation | + +## Quants Usage + +(sorted by size, not necessarily quality. 
IQ-quants are often preferable over similarly sized non-IQ quants) + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) \ No newline at end of file diff --git a/SmolLM2-Rethink-135M.BF16.gguf b/SmolLM2-Rethink-135M.BF16.gguf new file mode 100644 index 0000000..eedffac --- /dev/null +++ b/SmolLM2-Rethink-135M.BF16.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae5ca9b86c63be43b7a4e2feb0beb269375d5657b404c562703c152698a53729 +size 270885600 diff --git a/SmolLM2-Rethink-135M.F16.gguf b/SmolLM2-Rethink-135M.F16.gguf new file mode 100644 index 0000000..156f769 --- /dev/null +++ b/SmolLM2-Rethink-135M.F16.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0804c725fe5f6db56c7015ab11ce172f38c587f9c76f38e0483a9db6365fe466 +size 270885600 diff --git a/SmolLM2-Rethink-135M.F32.gguf b/SmolLM2-Rethink-135M.F32.gguf new file mode 100644 index 0000000..e5d1a55 --- /dev/null +++ b/SmolLM2-Rethink-135M.F32.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2f2f6156c2ea10f60144dab6d3cbc3fd155a30e2615193963f51b6ae445bfea +size 539845344 diff --git a/SmolLM2-Rethink-135M.Q2_K.gguf b/SmolLM2-Rethink-135M.Q2_K.gguf new file mode 100644 index 0000000..9ae941c --- /dev/null +++ b/SmolLM2-Rethink-135M.Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e812821173eaaa909daf6502f92aa555b5281ced55b3981e252cd534c14e19f7 +size 88201440 diff --git a/SmolLM2-Rethink-135M.Q3_K_L.gguf b/SmolLM2-Rethink-135M.Q3_K_L.gguf new file mode 100644 index 0000000..2567f2e --- /dev/null +++ b/SmolLM2-Rethink-135M.Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8adce86bdad1ee3b1ee345666ebb774ae0b3b5e77360d9bb255138191926322b +size 97532640 diff --git a/SmolLM2-Rethink-135M.Q3_K_M.gguf b/SmolLM2-Rethink-135M.Q3_K_M.gguf new file mode 100644 index 
0000000..6bee51a --- /dev/null +++ b/SmolLM2-Rethink-135M.Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa02c887f9c629041630b251b9ee69af1a7d8edd583c2733385e92e18c188933 +size 93509856 diff --git a/SmolLM2-Rethink-135M.Q3_K_S.gguf b/SmolLM2-Rethink-135M.Q3_K_S.gguf new file mode 100644 index 0000000..9defa37 --- /dev/null +++ b/SmolLM2-Rethink-135M.Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8845a8ff0ea74d6b174c402c6ea84d16dac6dd3ef601836d10a2c6293b48bc2 +size 88201440 diff --git a/SmolLM2-Rethink-135M.Q4_K_M.gguf b/SmolLM2-Rethink-135M.Q4_K_M.gguf new file mode 100644 index 0000000..a9683fa --- /dev/null +++ b/SmolLM2-Rethink-135M.Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:762f3e930c7e9d6b1bc5c83e6862d28f47f4d52ce78359568bbe4cfc9f3196f7 +size 105453792 diff --git a/SmolLM2-Rethink-135M.Q4_K_S.gguf b/SmolLM2-Rethink-135M.Q4_K_S.gguf new file mode 100644 index 0000000..2891fd0 --- /dev/null +++ b/SmolLM2-Rethink-135M.Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08630ededb55fde69b2b95b58d3c30787d6810c61356bac1096fd74481058325 +size 102039264 diff --git a/SmolLM2-Rethink-135M.Q5_K_M.gguf b/SmolLM2-Rethink-135M.Q5_K_M.gguf new file mode 100644 index 0000000..eecaae5 --- /dev/null +++ b/SmolLM2-Rethink-135M.Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f65b690ece67ae52314f400b9dcfc203445524891ad64ce17a360553441ae959 +size 112103136 diff --git a/SmolLM2-Rethink-135M.Q5_K_S.gguf b/SmolLM2-Rethink-135M.Q5_K_S.gguf new file mode 100644 index 0000000..492627b --- /dev/null +++ b/SmolLM2-Rethink-135M.Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69bbbdad201df10c4f9e4b66cc740b8afec08d6a8e4cb648384460effca73011 +size 109974240 diff --git a/SmolLM2-Rethink-135M.Q6_K.gguf b/SmolLM2-Rethink-135M.Q6_K.gguf new file mode 100644 index 0000000..cadf5f4 
--- /dev/null +++ b/SmolLM2-Rethink-135M.Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ffecb933561337380d00f5db5ca6a8c6d6d2c44baa3db9293e08372aa79b32f +size 138382560 diff --git a/SmolLM2-Rethink-135M.Q8_0.gguf b/SmolLM2-Rethink-135M.Q8_0.gguf new file mode 100644 index 0000000..5ff15ae --- /dev/null +++ b/SmolLM2-Rethink-135M.Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f570221fd7e7a2b4dc48d64c8f8165b3d59674caac7c0f314ea9cb70dc21b29a +size 144810720 diff --git a/config.json b/config.json new file mode 100644 index 0000000..a4ba21b --- /dev/null +++ b/config.json @@ -0,0 +1,3 @@ +{ + "model_type": "llama" +} \ No newline at end of file diff --git a/configuration.json b/configuration.json new file mode 100644 index 0000000..bbeeda1 --- /dev/null +++ b/configuration.json @@ -0,0 +1 @@ +{"framework": "pytorch", "task": "text-generation", "allow_remote": true} \ No newline at end of file