From 9c37f223226f49bc6f5e3fd99f7d91031c2a1e7f Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Sat, 18 Apr 2026 08:31:46 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: afrideva/smol_llama-101M-GQA-GGUF Source: Original Platform --- .gitattributes | 42 ++++++++++++ README.md | 114 ++++++++++++++++++++++++++++++++ smol_llama-101m-gqa.fp16.gguf | 3 + smol_llama-101m-gqa.q2_k.gguf | 3 + smol_llama-101m-gqa.q3_k_m.gguf | 3 + smol_llama-101m-gqa.q4_k_m.gguf | 3 + smol_llama-101m-gqa.q5_k_m.gguf | 3 + smol_llama-101m-gqa.q6_k.gguf | 3 + smol_llama-101m-gqa.q8_0.gguf | 3 + 9 files changed, 177 insertions(+) create mode 100644 .gitattributes create mode 100644 README.md create mode 100644 smol_llama-101m-gqa.fp16.gguf create mode 100644 smol_llama-101m-gqa.q2_k.gguf create mode 100644 smol_llama-101m-gqa.q3_k_m.gguf create mode 100644 smol_llama-101m-gqa.q4_k_m.gguf create mode 100644 smol_llama-101m-gqa.q5_k_m.gguf create mode 100644 smol_llama-101m-gqa.q6_k.gguf create mode 100644 smol_llama-101m-gqa.q8_0.gguf diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..c4251c0 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,42 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs 
diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +smol_llama-101m-gqa.fp16.gguf filter=lfs diff=lfs merge=lfs -text +smol_llama-101m-gqa.q2_k.gguf filter=lfs diff=lfs merge=lfs -text +smol_llama-101m-gqa.q3_k_m.gguf filter=lfs diff=lfs merge=lfs -text +smol_llama-101m-gqa.q4_k_m.gguf filter=lfs diff=lfs merge=lfs -text +smol_llama-101m-gqa.q5_k_m.gguf filter=lfs diff=lfs merge=lfs -text +smol_llama-101m-gqa.q6_k.gguf filter=lfs diff=lfs merge=lfs -text +smol_llama-101m-gqa.q8_0.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..6bb30a3 --- /dev/null +++ b/README.md @@ -0,0 +1,114 @@ +--- +base_model: BEE-spoke-data/smol_llama-101M-GQA +datasets: +- JeanKaddour/minipile +- pszemraj/simple_wikipedia_LM +- BEE-spoke-data/wikipedia-20230901.en-deduped +- mattymchen/refinedweb-3m +inference: false +language: +- en +license: apache-2.0 +model_creator: BEE-spoke-data +model_name: smol_llama-101M-GQA +pipeline_tag: text-generation +quantized_by: afrideva +tags: +- smol_llama +- llama2 +- gguf +- ggml +- quantized +- 
q2_k +- q3_k_m +- q4_k_m +- q5_k_m +- q6_k +- q8_0 +thumbnail: https://i.ibb.co/TvyMrRc/rsz-smol-llama-banner.png +widget: +- example_title: El Microondas + text: My name is El Microondas the Wise and +- example_title: Kennesaw State University + text: Kennesaw State University is a public +- example_title: Bungie + text: Bungie Studios is an American video game developer. They are most famous for + developing the award winning Halo series of video games. They also made Destiny. + The studio was founded +- example_title: Mona Lisa + text: The Mona Lisa is a world-renowned painting created by +- example_title: Harry Potter Series + text: The Harry Potter series, written by J.K. Rowling, begins with the book titled +- example_title: Riddle + text: 'Question: I have cities, but no houses. I have mountains, but no trees. I + have water, but no fish. What am I? + + Answer:' +- example_title: Photosynthesis + text: The process of photosynthesis involves the conversion of +- example_title: Story Continuation + text: Jane went to the store to buy some groceries. She picked up apples, oranges, + and a loaf of bread. When she got home, she realized she forgot +- example_title: Math Problem + text: 'Problem 2: If a train leaves Station A at 9:00 AM and travels at 60 mph, + and another train leaves Station B at 10:00 AM and travels at 80 mph, when will + they meet if the distance between the stations is 300 miles? 
+ + To determine' +- example_title: Algorithm Definition + text: In the context of computer programming, an algorithm is +--- +# BEE-spoke-data/smol_llama-101M-GQA-GGUF + +Quantized GGUF model files for [smol_llama-101M-GQA](https://huggingface.co/BEE-spoke-data/smol_llama-101M-GQA) from [BEE-spoke-data](https://huggingface.co/BEE-spoke-data). + + +| Name | Quant method | Size | +| ---- | ---- | ---- | +| [smol_llama-101m-gqa.fp16.gguf](https://huggingface.co/afrideva/smol_llama-101M-GQA-GGUF/resolve/main/smol_llama-101m-gqa.fp16.gguf) | fp16 | 203.28 MB | +| [smol_llama-101m-gqa.q2_k.gguf](https://huggingface.co/afrideva/smol_llama-101M-GQA-GGUF/resolve/main/smol_llama-101m-gqa.q2_k.gguf) | q2_k | 50.93 MB | +| [smol_llama-101m-gqa.q3_k_m.gguf](https://huggingface.co/afrideva/smol_llama-101M-GQA-GGUF/resolve/main/smol_llama-101m-gqa.q3_k_m.gguf) | q3_k_m | 57.06 MB | +| [smol_llama-101m-gqa.q4_k_m.gguf](https://huggingface.co/afrideva/smol_llama-101M-GQA-GGUF/resolve/main/smol_llama-101m-gqa.q4_k_m.gguf) | q4_k_m | 65.40 MB | +| [smol_llama-101m-gqa.q5_k_m.gguf](https://huggingface.co/afrideva/smol_llama-101M-GQA-GGUF/resolve/main/smol_llama-101m-gqa.q5_k_m.gguf) | q5_k_m | 74.34 MB | +| [smol_llama-101m-gqa.q6_k.gguf](https://huggingface.co/afrideva/smol_llama-101M-GQA-GGUF/resolve/main/smol_llama-101m-gqa.q6_k.gguf) | q6_k | 83.83 MB | +| [smol_llama-101m-gqa.q8_0.gguf](https://huggingface.co/afrideva/smol_llama-101M-GQA-GGUF/resolve/main/smol_llama-101m-gqa.q8_0.gguf) | q8_0 | 108.35 MB | + + + +## Original Model Card: +# smol_llama-101M-GQA + +![banner](https://i.ibb.co/TvyMrRc/rsz-smol-llama-banner.png) + +A small 101M param (total) decoder model. This is the first version of the model. + +- 768 hidden size, 6 layers +- GQA (24 heads, 8 key-value), context length 1024 +- train-from-scratch + +## Notes + +**This checkpoint** is the 'raw' pre-trained model and has not been tuned to a more specific task. **It should be fine-tuned** before use in most cases.
+ +### Checkpoints & Links + +- _smol_-er 81M parameter checkpoint with in/out embeddings tied: [here](https://huggingface.co/BEE-spoke-data/smol_llama-81M-tied) +- Fine-tuned on `pypi` to generate Python code - [link](https://huggingface.co/BEE-spoke-data/smol_llama-101M-GQA-python) +- For the chat version of this model, please [see here](https://youtu.be/dQw4w9WgXcQ?si=3ePIqrY1dw94KMu4) + +--- + + +# [Open LLM Leaderboard Evaluation Results](https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard) +Detailed results can be found [here](https://huggingface.co/datasets/open-llm-leaderboard/details_BEE-spoke-data__smol_llama-101M-GQA) + +| Metric | Value | +|-----------------------|---------------------------| +| Avg. | 25.32 | +| ARC (25-shot) | 23.55 | +| HellaSwag (10-shot) | 28.77 | +| MMLU (5-shot) | 24.24 | +| TruthfulQA (0-shot) | 45.76 | +| Winogrande (5-shot) | 50.67 | +| GSM8K (5-shot) | 0.83 | +| DROP (3-shot) | 3.39 | \ No newline at end of file diff --git a/smol_llama-101m-gqa.fp16.gguf b/smol_llama-101m-gqa.fp16.gguf new file mode 100644 index 0000000..775315f --- /dev/null +++ b/smol_llama-101m-gqa.fp16.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebb3c8a47a09195ac7ba7954ff1a26c03d87c8293ce9725265e6e33ecd77725a +size 203276896 diff --git a/smol_llama-101m-gqa.q2_k.gguf b/smol_llama-101m-gqa.q2_k.gguf new file mode 100644 index 0000000..6e355ca --- /dev/null +++ b/smol_llama-101m-gqa.q2_k.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4162244f21add68d96997c3ee4f2df2bdac98663fcee3ea86c7fb3104698bd5 +size 50931072 diff --git a/smol_llama-101m-gqa.q3_k_m.gguf b/smol_llama-101m-gqa.q3_k_m.gguf new file mode 100644 index 0000000..08bfe1d --- /dev/null +++ b/smol_llama-101m-gqa.q3_k_m.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b75e3ef95ad4a6f0275d707580b24c4c70a2a2876a129314e80e57206dd0761 +size 57062016 diff --git a/smol_llama-101m-gqa.q4_k_m.gguf 
b/smol_llama-101m-gqa.q4_k_m.gguf new file mode 100644 index 0000000..07cb632 --- /dev/null +++ b/smol_llama-101m-gqa.q4_k_m.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ffd327c914074b08301aa288bb0344f44915d315bc5526d6ae6a0f8c79c552a +size 65404800 diff --git a/smol_llama-101m-gqa.q5_k_m.gguf b/smol_llama-101m-gqa.q5_k_m.gguf new file mode 100644 index 0000000..dac43c9 --- /dev/null +++ b/smol_llama-101m-gqa.q5_k_m.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6a44697c898f489d975134012291add0eb5bedbdbad123363bba70fbe4bb3a0 +size 74338176 diff --git a/smol_llama-101m-gqa.q6_k.gguf b/smol_llama-101m-gqa.q6_k.gguf new file mode 100644 index 0000000..45495aa --- /dev/null +++ b/smol_llama-101m-gqa.q6_k.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b03454870d97720a616761fd3626f0a02ec0dc5bddb48989f1069ce8da7ffaa5 +size 83829888 diff --git a/smol_llama-101m-gqa.q8_0.gguf b/smol_llama-101m-gqa.q8_0.gguf new file mode 100644 index 0000000..3eb20c4 --- /dev/null +++ b/smol_llama-101m-gqa.q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3759687f4e76bd4387d84a7eb049ace18b4a7abb56ec185796c373173dd6f93e +size 108352128