From 14f619e6b0df3ae9c9415b22d03b77b4cf803af2 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Fri, 19 Jun 2026 06:15:17 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: Eclipse-Senpai/KeyLM-75M-Instruct-GGUF Source: Original Platform --- .gitattributes | 36 +++++++++++++++++++++++++ KeyLM-75M-Instruct.F16.gguf | 3 +++ README.md | 52 +++++++++++++++++++++++++++++++++++++ 3 files changed, 91 insertions(+) create mode 100644 .gitattributes create mode 100644 KeyLM-75M-Instruct.F16.gguf create mode 100644 README.md diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..2ac3e95 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,36 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs 
-text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +KeyLM-75M-Instruct.F16.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/KeyLM-75M-Instruct.F16.gguf b/KeyLM-75M-Instruct.F16.gguf new file mode 100644 index 0000000..c11d9b9 --- /dev/null +++ b/KeyLM-75M-Instruct.F16.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c258bc317340147eb13f7455900560f958ed6f1f723fa58c90090cbad443a56 +size 150979840 diff --git a/README.md b/README.md new file mode 100644 index 0000000..621bc56 --- /dev/null +++ b/README.md @@ -0,0 +1,52 @@ +--- +license: apache-2.0 +language: +- en +base_model: Eclipse-Senpai/KeyLM-75M-Instruct +base_model_relation: quantized +pipeline_tag: text-generation +library_name: gguf +tags: +- keylm +- gguf +- llama.cpp +- small-language-model +- instruct +--- + +# KeyLM-75M-Instruct-GGUF + +GGUF builds of [**KeyLM-75M-Instruct**](https://huggingface.co/Eclipse-Senpai/KeyLM-75M-Instruct) for `llama.cpp`, LM Studio, Ollama, and other GGUF runtimes. + +KeyLM is a 75M-parameter instruction-tuned language model trained from scratch on approximately 18 billion tokens. See the [main model card](https://huggingface.co/Eclipse-Senpai/KeyLM-75M-Instruct) for benchmarks, training details, limitations, and the `transformers` (safetensors) version. + +## Files + +| File | Quant | Size | Notes | +|---|---|---|---| +| `KeyLM-75M-Instruct.F16.gguf` | F16 | ~144 MB | Full precision and recommended. The model is already tiny, so there is little reason to quantize further. 
| + +## Run with llama.cpp + +```bash +# straight from the Hub +llama-cli -hf Eclipse-Senpai/KeyLM-75M-Instruct-GGUF -cnv + +# or a local file +llama-cli -m KeyLM-75M-Instruct.F16.gguf -cnv +``` + +The chat template (`User:` / `Assistant:`, assistant turns ending with an end-of-sequence token) is embedded in the GGUF, so conversation mode (`-cnv`) applies it automatically. + +## LM Studio / Ollama + +- **LM Studio:** load the `.gguf`; the embedded chat template is detected automatically. +- **Ollama:** `ollama run hf.co/Eclipse-Senpai/KeyLM-75M-Instruct-GGUF` + +## Notes & limitations + +KeyLM is a tiny model: good at simple instruction following and short chat, near random chance on knowledge/reasoning benchmarks. It is not a factual assistant. Full numbers and caveats are on the [main model card](https://huggingface.co/Eclipse-Senpai/KeyLM-75M-Instruct). + +## License + +Apache 2.0.