From f8cf9cfa21058cae554965dc75b616c6bdd0f5ef Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Fri, 12 Jun 2026 23:22:19 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: North-ML1/Wind-Edge-1.6-GGUF Source: Original Platform --- .gitattributes | 42 +++++++++ README.md | 185 ++++++++++++++++++++++++++++++++++++++ Wind-Edge-1.6-F16.gguf | 3 + Wind-Edge-1.6-IQ3_M.gguf | 3 + Wind-Edge-1.6-Q4_K_M.gguf | 3 + Wind-Edge-1.6-Q6_K.gguf | 3 + Wind-Edge-1.6-Q8_0.gguf | 3 + Wind-Edge-1.6-TQ1_0.gguf | 3 + Wind-Edge-1.6-TQ2_0.gguf | 3 + 9 files changed, 248 insertions(+) create mode 100644 .gitattributes create mode 100644 README.md create mode 100644 Wind-Edge-1.6-F16.gguf create mode 100644 Wind-Edge-1.6-IQ3_M.gguf create mode 100644 Wind-Edge-1.6-Q4_K_M.gguf create mode 100644 Wind-Edge-1.6-Q6_K.gguf create mode 100644 Wind-Edge-1.6-Q8_0.gguf create mode 100644 Wind-Edge-1.6-TQ1_0.gguf create mode 100644 Wind-Edge-1.6-TQ2_0.gguf diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..e15a053 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,42 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs 
merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +Wind-Edge-1.6-F16.gguf filter=lfs diff=lfs merge=lfs -text +Wind-Edge-1.6-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +Wind-Edge-1.6-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Wind-Edge-1.6-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +Wind-Edge-1.6-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text +Wind-Edge-1.6-TQ1_0.gguf filter=lfs diff=lfs merge=lfs -text +Wind-Edge-1.6-TQ2_0.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..b5c4dcc --- /dev/null +++ b/README.md @@ -0,0 +1,185 @@ +--- +model-index: +- name: wind-edge-1.6@f16 + results: + - task: + type: text-generation + name: Code Generation + dataset: + name: CodeBench-30 + type: North-ML1/CodeBench-30 + split: train + metrics: + - name: Overall Accuracy + type: accuracy + value: 6.25 + verified: false + - name: Easy Tier Accuracy + type: accuracy + value: 17.14 + verified: false + - name: Medium Tier Accuracy + type: accuracy + value: 0.00 + verified: false + - name: Hard Tier Accuracy + type: accuracy + value: 0.00 + verified: false + +library_name: transformers +pipeline_tag: 
text-generation +tags: +- wind-edge +- causal-lm +- edge +- small-language-model +- 0.4b +license: mit +datasets: +- Jackrong/GLM-5.1-Reasoning-1M-Cleaned +language: +- en +base_model: +- North-ML1/Wind-Edge-1.6-Instruct +--- + +# Wind Edge 1.6 — Geode (0.4B) + +A 0.4B parameter causal language model built for edge deployment. Fast, small, and honest about what it can do. + +**[North ML](https://huggingface.co/north-ml1)** · [Wind Arc 1.5 Preview](https://huggingface.co/arthu1/wind-arc-1-5-preview) + +--- + +## Overview + +Wind Edge 1.6 (Geode) is a compact LLM trained for real-time, on-device inference. At 0.4B parameters it sits in the ultra-small tier — expect strong common-sense and classification performance, limited hard reasoning. + +**Best use cases:** +- Instruction-following dialogue (short to medium turns) +- Text classification and sentiment +- Light code completion +- Summarization of short passages + +**Not recommended for:** multi-step math, complex logical chains, long-context tasks. + +--- + +## Changes vs 1.5 + +- Improved instruction adherence on structured output formats +- More stable multi-sentence generation (fewer mid-sequence repetitions) +- Reduced hallucination rate on short factual queries (internal held-out eval) + +--- + +## Honest Benchmark Estimates + +Realistic ranges for a well-trained 0.4B model — not cherry-picked numbers. 
+ +| Task | Expected Range | Notes | +|-----------------------|----------------|-------| +| Common Sense (0-shot) | 0.60 – 0.68 | Reliable strength | +| Sentiment Analysis | 0.70 – 0.80 | Reliable strength | +| Text Classification | 0.68 – 0.78 | Reliable strength | +| Reading Comprehension | 0.52 – 0.63 | Context-dependent | +| Summarization | 0.58 – 0.68 | Short docs only | +| Code Generation | 0.45 – 0.58 | Simple tasks only | +| Math Reasoning | 0.15 – 0.28 | Known weak point at this scale | +| Logical Reasoning | 0.18 – 0.28 | Known weak point at this scale | + +A 0.4B model cannot compete with 7B+ on reasoning — Geode doesn't pretend to. + +--- + +## Usage + +```python +from transformers import AutoModelForCausalLM, AutoTokenizer + +model = AutoModelForCausalLM.from_pretrained("north-ml1/wind-edge-1.6") +tokenizer = AutoTokenizer.from_pretrained("north-ml1/wind-edge-1.6") + +inputs = tokenizer("You are Wind Edge, a helpful AI assistant.\nUser: ", return_tensors="pt") +output = model.generate(**inputs, max_new_tokens=256, temperature=0.6, top_p=0.9) +print(tokenizer.decode(output[0], skip_special_tokens=True)) +``` + +### Recommended Settings + +| Parameter | Value | +|--------------------|----------| +| temperature | 0.0 | +| top_p | 0.95 | +| min_p | 0.05 | +| max_new_tokens | 256–512 | +| repetition_penalty | 1.1 | +| context_limit | 1024–4096| + + +--- + +## GGUF Quantizations + +These GGUF quants were converted from [arthu1/Wind-Edge-1.6-Instruct](https://huggingface.co/arthu1/Wind-Edge-1.6-Instruct) using a Qwen3-compatible tensor layout. The Transformers repo remains canonical — use these GGUF files for llama.cpp, LM Studio, Ollama-style runtimes, and any other GGUF-compatible inference stack. + +### Files + +| File | bpw | Use | +|------|-----|-----| +| Wind-Edge-1.6-TQ1_0.gguf | ~1.7 bpw | Experimental 1-bit/ternary. Lowest quality, smallest size. | +| Wind-Edge-1.6-TQ2_0.gguf | ~2.1 bpw | Very small 2-bit/ternary option. 
| +| Wind-Edge-1.6-IQ3_M.gguf | ~3.7 bpw | Good balance for tiny devices. | +| Wind-Edge-1.6-Q4_K_M.gguf | ~4.6 bpw | **Recommended default.** | +| Wind-Edge-1.6-Q6_K.gguf | ~6.1 bpw | Higher quality, still compact. | +| Wind-Edge-1.6-Q8_0.gguf | ~8.5 bpw | Near-lossless practical quant. | +| Wind-Edge-1.6-F16.gguf | 16 bpw | Unquantized FP16 GGUF export. | + +Q4_K_M, Q6_K, and Q8_0 are the recommended daily drivers. TQ1_0 and TQ2_0 are included for constrained edge hardware but will measurably lose reasoning and factual accuracy. + +### llama.cpp + +```bash +llama-cli \ + -m Wind-Edge-1.6-Q4_K_M.gguf \ + -cnv \ + --temp 0.6 \ + --top-p 0.9 \ + --repeat-penalty 1.06 \ + -n 512 +``` + +For deterministic output, use `--temp 0` and keep prompts short. + +### Chat Template + +The GGUF metadata includes the chat template. If your runtime doesn't apply it automatically, format prompts like this: + +``` +<|im_start|>system +You are Wind-Edge-1.6, a compact AI assistant model. You are not a human.<|im_end|> +<|im_start|>user +Who are you?<|im_end|> +<|im_start|>assistant + + +``` + +--- + +## Model Details + +| Property | Value | +|----------------|-------| +| Parameters | ~0.4B | +| Architecture | Causal LM (decoder-only) | +| Context Length | 8192 tokens | +| Quantization | 1–16 bit (GGUF) | +| Org | [north-ml1](https://huggingface.co/north-ml1) | + +--- + +## License + +MIT \ No newline at end of file diff --git a/Wind-Edge-1.6-F16.gguf b/Wind-Edge-1.6-F16.gguf new file mode 100644 index 0000000..cda2c66 --- /dev/null +++ b/Wind-Edge-1.6-F16.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:108fce7c2d67173d8245fc8900cae45b2c49f5c14cd878e21210b2edabcd758b +size 883511296 diff --git a/Wind-Edge-1.6-IQ3_M.gguf b/Wind-Edge-1.6-IQ3_M.gguf new file mode 100644 index 0000000..99cace0 --- /dev/null +++ b/Wind-Edge-1.6-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:565183d11fdc63c20ee06e9f636bb508c10d5c09716fad307aa6708335fa35ea +size 263748608 
diff --git a/Wind-Edge-1.6-Q4_K_M.gguf b/Wind-Edge-1.6-Q4_K_M.gguf new file mode 100644 index 0000000..8124d57 --- /dev/null +++ b/Wind-Edge-1.6-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a9941e9f93cadc09bb49d158b2b2589c6c3ddb8debe1461840a673ecdac892e +size 302726144 diff --git a/Wind-Edge-1.6-Q6_K.gguf b/Wind-Edge-1.6-Q6_K.gguf new file mode 100644 index 0000000..53d898b --- /dev/null +++ b/Wind-Edge-1.6-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6942f53c62fa4d41811932626bee62bff5d5ed668efd5a97c09ed66412d1b93f +size 365984768 diff --git a/Wind-Edge-1.6-Q8_0.gguf b/Wind-Edge-1.6-Q8_0.gguf new file mode 100644 index 0000000..196405f --- /dev/null +++ b/Wind-Edge-1.6-Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb883838ea397002683d1ee93846bbe994c1bfab61cf051679a519668adae999 +size 472231936 diff --git a/Wind-Edge-1.6-TQ1_0.gguf b/Wind-Edge-1.6-TQ1_0.gguf new file mode 100644 index 0000000..9a8b2ed --- /dev/null +++ b/Wind-Edge-1.6-TQ1_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d91eb211d1b00708247a9610281322cb4c7f3999f8f164099e6e1397c80f09d8 +size 193461248 diff --git a/Wind-Edge-1.6-TQ2_0.gguf b/Wind-Edge-1.6-TQ2_0.gguf new file mode 100644 index 0000000..2f29d66 --- /dev/null +++ b/Wind-Edge-1.6-TQ2_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e725eb5f2f03bc1262b18d604e689764e48ae6bab2f3ef89c1ac57ba0cf6c35 +size 206732288