commit aac090c485bef8044395c287caed6d075d9b4b73 Author: ModelHub XC Date: Wed Apr 29 06:12:31 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: inspirebek/qwen3-4b-uzbek-v2-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..3587589 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,44 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +qwen3-4b-uzbek-v2-f16.gguf filter=lfs diff=lfs merge=lfs -text +qwen3-4b-uzbek-v2-q2_k.gguf filter=lfs 
diff=lfs merge=lfs -text +qwen3-4b-uzbek-v2-q3_k_m.gguf filter=lfs diff=lfs merge=lfs -text +qwen3-4b-uzbek-v2-q4_k_m.gguf filter=lfs diff=lfs merge=lfs -text +qwen3-4b-uzbek-v2-q4_k_s.gguf filter=lfs diff=lfs merge=lfs -text +qwen3-4b-uzbek-v2-q5_k_m.gguf filter=lfs diff=lfs merge=lfs -text +qwen3-4b-uzbek-v2-q5_k_s.gguf filter=lfs diff=lfs merge=lfs -text +qwen3-4b-uzbek-v2-q6_k.gguf filter=lfs diff=lfs merge=lfs -text +qwen3-4b-uzbek-v2-q8_0.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..354b7d4 --- /dev/null +++ b/README.md @@ -0,0 +1,89 @@ +--- +language: +- uz +- en +license: cc-by-nc-4.0 +datasets: +- yakhyo/uz-wiki +- tahrirchi/uz-books-v2 +- tahrirchi/uz-crawl +- saillab/alpaca_uzbek_taco +- behbudiy/alpaca-cleaned-uz +- UAzimov/uzbek-instruct-llm +- CohereLabs/aya_collection_language_split +- med-alex/qa_mt_ru_to_uzn +- med-alex/qa_mt_tr_to_uzn +library_name: gguf +pipeline_tag: text-generation +base_model: inspirebek/qwen3-4b-uzbek-v2 +tags: +- uzbek +- qwen3 +- quantized +- gguf +- llama.cpp +- ollama +--- + +# qwen3-4b-uzbek-v2-gguf + +gguf suite for [`inspirebek/qwen3-4b-uzbek-v2`](https://huggingface.co/inspirebek/qwen3-4b-uzbek-v2). cpu / apple silicon / vulkan / rocm via `llama.cpp`, ollama, lm studio, etc. + +## files + +| quant | size | notes | +|---|---|---| +| `f16` | 8.8 gb | reference fp16 | +| `Q8_0` | 4.7 gb | near-lossless | +| `Q6_K` | 3.6 gb | recommended for quality | +| `Q5_K_M` | 3.2 gb | balanced | +| `Q5_K_S` | 3.1 gb | slightly lighter | +| `Q4_K_M` | 2.7 gb | **recommended for most users** | +| `Q4_K_S` | 2.6 gb | smaller, slight quality loss | +| `Q3_K_M` | 2.2 gb | aggressive | +| `Q2_K` | 1.8 gb | edge / low-ram only | + +## usage + +**llama.cpp:** + +```bash +llama-cli -m qwen3-4b-uzbek-v2-q4_k_m.gguf -p "Salom! Qalaysan?" 
-cnv +``` + +**ollama:** + +```bash +ollama run hf.co/inspirebek/qwen3-4b-uzbek-v2-GGUF:Q4_K_M +``` + +## quantization + +converted from the bf16 merged model via `llama.cpp`'s `convert_hf_to_gguf.py` → `llama-quantize`. no calibration data or importance matrix (imatrix) was used; the k-quants were produced from the model weights alone. + +## datasets + +**stage a — fluency (continued pretraining):** + +- [`yakhyo/uz-wiki`](https://huggingface.co/datasets/yakhyo/uz-wiki) · MIT +- [`tahrirchi/uz-books-v2`](https://huggingface.co/datasets/tahrirchi/uz-books-v2) · MIT +- [`tahrirchi/uz-crawl`](https://huggingface.co/datasets/tahrirchi/uz-crawl) · Apache-2.0 + +**stage b — instruct (sft):** + +- [`saillab/alpaca_uzbek_taco`](https://huggingface.co/datasets/saillab/alpaca_uzbek_taco) · CC-BY-NC-4.0 +- [`behbudiy/alpaca-cleaned-uz`](https://huggingface.co/datasets/behbudiy/alpaca-cleaned-uz) · CC-BY-4.0 +- [`UAzimov/uzbek-instruct-llm`](https://huggingface.co/datasets/UAzimov/uzbek-instruct-llm) · Apache-2.0 +- [`CohereLabs/aya_collection_language_split`](https://huggingface.co/datasets/CohereLabs/aya_collection_language_split) · Apache-2.0 +- [`med-alex/qa_mt_ru_to_uzn`](https://huggingface.co/datasets/med-alex/qa_mt_ru_to_uzn) · unspecified +- [`med-alex/qa_mt_tr_to_uzn`](https://huggingface.co/datasets/med-alex/qa_mt_tr_to_uzn) · unspecified + +> ⚠️ licensing note: `saillab/alpaca_uzbek_taco` is cc-by-nc-4.0, which restricts commercial use of derivative models. downstream users who need a fully permissive license should retrain without that subset. 
+ +## sibling formats + +- [`inspirebek/qwen3-4b-uzbek-v2`](https://huggingface.co/inspirebek/qwen3-4b-uzbek-v2) +- [`inspirebek/qwen3-4b-uzbek-v2-lora`](https://huggingface.co/inspirebek/qwen3-4b-uzbek-v2-lora) +- [`inspirebek/qwen3-4b-uzbek-v2-bnb-4bit`](https://huggingface.co/inspirebek/qwen3-4b-uzbek-v2-bnb-4bit) +- [`inspirebek/qwen3-4b-uzbek-v2-awq`](https://huggingface.co/inspirebek/qwen3-4b-uzbek-v2-awq) +- [`inspirebek/qwen3-4b-uzbek-v2-GGUF`](https://huggingface.co/inspirebek/qwen3-4b-uzbek-v2-GGUF) diff --git a/qwen3-4b-uzbek-v2-f16.gguf b/qwen3-4b-uzbek-v2-f16.gguf new file mode 100644 index 0000000..47e7117 --- /dev/null +++ b/qwen3-4b-uzbek-v2-f16.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac6d636d1934ef37e2f3b73424c9b9fbf8762c2f997f6823098f7e8399e4b4b1 +size 8829197760 diff --git a/qwen3-4b-uzbek-v2-q2_k.gguf b/qwen3-4b-uzbek-v2-q2_k.gguf new file mode 100644 index 0000000..12ebda9 --- /dev/null +++ b/qwen3-4b-uzbek-v2-q2_k.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fec0869049c20a4b715e1801d43ad3b770673b235a9e5bddfed3da01cc7e803 +size 1797126080 diff --git a/qwen3-4b-uzbek-v2-q3_k_m.gguf b/qwen3-4b-uzbek-v2-q3_k_m.gguf new file mode 100644 index 0000000..abd50d2 --- /dev/null +++ b/qwen3-4b-uzbek-v2-q3_k_m.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:292bfc24710e98728bb0d071f0890451de3909a8fb8d70e7652474d6397e6438 +size 2242747840 diff --git a/qwen3-4b-uzbek-v2-q4_k_m.gguf b/qwen3-4b-uzbek-v2-q4_k_m.gguf new file mode 100644 index 0000000..67c0ee1 --- /dev/null +++ b/qwen3-4b-uzbek-v2-q4_k_m.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4310a4a113c0dd24476fa51b5ffe0881a135f5821dbe66778f8be4a9a97fa001 +size 2716068800 diff --git a/qwen3-4b-uzbek-v2-q4_k_s.gguf b/qwen3-4b-uzbek-v2-q4_k_s.gguf new file mode 100644 index 0000000..f7a6b2c --- /dev/null +++ b/qwen3-4b-uzbek-v2-q4_k_s.gguf @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:370abde45cbaff2b32ac085ca5f7beadee26c5ba332f9daaa28e96603817d080 +size 2602097600 diff --git a/qwen3-4b-uzbek-v2-q5_k_m.gguf b/qwen3-4b-uzbek-v2-q5_k_m.gguf new file mode 100644 index 0000000..c6e14fa --- /dev/null +++ b/qwen3-4b-uzbek-v2-q5_k_m.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27209d83adbf8caa1d4a5f37cc2a8b6b476e0be1840794698c4a1c5a43e9e3eb +size 3156921280 diff --git a/qwen3-4b-uzbek-v2-q5_k_s.gguf b/qwen3-4b-uzbek-v2-q5_k_s.gguf new file mode 100644 index 0000000..03b0133 --- /dev/null +++ b/qwen3-4b-uzbek-v2-q5_k_s.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:337e80d16a1c1f6d7358d2140f42d9a4e17020fecda1f6af69e2ab3accb326b1 +size 3091119040 diff --git a/qwen3-4b-uzbek-v2-q6_k.gguf b/qwen3-4b-uzbek-v2-q6_k.gguf new file mode 100644 index 0000000..2ec8019 --- /dev/null +++ b/qwen3-4b-uzbek-v2-q6_k.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:303a5d2d09a4a1a0ed1af488ca6d55a9e0c35edf15330b34a402da8969e1bb84 +size 3625327040 diff --git a/qwen3-4b-uzbek-v2-q8_0.gguf b/qwen3-4b-uzbek-v2-q8_0.gguf new file mode 100644 index 0000000..44825b6 --- /dev/null +++ b/qwen3-4b-uzbek-v2-q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4496688b1cc6d3ae3217dcf8f25a84ce93f39171d1800a6dcb1bac8ffc03e8c3 +size 4693671360