From 7171db38079b568cbfb3743974b8a8764b12284f Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Wed, 22 Apr 2026 12:19:34 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mradermacher/karasu-1.1B-GGUF Source: Original Platform --- .gitattributes | 47 ++++++++++++++++++++++++++++ README.md | 69 +++++++++++++++++++++++++++++++++++++++++ karasu-1.1B.IQ4_XS.gguf | 3 ++ karasu-1.1B.Q2_K.gguf | 3 ++ karasu-1.1B.Q3_K_L.gguf | 3 ++ karasu-1.1B.Q3_K_M.gguf | 3 ++ karasu-1.1B.Q3_K_S.gguf | 3 ++ karasu-1.1B.Q4_K_M.gguf | 3 ++ karasu-1.1B.Q4_K_S.gguf | 3 ++ karasu-1.1B.Q5_K_M.gguf | 3 ++ karasu-1.1B.Q5_K_S.gguf | 3 ++ karasu-1.1B.Q6_K.gguf | 3 ++ karasu-1.1B.Q8_0.gguf | 3 ++ karasu-1.1B.f16.gguf | 3 ++ 14 files changed, 152 insertions(+) create mode 100644 .gitattributes create mode 100644 README.md create mode 100644 karasu-1.1B.IQ4_XS.gguf create mode 100644 karasu-1.1B.Q2_K.gguf create mode 100644 karasu-1.1B.Q3_K_L.gguf create mode 100644 karasu-1.1B.Q3_K_M.gguf create mode 100644 karasu-1.1B.Q3_K_S.gguf create mode 100644 karasu-1.1B.Q4_K_M.gguf create mode 100644 karasu-1.1B.Q4_K_S.gguf create mode 100644 karasu-1.1B.Q5_K_M.gguf create mode 100644 karasu-1.1B.Q5_K_S.gguf create mode 100644 karasu-1.1B.Q6_K.gguf create mode 100644 karasu-1.1B.Q8_0.gguf create mode 100644 karasu-1.1B.f16.gguf diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..0b12f6b --- /dev/null +++ b/.gitattributes @@ -0,0 +1,47 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 
filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +karasu-1.1B.Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +karasu-1.1B.Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +karasu-1.1B.Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +karasu-1.1B.f16.gguf filter=lfs diff=lfs merge=lfs -text +karasu-1.1B.Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +karasu-1.1B.Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +karasu-1.1B.Q8_0.gguf filter=lfs diff=lfs merge=lfs -text +karasu-1.1B.Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +karasu-1.1B.Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +karasu-1.1B.Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +karasu-1.1B.Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +karasu-1.1B.IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md 
b/README.md new file mode 100644 index 0000000..fc2c814 --- /dev/null +++ b/README.md @@ -0,0 +1,69 @@ +--- +base_model: lightblue/karasu-1.1B +datasets: +- oscar-corpus/OSCAR-2301 +- mc4 +language: +- ja +library_name: transformers +license: apache-2.0 +license_link: https://github.com/QwenLM/Qwen/blob/main/Tongyi%20Qianwen%20LICENSE%20AGREEMENT +license_name: tongyi-qianwen-license-agreement +quantized_by: mradermacher +--- +## About + + + + + + +static quants of https://huggingface.co/lightblue/karasu-1.1B + + +weighted/imatrix quants are available at https://huggingface.co/mradermacher/karasu-1.1B-i1-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable to similar-sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/karasu-1.1B-GGUF/resolve/main/karasu-1.1B.Q2_K.gguf) | Q2_K | 0.5 | | +| [GGUF](https://huggingface.co/mradermacher/karasu-1.1B-GGUF/resolve/main/karasu-1.1B.Q3_K_S.gguf) | Q3_K_S | 0.6 | | +| [GGUF](https://huggingface.co/mradermacher/karasu-1.1B-GGUF/resolve/main/karasu-1.1B.Q3_K_M.gguf) | Q3_K_M | 0.6 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/karasu-1.1B-GGUF/resolve/main/karasu-1.1B.Q3_K_L.gguf) | Q3_K_L | 0.7 | | +| [GGUF](https://huggingface.co/mradermacher/karasu-1.1B-GGUF/resolve/main/karasu-1.1B.IQ4_XS.gguf) | IQ4_XS | 0.7 | | +| [GGUF](https://huggingface.co/mradermacher/karasu-1.1B-GGUF/resolve/main/karasu-1.1B.Q4_K_S.gguf) | Q4_K_S | 0.7 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/karasu-1.1B-GGUF/resolve/main/karasu-1.1B.Q4_K_M.gguf) | Q4_K_M | 0.8 | fast, recommended | +| 
[GGUF](https://huggingface.co/mradermacher/karasu-1.1B-GGUF/resolve/main/karasu-1.1B.Q5_K_S.gguf) | Q5_K_S | 0.9 | | +| [GGUF](https://huggingface.co/mradermacher/karasu-1.1B-GGUF/resolve/main/karasu-1.1B.Q5_K_M.gguf) | Q5_K_M | 0.9 | | +| [GGUF](https://huggingface.co/mradermacher/karasu-1.1B-GGUF/resolve/main/karasu-1.1B.Q6_K.gguf) | Q6_K | 1.0 | very good quality | +| [GGUF](https://huggingface.co/mradermacher/karasu-1.1B-GGUF/resolve/main/karasu-1.1B.Q8_0.gguf) | Q8_0 | 1.3 | fast, best quality | +| [GGUF](https://huggingface.co/mradermacher/karasu-1.1B-GGUF/resolve/main/karasu-1.1B.f16.gguf) | f16 | 2.3 | 16 bpw, overkill | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. 
+ + diff --git a/karasu-1.1B.IQ4_XS.gguf b/karasu-1.1B.IQ4_XS.gguf new file mode 100644 index 0000000..e8e9f83 --- /dev/null +++ b/karasu-1.1B.IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89171d2affee7d3b71754a8df216b1d6a8e32baacebc2aebceaa427b68074b2a +size 609807936 diff --git a/karasu-1.1B.Q2_K.gguf b/karasu-1.1B.Q2_K.gguf new file mode 100644 index 0000000..361d60d --- /dev/null +++ b/karasu-1.1B.Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:020a06eb9917255ff29b376a39b26dadd2b95c22b0f5ffd799495a9e856e5d98 +size 432131648 diff --git a/karasu-1.1B.Q3_K_L.gguf b/karasu-1.1B.Q3_K_L.gguf new file mode 100644 index 0000000..b6f9a70 --- /dev/null +++ b/karasu-1.1B.Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:833b326af3ef030c4159f4e3a96759fea1ecc8f1e9b8b4859618d21f3fbe62ce +size 591527488 diff --git a/karasu-1.1B.Q3_K_M.gguf b/karasu-1.1B.Q3_K_M.gguf new file mode 100644 index 0000000..66d4194 --- /dev/null +++ b/karasu-1.1B.Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfcb6a109fd9dd5240af2240f643686c07f5908045acee68182c88544379bbfb +size 548404800 diff --git a/karasu-1.1B.Q3_K_S.gguf b/karasu-1.1B.Q3_K_S.gguf new file mode 100644 index 0000000..3c289f8 --- /dev/null +++ b/karasu-1.1B.Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac50f0497bb5feb80656a9d60b6701a5d0cc42031f59e55d57c95d8c36d53a91 +size 499342912 diff --git a/karasu-1.1B.Q4_K_M.gguf b/karasu-1.1B.Q4_K_M.gguf new file mode 100644 index 0000000..211c8f0 --- /dev/null +++ b/karasu-1.1B.Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b95c31fc4e9d2ca90db57e0438df255865fdff0c0525a7f701b64d67a7129ea7 +size 667815488 diff --git a/karasu-1.1B.Q4_K_S.gguf b/karasu-1.1B.Q4_K_S.gguf new file mode 100644 index 0000000..ea2b06b --- /dev/null +++ b/karasu-1.1B.Q4_K_S.gguf @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:b2b4b3ecaed8476c72e39f0cb6254f454da5d876695af6cbb91c29f28ae57e7f +size 639872576 diff --git a/karasu-1.1B.Q5_K_M.gguf b/karasu-1.1B.Q5_K_M.gguf new file mode 100644 index 0000000..5874a96 --- /dev/null +++ b/karasu-1.1B.Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bda2bddaa6fa866c0e9a4d308ed9593be15a81fc176902b201c29863dc05549a +size 782044736 diff --git a/karasu-1.1B.Q5_K_S.gguf b/karasu-1.1B.Q5_K_S.gguf new file mode 100644 index 0000000..4febf01 --- /dev/null +++ b/karasu-1.1B.Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37a1ff19771d7e14176f9148714a9c35b9bfd9c87501d662ef95c703c4b12a07 +size 766029376 diff --git a/karasu-1.1B.Q6_K.gguf b/karasu-1.1B.Q6_K.gguf new file mode 100644 index 0000000..b18f1b4 --- /dev/null +++ b/karasu-1.1B.Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b8f3b571a44f7a244bb21712857e03eaec2835bb4d8f2781b4ef1396bc69f24 +size 903413312 diff --git a/karasu-1.1B.Q8_0.gguf b/karasu-1.1B.Q8_0.gguf new file mode 100644 index 0000000..dea3f1e --- /dev/null +++ b/karasu-1.1B.Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e433f92f14ddfe95c8a0b32f78fd15666bd6defad95246efc6c6a2113bf0f5a +size 1169808960 diff --git a/karasu-1.1B.f16.gguf b/karasu-1.1B.f16.gguf new file mode 100644 index 0000000..5e58c61 --- /dev/null +++ b/karasu-1.1B.f16.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:006a5c70bdeb025e6a278e983c809fb3134ad7da0281f66ed520c1922fc982ed +size 2201017920