From dbc46fc34acad960cb26a828526a78753e098e05 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Tue, 12 May 2026 08:24:32 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mradermacher/LFM2.5-1.2B-Saiga-It-v2-GGUF Source: Original Platform --- .gitattributes | 47 +++++++++++++++ LFM2.5-1.2B-Saiga-It-v2.IQ4_XS.gguf | 3 + LFM2.5-1.2B-Saiga-It-v2.Q2_K.gguf | 3 + LFM2.5-1.2B-Saiga-It-v2.Q3_K_L.gguf | 3 + LFM2.5-1.2B-Saiga-It-v2.Q3_K_M.gguf | 3 + LFM2.5-1.2B-Saiga-It-v2.Q3_K_S.gguf | 3 + LFM2.5-1.2B-Saiga-It-v2.Q4_K_M.gguf | 3 + LFM2.5-1.2B-Saiga-It-v2.Q4_K_S.gguf | 3 + LFM2.5-1.2B-Saiga-It-v2.Q5_K_M.gguf | 3 + LFM2.5-1.2B-Saiga-It-v2.Q5_K_S.gguf | 3 + LFM2.5-1.2B-Saiga-It-v2.Q6_K.gguf | 3 + LFM2.5-1.2B-Saiga-It-v2.Q8_0.gguf | 3 + LFM2.5-1.2B-Saiga-It-v2.f16.gguf | 3 + README.md | 89 +++++++++++++++++++++++++++++ 14 files changed, 172 insertions(+) create mode 100644 .gitattributes create mode 100644 LFM2.5-1.2B-Saiga-It-v2.IQ4_XS.gguf create mode 100644 LFM2.5-1.2B-Saiga-It-v2.Q2_K.gguf create mode 100644 LFM2.5-1.2B-Saiga-It-v2.Q3_K_L.gguf create mode 100644 LFM2.5-1.2B-Saiga-It-v2.Q3_K_M.gguf create mode 100644 LFM2.5-1.2B-Saiga-It-v2.Q3_K_S.gguf create mode 100644 LFM2.5-1.2B-Saiga-It-v2.Q4_K_M.gguf create mode 100644 LFM2.5-1.2B-Saiga-It-v2.Q4_K_S.gguf create mode 100644 LFM2.5-1.2B-Saiga-It-v2.Q5_K_M.gguf create mode 100644 LFM2.5-1.2B-Saiga-It-v2.Q5_K_S.gguf create mode 100644 LFM2.5-1.2B-Saiga-It-v2.Q6_K.gguf create mode 100644 LFM2.5-1.2B-Saiga-It-v2.Q8_0.gguf create mode 100644 LFM2.5-1.2B-Saiga-It-v2.f16.gguf create mode 100644 README.md diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..478aca8 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,47 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow 
filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +LFM2.5-1.2B-Saiga-It-v2.IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +LFM2.5-1.2B-Saiga-It-v2.Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +LFM2.5-1.2B-Saiga-It-v2.Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +LFM2.5-1.2B-Saiga-It-v2.Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +LFM2.5-1.2B-Saiga-It-v2.Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +LFM2.5-1.2B-Saiga-It-v2.Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +LFM2.5-1.2B-Saiga-It-v2.Q4_K_S.gguf filter=lfs diff=lfs 
merge=lfs -text +LFM2.5-1.2B-Saiga-It-v2.Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +LFM2.5-1.2B-Saiga-It-v2.Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +LFM2.5-1.2B-Saiga-It-v2.Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +LFM2.5-1.2B-Saiga-It-v2.Q8_0.gguf filter=lfs diff=lfs merge=lfs -text +LFM2.5-1.2B-Saiga-It-v2.f16.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/LFM2.5-1.2B-Saiga-It-v2.IQ4_XS.gguf b/LFM2.5-1.2B-Saiga-It-v2.IQ4_XS.gguf new file mode 100644 index 0000000..70fa035 --- /dev/null +++ b/LFM2.5-1.2B-Saiga-It-v2.IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b9b2fc12f233e82945a6341bb141a7c621f4f4a2670456fb45dea3accf1779a +size 668621824 diff --git a/LFM2.5-1.2B-Saiga-It-v2.Q2_K.gguf b/LFM2.5-1.2B-Saiga-It-v2.Q2_K.gguf new file mode 100644 index 0000000..b53ee20 --- /dev/null +++ b/LFM2.5-1.2B-Saiga-It-v2.Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54a14ac8cddab7ecf0d9f2e0f44e80debdb7b0fa5a2158749ac276e7c0aef09c +size 483400704 diff --git a/LFM2.5-1.2B-Saiga-It-v2.Q3_K_L.gguf b/LFM2.5-1.2B-Saiga-It-v2.Q3_K_L.gguf new file mode 100644 index 0000000..fa38022 --- /dev/null +++ b/LFM2.5-1.2B-Saiga-It-v2.Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47c583f6073650ff83db224368e6d4577b31401281ba60365e43f726ffbebf83 +size 635476992 diff --git a/LFM2.5-1.2B-Saiga-It-v2.Q3_K_M.gguf b/LFM2.5-1.2B-Saiga-It-v2.Q3_K_M.gguf new file mode 100644 index 0000000..49f8352 --- /dev/null +++ b/LFM2.5-1.2B-Saiga-It-v2.Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b787e582d927641c3a79d785c2622c7f877c9a1f7bb0fc14c92362d35a3a772c +size 600349696 diff --git a/LFM2.5-1.2B-Saiga-It-v2.Q3_K_S.gguf b/LFM2.5-1.2B-Saiga-It-v2.Q3_K_S.gguf new file mode 100644 index 0000000..d38cc10 --- /dev/null +++ b/LFM2.5-1.2B-Saiga-It-v2.Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:d49789a893184f30c399c3dcf7c5f5040b2270044a758760a4ca97ba7faf6b42 +size 558160896 diff --git a/LFM2.5-1.2B-Saiga-It-v2.Q4_K_M.gguf b/LFM2.5-1.2B-Saiga-It-v2.Q4_K_M.gguf new file mode 100644 index 0000000..b36374f --- /dev/null +++ b/LFM2.5-1.2B-Saiga-It-v2.Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af1db4151ab2860df1ee6bdbda0812aeb98c237aac1aa2044f000363d053da17 +size 730897408 diff --git a/LFM2.5-1.2B-Saiga-It-v2.Q4_K_S.gguf b/LFM2.5-1.2B-Saiga-It-v2.Q4_K_S.gguf new file mode 100644 index 0000000..263434d --- /dev/null +++ b/LFM2.5-1.2B-Saiga-It-v2.Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fca48bdec2134871ed447a787d0af974946bf0df8d45447c78f29953953e5d5 +size 700472320 diff --git a/LFM2.5-1.2B-Saiga-It-v2.Q5_K_M.gguf b/LFM2.5-1.2B-Saiga-It-v2.Q5_K_M.gguf new file mode 100644 index 0000000..6e69916 --- /dev/null +++ b/LFM2.5-1.2B-Saiga-It-v2.Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3e2589407020ac4636ffbb3eb0e18eb65c220ab88f741de7a07c1f3356ec4b7 +size 843357184 diff --git a/LFM2.5-1.2B-Saiga-It-v2.Q5_K_S.gguf b/LFM2.5-1.2B-Saiga-It-v2.Q5_K_S.gguf new file mode 100644 index 0000000..f1f0b7f --- /dev/null +++ b/LFM2.5-1.2B-Saiga-It-v2.Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdbd874bcfd3ffc4ed4248f573cc58c9fc55f41bbd1f711201e536a2be4d8f4a +size 825252864 diff --git a/LFM2.5-1.2B-Saiga-It-v2.Q6_K.gguf b/LFM2.5-1.2B-Saiga-It-v2.Q6_K.gguf new file mode 100644 index 0000000..1631c2c --- /dev/null +++ b/LFM2.5-1.2B-Saiga-It-v2.Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:baa4109d866a5babf252ba3cb83a7983383ca68f130c4569507ce3fff0412122 +size 962845696 diff --git a/LFM2.5-1.2B-Saiga-It-v2.Q8_0.gguf b/LFM2.5-1.2B-Saiga-It-v2.Q8_0.gguf new file mode 100644 index 0000000..669d4d3 --- /dev/null +++ b/LFM2.5-1.2B-Saiga-It-v2.Q8_0.gguf @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:fb26c515ae2f59063623e7974c7754e6e82c88fc83ee82e7a88d67f74129d598 +size 1246256128 diff --git a/LFM2.5-1.2B-Saiga-It-v2.f16.gguf b/LFM2.5-1.2B-Saiga-It-v2.f16.gguf new file mode 100644 index 0000000..52b64c5 --- /dev/null +++ b/LFM2.5-1.2B-Saiga-It-v2.f16.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e68f1d8bdea1df4b543afc9b65efabcaf91e85c6f0ab0d25bc5d68403cfb8b3 +size 2343328768 diff --git a/README.md b/README.md new file mode 100644 index 0000000..f5b1133 --- /dev/null +++ b/README.md @@ -0,0 +1,89 @@ +--- +base_model: NickupAI/LFM2.5-1.2B-Saiga-It-v2 +datasets: +- IlyaGusev/saiga_scored +- d0rj/alpaca-cleaned-ru +- IlyaGusev/ru_sharegpt_cleaned +- IlyaGusev/ru_turbo_saiga +- lksy/ru_instruct_gpt4 +- wikimedia/wikipedia +- uonlp/CulturaX +- allenai/c4 +language: +- ru +- en +library_name: transformers +license: other +mradermacher: + readme_rev: 1 +quantized_by: mradermacher +tags: +- russian +- saiga +- continued-pretraining +- sft +- lfm +- liquid-ai +--- +## About + + + + + + + + + +static quants of https://huggingface.co/NickupAI/LFM2.5-1.2B-Saiga-It-v2 + + + +***For a convenient overview and download list, visit our [model page for this model](https://hf.tst.eu/model#LFM2.5-1.2B-Saiga-It-v2-GGUF).*** + +weighted/imatrix quants are available at https://huggingface.co/mradermacher/LFM2.5-1.2B-Saiga-It-v2-i1-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. 
IQ-quants are often preferable over similar-sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/LFM2.5-1.2B-Saiga-It-v2-GGUF/resolve/main/LFM2.5-1.2B-Saiga-It-v2.Q2_K.gguf) | Q2_K | 0.6 | | +| [GGUF](https://huggingface.co/mradermacher/LFM2.5-1.2B-Saiga-It-v2-GGUF/resolve/main/LFM2.5-1.2B-Saiga-It-v2.Q3_K_S.gguf) | Q3_K_S | 0.7 | | +| [GGUF](https://huggingface.co/mradermacher/LFM2.5-1.2B-Saiga-It-v2-GGUF/resolve/main/LFM2.5-1.2B-Saiga-It-v2.Q3_K_M.gguf) | Q3_K_M | 0.7 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/LFM2.5-1.2B-Saiga-It-v2-GGUF/resolve/main/LFM2.5-1.2B-Saiga-It-v2.Q3_K_L.gguf) | Q3_K_L | 0.7 | | +| [GGUF](https://huggingface.co/mradermacher/LFM2.5-1.2B-Saiga-It-v2-GGUF/resolve/main/LFM2.5-1.2B-Saiga-It-v2.IQ4_XS.gguf) | IQ4_XS | 0.8 | | +| [GGUF](https://huggingface.co/mradermacher/LFM2.5-1.2B-Saiga-It-v2-GGUF/resolve/main/LFM2.5-1.2B-Saiga-It-v2.Q4_K_S.gguf) | Q4_K_S | 0.8 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/LFM2.5-1.2B-Saiga-It-v2-GGUF/resolve/main/LFM2.5-1.2B-Saiga-It-v2.Q4_K_M.gguf) | Q4_K_M | 0.8 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/LFM2.5-1.2B-Saiga-It-v2-GGUF/resolve/main/LFM2.5-1.2B-Saiga-It-v2.Q5_K_S.gguf) | Q5_K_S | 0.9 | | +| [GGUF](https://huggingface.co/mradermacher/LFM2.5-1.2B-Saiga-It-v2-GGUF/resolve/main/LFM2.5-1.2B-Saiga-It-v2.Q5_K_M.gguf) | Q5_K_M | 0.9 | | +| [GGUF](https://huggingface.co/mradermacher/LFM2.5-1.2B-Saiga-It-v2-GGUF/resolve/main/LFM2.5-1.2B-Saiga-It-v2.Q6_K.gguf) | Q6_K | 1.1 | very good quality | +| [GGUF](https://huggingface.co/mradermacher/LFM2.5-1.2B-Saiga-It-v2-GGUF/resolve/main/LFM2.5-1.2B-Saiga-It-v2.Q8_0.gguf) | Q8_0 | 1.3 | fast, best quality | +| [GGUF](https://huggingface.co/mradermacher/LFM2.5-1.2B-Saiga-It-v2-GGUF/resolve/main/LFM2.5-1.2B-Saiga-It-v2.f16.gguf) | f16 | 2.4 | 16 bpw, overkill | + +Here is a handy graph by ikawrakow comparing 
some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for answers to +questions you might have, or to request that another model be quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. + +