From 17154a1ff7365976b97e2ed9ce4c2435dc40f83e Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Sun, 24 May 2026 03:16:15 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mradermacher/VezilkaLLM-GGUF Source: Original Platform --- .gitattributes | 47 ++++++++++++++++++++++++++++ README.md | 69 ++++++++++++++++++++++++++++++++++++++++++ VezilkaLLM.IQ4_XS.gguf | 3 ++ VezilkaLLM.Q2_K.gguf | 3 ++ VezilkaLLM.Q3_K_L.gguf | 3 ++ VezilkaLLM.Q3_K_M.gguf | 3 ++ VezilkaLLM.Q3_K_S.gguf | 3 ++ VezilkaLLM.Q4_K_M.gguf | 3 ++ VezilkaLLM.Q4_K_S.gguf | 3 ++ VezilkaLLM.Q5_K_M.gguf | 3 ++ VezilkaLLM.Q5_K_S.gguf | 3 ++ VezilkaLLM.Q6_K.gguf | 3 ++ VezilkaLLM.Q8_0.gguf | 3 ++ VezilkaLLM.f16.gguf | 3 ++ 14 files changed, 152 insertions(+) create mode 100644 .gitattributes create mode 100644 README.md create mode 100644 VezilkaLLM.IQ4_XS.gguf create mode 100644 VezilkaLLM.Q2_K.gguf create mode 100644 VezilkaLLM.Q3_K_L.gguf create mode 100644 VezilkaLLM.Q3_K_M.gguf create mode 100644 VezilkaLLM.Q3_K_S.gguf create mode 100644 VezilkaLLM.Q4_K_M.gguf create mode 100644 VezilkaLLM.Q4_K_S.gguf create mode 100644 VezilkaLLM.Q5_K_M.gguf create mode 100644 VezilkaLLM.Q5_K_S.gguf create mode 100644 VezilkaLLM.Q6_K.gguf create mode 100644 VezilkaLLM.Q8_0.gguf create mode 100644 VezilkaLLM.f16.gguf diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..b5006da --- /dev/null +++ b/.gitattributes @@ -0,0 +1,47 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs 
-text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +VezilkaLLM.IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +VezilkaLLM.Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +VezilkaLLM.Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +VezilkaLLM.Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +VezilkaLLM.Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +VezilkaLLM.Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +VezilkaLLM.Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +VezilkaLLM.Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +VezilkaLLM.Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +VezilkaLLM.Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +VezilkaLLM.Q8_0.gguf filter=lfs diff=lfs merge=lfs -text +VezilkaLLM.f16.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 
0000000..c854348 --- /dev/null +++ b/README.md @@ -0,0 +1,69 @@ +--- +base_model: peshevskidimitar/VezilkaLLM +language: +- en +library_name: transformers +mradermacher: + readme_rev: 1 +quantized_by: mradermacher +tags: [] +--- +## About + + + + + + +static quants of https://huggingface.co/peshevskidimitar/VezilkaLLM + + + +***For a convenient overview and download list, visit our [model page for this model](https://hf.tst.eu/model#VezilkaLLM-GGUF).*** + +weighted/imatrix quants are available at https://huggingface.co/mradermacher/VezilkaLLM-i1-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similarly sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/VezilkaLLM-GGUF/resolve/main/VezilkaLLM.Q2_K.gguf) | Q2_K | 1.8 | | +| [GGUF](https://huggingface.co/mradermacher/VezilkaLLM-GGUF/resolve/main/VezilkaLLM.Q3_K_S.gguf) | Q3_K_S | 2.0 | | +| [GGUF](https://huggingface.co/mradermacher/VezilkaLLM-GGUF/resolve/main/VezilkaLLM.Q3_K_M.gguf) | Q3_K_M | 2.2 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/VezilkaLLM-GGUF/resolve/main/VezilkaLLM.Q3_K_L.gguf) | Q3_K_L | 2.3 | | +| [GGUF](https://huggingface.co/mradermacher/VezilkaLLM-GGUF/resolve/main/VezilkaLLM.IQ4_XS.gguf) | IQ4_XS | 2.4 | | +| [GGUF](https://huggingface.co/mradermacher/VezilkaLLM-GGUF/resolve/main/VezilkaLLM.Q4_K_S.gguf) | Q4_K_S | 2.5 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/VezilkaLLM-GGUF/resolve/main/VezilkaLLM.Q4_K_M.gguf) | Q4_K_M | 2.6 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/VezilkaLLM-GGUF/resolve/main/VezilkaLLM.Q5_K_S.gguf) | Q5_K_S | 2.9 | | +| 
[GGUF](https://huggingface.co/mradermacher/VezilkaLLM-GGUF/resolve/main/VezilkaLLM.Q5_K_M.gguf) | Q5_K_M | 2.9 | | +| [GGUF](https://huggingface.co/mradermacher/VezilkaLLM-GGUF/resolve/main/VezilkaLLM.Q6_K.gguf) | Q6_K | 3.3 | very good quality | +| [GGUF](https://huggingface.co/mradermacher/VezilkaLLM-GGUF/resolve/main/VezilkaLLM.Q8_0.gguf) | Q8_0 | 4.2 | fast, best quality | +| [GGUF](https://huggingface.co/mradermacher/VezilkaLLM-GGUF/resolve/main/VezilkaLLM.f16.gguf) | f16 | 7.9 | 16 bpw, overkill | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. 
+ + diff --git a/VezilkaLLM.IQ4_XS.gguf b/VezilkaLLM.IQ4_XS.gguf new file mode 100644 index 0000000..59a7148 --- /dev/null +++ b/VezilkaLLM.IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4453b990281dc37edc77c3f98536f05cb15dbccad6a9d3bd8a2e93ec6cb423d1 +size 2279624256 diff --git a/VezilkaLLM.Q2_K.gguf b/VezilkaLLM.Q2_K.gguf new file mode 100644 index 0000000..d7b5c71 --- /dev/null +++ b/VezilkaLLM.Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2f30307339f6d6ae800659c281f2078334900126f2b340b8c58f927e50b113b +size 1729162816 diff --git a/VezilkaLLM.Q3_K_L.gguf b/VezilkaLLM.Q3_K_L.gguf new file mode 100644 index 0000000..b5e5125 --- /dev/null +++ b/VezilkaLLM.Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faaafc016bf2578ee5c1cd1c3f137704f8134892ae9063f6c52cfc76e27ca2cc +size 2236083776 diff --git a/VezilkaLLM.Q3_K_M.gguf b/VezilkaLLM.Q3_K_M.gguf new file mode 100644 index 0000000..ce568ad --- /dev/null +++ b/VezilkaLLM.Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08750c909ff91b4b68bc751376d1dce560ad9916a3fd77922b31add162e56a26 +size 2098458176 diff --git a/VezilkaLLM.Q3_K_S.gguf b/VezilkaLLM.Q3_K_S.gguf new file mode 100644 index 0000000..3856c5c --- /dev/null +++ b/VezilkaLLM.Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6e97ccc22b0fe5a6efafac0ed774936d5ed2235d02b96482d5ec411465eefb0 +size 1937362496 diff --git a/VezilkaLLM.Q4_K_M.gguf b/VezilkaLLM.Q4_K_M.gguf new file mode 100644 index 0000000..1f11b44 --- /dev/null +++ b/VezilkaLLM.Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c0c15a7bf7b44e9ad21691ac1bd330f51e14e39b43fbd5e4d08668a080e3715 +size 2489892416 diff --git a/VezilkaLLM.Q4_K_S.gguf b/VezilkaLLM.Q4_K_S.gguf new file mode 100644 index 0000000..557a674 --- /dev/null +++ b/VezilkaLLM.Q4_K_S.gguf @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:493147a06b52f54dfeb881b7198976866a00e394264c12a44e9f65f0a8369dc9 +size 2377928256 diff --git a/VezilkaLLM.Q5_K_M.gguf b/VezilkaLLM.Q5_K_M.gguf new file mode 100644 index 0000000..3a1f89b --- /dev/null +++ b/VezilkaLLM.Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8fdb7cace61af3e87a778e8a9859c8ecaf8160102742dae1b90c6cd7e86020c +size 2829696576 diff --git a/VezilkaLLM.Q5_K_S.gguf b/VezilkaLLM.Q5_K_S.gguf new file mode 100644 index 0000000..b2d7bc0 --- /dev/null +++ b/VezilkaLLM.Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a85a88b28c0e2d7bcd5d9af4845d03af0c353890e1c98f6228e681dc85fb6ce +size 2764590656 diff --git a/VezilkaLLM.Q6_K.gguf b/VezilkaLLM.Q6_K.gguf new file mode 100644 index 0000000..5beb690 --- /dev/null +++ b/VezilkaLLM.Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c1262ede29a8028bdd6e7f30467f98eba0e032e1c1699bf474e35957b2ea129 +size 3190738496 diff --git a/VezilkaLLM.Q8_0.gguf b/VezilkaLLM.Q8_0.gguf new file mode 100644 index 0000000..4cc312c --- /dev/null +++ b/VezilkaLLM.Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a697f82544ecd9e048115005ec6fdfd8733ad7f2e6582e62bff3cd3e124b7cc +size 4130400576 diff --git a/VezilkaLLM.f16.gguf b/VezilkaLLM.f16.gguf new file mode 100644 index 0000000..ec1dc91 --- /dev/null +++ b/VezilkaLLM.f16.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e27d8fe877d2fe1bf61b0cc8c9a02476575b06e085b69b77b92862d3ef8976f1 +size 7767802176