commit 681bd65a47150e62edac0999df673f9469103829 Author: ModelHub XC Date: Wed Apr 22 07:46:08 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/Sala-i1-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..1ec88ed --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +Sala.imatrix.gguf filter=lfs diff=lfs merge=lfs -text +Sala.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +Sala.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +Sala.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +Sala.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +Sala.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +Sala.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Sala.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +Sala.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text +Sala.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +Sala.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Sala.i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +Sala.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +Sala.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +Sala.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Sala.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Sala.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Sala.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Sala.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +Sala.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +Sala.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Sala.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Sala.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Sala.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Sala.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..46977dd --- /dev/null +++ b/README.md @@ -0,0 +1,87 @@ +--- +base_model: Finisha-F-scratch/Sala +language: +- en +library_name: transformers +license: other +mradermacher: + readme_rev: 1 +quantized_by: mradermacher +tags: +- text-generation-inference +--- +## About + + + + + + + + + +weighted/imatrix quants of https://huggingface.co/Finisha-F-scratch/Sala + + + +***For a convenient overview and download list, visit our [model page for this model](https://hf.tst.eu/model#Sala-i1-GGUF).*** + +static quants are available at https://huggingface.co/mradermacher/Sala-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/Sala-i1-GGUF/resolve/main/Sala.imatrix.gguf) | imatrix | 0.1 | imatrix file (for creating your own quants) | +| [GGUF](https://huggingface.co/mradermacher/Sala-i1-GGUF/resolve/main/Sala.i1-IQ1_S.gguf) | i1-IQ1_S | 0.1 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/Sala-i1-GGUF/resolve/main/Sala.i1-IQ1_M.gguf) | i1-IQ1_M | 0.2 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/Sala-i1-GGUF/resolve/main/Sala.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 0.2 | | +| [GGUF](https://huggingface.co/mradermacher/Sala-i1-GGUF/resolve/main/Sala.i1-IQ2_XS.gguf) | i1-IQ2_XS | 0.2 | | +| [GGUF](https://huggingface.co/mradermacher/Sala-i1-GGUF/resolve/main/Sala.i1-IQ2_S.gguf) | i1-IQ2_S | 0.2 | | +| [GGUF](https://huggingface.co/mradermacher/Sala-i1-GGUF/resolve/main/Sala.i1-IQ2_M.gguf) | i1-IQ2_M | 0.2 | | +| [GGUF](https://huggingface.co/mradermacher/Sala-i1-GGUF/resolve/main/Sala.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 0.2 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/Sala-i1-GGUF/resolve/main/Sala.i1-Q2_K_S.gguf) | i1-Q2_K_S | 0.2 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/Sala-i1-GGUF/resolve/main/Sala.i1-Q2_K.gguf) | i1-Q2_K | 0.2 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/Sala-i1-GGUF/resolve/main/Sala.i1-IQ3_XS.gguf) | i1-IQ3_XS | 0.2 | | +| [GGUF](https://huggingface.co/mradermacher/Sala-i1-GGUF/resolve/main/Sala.i1-IQ3_S.gguf) | i1-IQ3_S | 0.2 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/Sala-i1-GGUF/resolve/main/Sala.i1-Q3_K_S.gguf) | i1-Q3_K_S | 0.2 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/Sala-i1-GGUF/resolve/main/Sala.i1-IQ3_M.gguf) | i1-IQ3_M | 0.2 | | +| [GGUF](https://huggingface.co/mradermacher/Sala-i1-GGUF/resolve/main/Sala.i1-Q3_K_M.gguf) | i1-Q3_K_M | 0.2 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/Sala-i1-GGUF/resolve/main/Sala.i1-IQ4_XS.gguf) | i1-IQ4_XS | 0.2 | | +| [GGUF](https://huggingface.co/mradermacher/Sala-i1-GGUF/resolve/main/Sala.i1-IQ4_NL.gguf) | i1-IQ4_NL | 0.2 | prefer IQ4_XS | +| [GGUF](https://huggingface.co/mradermacher/Sala-i1-GGUF/resolve/main/Sala.i1-Q4_0.gguf) | i1-Q4_0 | 0.2 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/Sala-i1-GGUF/resolve/main/Sala.i1-Q4_K_S.gguf) | i1-Q4_K_S | 0.2 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/Sala-i1-GGUF/resolve/main/Sala.i1-Q3_K_L.gguf) | i1-Q3_K_L | 0.2 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/Sala-i1-GGUF/resolve/main/Sala.i1-Q4_1.gguf) | i1-Q4_1 | 0.2 | | +| [GGUF](https://huggingface.co/mradermacher/Sala-i1-GGUF/resolve/main/Sala.i1-Q4_K_M.gguf) | i1-Q4_K_M | 0.2 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/Sala-i1-GGUF/resolve/main/Sala.i1-Q5_K_S.gguf) | i1-Q5_K_S | 0.2 | | +| [GGUF](https://huggingface.co/mradermacher/Sala-i1-GGUF/resolve/main/Sala.i1-Q5_K_M.gguf) | i1-Q5_K_M | 0.2 | | +| [GGUF](https://huggingface.co/mradermacher/Sala-i1-GGUF/resolve/main/Sala.i1-Q6_K.gguf) | i1-Q6_K | 0.2 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/Sala.i1-IQ1_M.gguf b/Sala.i1-IQ1_M.gguf new file mode 100644 index 0000000..88dc414 --- /dev/null +++ b/Sala.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bfdeb9621b044aa6e7fdcaadea64ea8b74bc7c7bab7cf58a854518ca0ef1f19 +size 51056800 diff --git a/Sala.i1-IQ1_S.gguf b/Sala.i1-IQ1_S.gguf new file mode 100644 index 0000000..71873e2 --- /dev/null +++ b/Sala.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:370d9c2189d5003b623695f6b2373afc5b8d8b0d48f870502c3c3b7e3c96287d +size 49287328 diff --git a/Sala.i1-IQ2_M.gguf b/Sala.i1-IQ2_M.gguf new file mode 100644 index 0000000..2dc4562 --- /dev/null +++ b/Sala.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e215dfd523abc2bf3476af40bdb99a1478c2a637ba07f5ab6320a3fe659bbcfd +size 60180640 diff --git a/Sala.i1-IQ2_S.gguf b/Sala.i1-IQ2_S.gguf new file mode 100644 index 0000000..6186a2a --- /dev/null +++ b/Sala.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a97df33f00b32530f6e01fb4e308393ee9eb1cec4349a599737e2e8bb4fb054 +size 57821344 diff --git a/Sala.i1-IQ2_XS.gguf b/Sala.i1-IQ2_XS.gguf new file mode 100644 index 0000000..f4744f2 --- /dev/null +++ b/Sala.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ab9465bf0ec84338e657a02155ce0799cd706e64732615c5ee2d061d764c73c +size 56586400 diff --git a/Sala.i1-IQ2_XXS.gguf b/Sala.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..42d930d --- /dev/null +++ b/Sala.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:daf26c3c77d4068bac947e4efd0fc73e5a4f0e7b95e8688dc09c1146e2016a6d +size 54005920 diff --git a/Sala.i1-IQ3_M.gguf b/Sala.i1-IQ3_M.gguf new file mode 100644 index 0000000..f7452b6 --- /dev/null +++ b/Sala.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d640e8fe25dac485d1640d84233e4d454ca912835c0f7b9747f4b4210d52737 +size 77637856 diff --git a/Sala.i1-IQ3_S.gguf b/Sala.i1-IQ3_S.gguf new file mode 100644 index 0000000..affe3b8 --- /dev/null +++ b/Sala.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b67de2d6a46a0c4a5e8f97e7f2ceb53f2bd20109c5c02e89f62281d92289d89 +size 73564384 diff --git a/Sala.i1-IQ3_XS.gguf b/Sala.i1-IQ3_XS.gguf new file mode 100644 index 0000000..cc5ed2f --- /dev/null +++ b/Sala.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e929ddaa10f3f94bf7ca4adf30b0fd529aeef397d1eb3564d4683cc8670b4ca6 +size 72569056 diff --git a/Sala.i1-IQ3_XXS.gguf b/Sala.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..71db73e --- /dev/null +++ b/Sala.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d870f371bfe9928ac377cb272e31c07042771ee226d6fdffb3dc0270cc7ddeb +size 64788640 diff --git a/Sala.i1-IQ4_NL.gguf b/Sala.i1-IQ4_NL.gguf new file mode 100644 index 0000000..256f072 --- /dev/null +++ b/Sala.i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2b078647fb336e31f5bd5bcebc656c06922303357b251ee8f4504629b6300bf +size 84844768 diff --git a/Sala.i1-IQ4_XS.gguf b/Sala.i1-IQ4_XS.gguf new file mode 100644 index 0000000..d9a702d --- /dev/null +++ b/Sala.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1951417d3d17c3186db8edc79144f2a0224a38e872b3b58949be77fc2576adbe +size 82190560 diff --git a/Sala.i1-Q2_K.gguf b/Sala.i1-Q2_K.gguf new file mode 100644 index 0000000..addcc1e --- /dev/null +++ b/Sala.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b55ea6a60bacb721b27e598810ad54235e3543a3fad6394ab2ec3480ad700b25 +size 68532448 diff --git a/Sala.i1-Q2_K_S.gguf b/Sala.i1-Q2_K_S.gguf new file mode 100644 index 0000000..6e45b31 --- /dev/null +++ b/Sala.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02f5ac9ceb3d606c9d41ebe0d21c3fede923ce43f495a27d408dcda015f7bb63 +size 65491168 diff --git a/Sala.i1-Q3_K_L.gguf b/Sala.i1-Q3_K_L.gguf new file mode 100644 index 0000000..f214560 --- /dev/null +++ b/Sala.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d035d7f40ff4a6b93ba8ba58dc611b20ea599c4bd3b64a00eceb2c30a150f3e +size 85508320 diff --git a/Sala.i1-Q3_K_M.gguf b/Sala.i1-Q3_K_M.gguf new file mode 100644 index 0000000..d337e21 --- /dev/null +++ b/Sala.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67f6a2053f326a913ec8363f69342d6e818519547f3cd161befbfc6fdde2e5c6 +size 81084640 diff --git a/Sala.i1-Q3_K_S.gguf b/Sala.i1-Q3_K_S.gguf new file mode 100644 index 0000000..7275f4e --- /dev/null +++ b/Sala.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2094aee264c36bf65b5e66c916ddd778d197404f61174612cbd648cc5218e917 +size 73564384 diff --git a/Sala.i1-Q4_0.gguf b/Sala.i1-Q4_0.gguf new file mode 100644 index 0000000..2ee11f7 --- /dev/null +++ b/Sala.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eefd0f3ed898f2546f268ed05e2dbb5e3e07ce31af548092d2f2bc74c65154dd +size 84992224 diff --git a/Sala.i1-Q4_1.gguf b/Sala.i1-Q4_1.gguf new file mode 100644 index 0000000..06a3749 --- /dev/null +++ b/Sala.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df454884a1b3025a8242f7c5d933ae6fd53b0fa317ca35521aa9bca2fde9e6a0 +size 90153184 diff --git a/Sala.i1-Q4_K_M.gguf b/Sala.i1-Q4_K_M.gguf new file mode 100644 index 0000000..a43bf0e --- /dev/null +++ b/Sala.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ae17e6e59b30f97f5c4195bcea4922144c59b15e4dbce5d1004e2887eb19502 +size 91148512 diff --git a/Sala.i1-Q4_K_S.gguf b/Sala.i1-Q4_K_S.gguf new file mode 100644 index 0000000..e416ab5 --- /dev/null +++ b/Sala.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fedfcc7e64d6dc48d1d95921bbe9444506ceee5e098d292b604e9d6732d16cf7 +size 85139680 diff --git a/Sala.i1-Q5_K_M.gguf b/Sala.i1-Q5_K_M.gguf new file mode 100644 index 0000000..802552e --- /dev/null +++ b/Sala.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78ed1d283f80b9deb895d456f63574b61898a5874788f0ae871a05c7d4f72775 +size 100161760 diff --git a/Sala.i1-Q5_K_S.gguf b/Sala.i1-Q5_K_S.gguf new file mode 100644 index 0000000..5d8fe3a --- /dev/null +++ b/Sala.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:014976ae18c58bd790a80c11b1b39731fc053cab407da7db75b65257658ef9a5 +size 95461600 diff --git a/Sala.i1-Q6_K.gguf b/Sala.i1-Q6_K.gguf new file mode 100644 index 0000000..0bbe699 --- /dev/null +++ b/Sala.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:309e8f365d76ec1f0fea62ebe9b79541f673cd5d81e7bb0857fc314fdfa4ffff +size 106741984 diff --git a/Sala.imatrix.gguf b/Sala.imatrix.gguf new file mode 100644 index 0000000..dce799e --- /dev/null +++ b/Sala.imatrix.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7101b0826e05c9dde1ec79d07640abf7ff9f4c7d7866d1a8c5f04cdb2f1618ce +size 265664