commit abab13b375520dc4ff04d5c6097f80e114b1f9f8 Author: ModelHub XC Date: Fri May 1 02:28:00 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/Superswallow-7b-v0.3-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..b44e7a1 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,47 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +Superswallow-7b-v0.3.Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +Superswallow-7b-v0.3.Q3_K_S.gguf 
filter=lfs diff=lfs merge=lfs -text +Superswallow-7b-v0.3.Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Superswallow-7b-v0.3.Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Superswallow-7b-v0.3.Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Superswallow-7b-v0.3.Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Superswallow-7b-v0.3.Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +Superswallow-7b-v0.3.Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Superswallow-7b-v0.3.Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Superswallow-7b-v0.3.Q8_0.gguf filter=lfs diff=lfs merge=lfs -text +Superswallow-7b-v0.3.IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +Superswallow-7b-v0.3.f16.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..dba6f11 --- /dev/null +++ b/README.md @@ -0,0 +1,69 @@ +--- +base_model: nitky/Superswallow-7b-v0.3 +language: +- en +- ja +library_name: transformers +license: llama2 +model_type: llama +quantized_by: mradermacher +tags: +- mergekit +- merge +--- +## About + + + + + + +static quants of https://huggingface.co/nitky/Superswallow-7b-v0.3 + + +weighted/imatrix quants are available at https://huggingface.co/mradermacher/Superswallow-7b-v0.3-i1-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. 
IQ-quants are often preferable over similarly sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/Superswallow-7b-v0.3-GGUF/resolve/main/Superswallow-7b-v0.3.Q2_K.gguf) | Q2_K | 2.7 | | +| [GGUF](https://huggingface.co/mradermacher/Superswallow-7b-v0.3-GGUF/resolve/main/Superswallow-7b-v0.3.Q3_K_S.gguf) | Q3_K_S | 3.1 | | +| [GGUF](https://huggingface.co/mradermacher/Superswallow-7b-v0.3-GGUF/resolve/main/Superswallow-7b-v0.3.Q3_K_M.gguf) | Q3_K_M | 3.5 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/Superswallow-7b-v0.3-GGUF/resolve/main/Superswallow-7b-v0.3.Q3_K_L.gguf) | Q3_K_L | 3.8 | | +| [GGUF](https://huggingface.co/mradermacher/Superswallow-7b-v0.3-GGUF/resolve/main/Superswallow-7b-v0.3.IQ4_XS.gguf) | IQ4_XS | 3.8 | | +| [GGUF](https://huggingface.co/mradermacher/Superswallow-7b-v0.3-GGUF/resolve/main/Superswallow-7b-v0.3.Q4_K_S.gguf) | Q4_K_S | 4.0 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/Superswallow-7b-v0.3-GGUF/resolve/main/Superswallow-7b-v0.3.Q4_K_M.gguf) | Q4_K_M | 4.2 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/Superswallow-7b-v0.3-GGUF/resolve/main/Superswallow-7b-v0.3.Q5_K_S.gguf) | Q5_K_S | 4.8 | | +| [GGUF](https://huggingface.co/mradermacher/Superswallow-7b-v0.3-GGUF/resolve/main/Superswallow-7b-v0.3.Q5_K_M.gguf) | Q5_K_M | 5.0 | | +| [GGUF](https://huggingface.co/mradermacher/Superswallow-7b-v0.3-GGUF/resolve/main/Superswallow-7b-v0.3.Q6_K.gguf) | Q6_K | 5.7 | very good quality | +| [GGUF](https://huggingface.co/mradermacher/Superswallow-7b-v0.3-GGUF/resolve/main/Superswallow-7b-v0.3.Q8_0.gguf) | Q8_0 | 7.4 | fast, best quality | +| [GGUF](https://huggingface.co/mradermacher/Superswallow-7b-v0.3-GGUF/resolve/main/Superswallow-7b-v0.3.f16.gguf) | f16 | 13.8 | 16 bpw, overkill | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + 
+![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. + + diff --git a/Superswallow-7b-v0.3.IQ4_XS.gguf b/Superswallow-7b-v0.3.IQ4_XS.gguf new file mode 100644 index 0000000..94703e8 --- /dev/null +++ b/Superswallow-7b-v0.3.IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df741dc1a9244816dd63ca84b2c45ec233be0d9cd9eb43d97bfdd5f521d4b875 +size 3709643232 diff --git a/Superswallow-7b-v0.3.Q2_K.gguf b/Superswallow-7b-v0.3.Q2_K.gguf new file mode 100644 index 0000000..974d675 --- /dev/null +++ b/Superswallow-7b-v0.3.Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:682b42a818459cb854b9a5a754ffab2bd0fbf295e6d0f9c16eb901dbcd483ab9 +size 2585692128 diff --git a/Superswallow-7b-v0.3.Q3_K_L.gguf b/Superswallow-7b-v0.3.Q3_K_L.gguf new file mode 100644 index 0000000..18b47b6 --- /dev/null +++ b/Superswallow-7b-v0.3.Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c8f496fd0054937f3cfe1f2a00c44b5a01fe6082c28e6e6fe57d764fef20487 +size 3654588640 diff --git a/Superswallow-7b-v0.3.Q3_K_M.gguf b/Superswallow-7b-v0.3.Q3_K_M.gguf new file mode 100644 index 0000000..b0a1d0c --- /dev/null +++ b/Superswallow-7b-v0.3.Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4671aec27475822cf23ec803907214745efd78dac21f6a2bb08a597e2053c0b4 +size 3355482336 diff --git a/Superswallow-7b-v0.3.Q3_K_S.gguf b/Superswallow-7b-v0.3.Q3_K_S.gguf new file mode 100644 index 
0000000..c5c026f --- /dev/null +++ b/Superswallow-7b-v0.3.Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c0e4eb64f9c9b8b249001e2d94478814711fadcc495803d7da9a85850ca8b25 +size 3005782240 diff --git a/Superswallow-7b-v0.3.Q4_K_M.gguf b/Superswallow-7b-v0.3.Q4_K_M.gguf new file mode 100644 index 0000000..60a7178 --- /dev/null +++ b/Superswallow-7b-v0.3.Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f90d2e2c810d67efaad91f558f6091f7c89bc6cb14d03bd7b477e2a1d19591f +size 4144561632 diff --git a/Superswallow-7b-v0.3.Q4_K_S.gguf b/Superswallow-7b-v0.3.Q4_K_S.gguf new file mode 100644 index 0000000..0a3be99 --- /dev/null +++ b/Superswallow-7b-v0.3.Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:353072c8b2d38518a63d3a1327532494bba22d226f309c4f27a9ff4a461dd5ce +size 3920297440 diff --git a/Superswallow-7b-v0.3.Q5_K_M.gguf b/Superswallow-7b-v0.3.Q5_K_M.gguf new file mode 100644 index 0000000..108429c --- /dev/null +++ b/Superswallow-7b-v0.3.Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:465bc34b149c4c06692cb3926cae93f198db4162e30059b874af855114d89957 +size 4852436448 diff --git a/Superswallow-7b-v0.3.Q5_K_S.gguf b/Superswallow-7b-v0.3.Q5_K_S.gguf new file mode 100644 index 0000000..505a137 --- /dev/null +++ b/Superswallow-7b-v0.3.Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8044ade8e759181719a33368fd47e8c2a27cf3bb0c56d5a5ff4d70cfec611065 +size 4720971232 diff --git a/Superswallow-7b-v0.3.Q6_K.gguf b/Superswallow-7b-v0.3.Q6_K.gguf new file mode 100644 index 0000000..fffab68 --- /dev/null +++ b/Superswallow-7b-v0.3.Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3463ac060c0b3892b598483a0384e438c14ced4a57f9cce8ea0f73c5325c53b +size 5604553440 diff --git a/Superswallow-7b-v0.3.Q8_0.gguf b/Superswallow-7b-v0.3.Q8_0.gguf new file mode 100644 index 0000000..77283ec 
--- /dev/null +++ b/Superswallow-7b-v0.3.Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7eb79b6be2289fd24e3a387ba726613a17036e96fdcf468cda74938a25a9e3a1 +size 7258622176 diff --git a/Superswallow-7b-v0.3.f16.gguf b/Superswallow-7b-v0.3.f16.gguf new file mode 100644 index 0000000..c84bd2b --- /dev/null +++ b/Superswallow-7b-v0.3.f16.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6a58f2bd692daad1d72b26386b313563d79bd4f20f5ce9f77b50ed25f7eae4 +size 13661468896