commit 9b62b0b45c74f66bf9b2cccbca5c7f6c7b188ba2 Author: ModelHub XC Date: Sat Apr 11 18:55:02 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/Zeta-2-i1-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..19faa98 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +Zeta-2.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text 
+Zeta-2.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +Zeta-2.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +Zeta-2.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +Zeta-2.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +Zeta-2.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Zeta-2.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +Zeta-2.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text +Zeta-2.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +Zeta-2.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Zeta-2.i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +Zeta-2.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +Zeta-2.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +Zeta-2.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Zeta-2.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Zeta-2.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Zeta-2.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Zeta-2.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +Zeta-2.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +Zeta-2.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Zeta-2.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Zeta-2.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Zeta-2.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Zeta-2.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..127c5e9 --- /dev/null +++ b/README.md @@ -0,0 +1,90 @@ +--- +base_model: Zeta-DGC/Zeta-2 +datasets: +- DiamondGotCat/Zeta-2-Dataset +language: +- zho +- eng +- fra +- spa +- por +- deu +- ita +- rus +- jpn +- kor +- vie +- tha +- ara +library_name: transformers +license: mit +quantized_by: mradermacher +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/Zeta-DGC/Zeta-2 + + +static quants are available at https://huggingface.co/mradermacher/Zeta-2-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's 
+READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similarly sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/Zeta-2-i1-GGUF/resolve/main/Zeta-2.i1-IQ1_S.gguf) | i1-IQ1_S | 0.3 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/Zeta-2-i1-GGUF/resolve/main/Zeta-2.i1-IQ1_M.gguf) | i1-IQ1_M | 0.3 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/Zeta-2-i1-GGUF/resolve/main/Zeta-2.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 0.3 | | +| [GGUF](https://huggingface.co/mradermacher/Zeta-2-i1-GGUF/resolve/main/Zeta-2.i1-IQ2_XS.gguf) | i1-IQ2_XS | 0.3 | | +| [GGUF](https://huggingface.co/mradermacher/Zeta-2-i1-GGUF/resolve/main/Zeta-2.i1-IQ2_S.gguf) | i1-IQ2_S | 0.3 | | +| [GGUF](https://huggingface.co/mradermacher/Zeta-2-i1-GGUF/resolve/main/Zeta-2.i1-IQ2_M.gguf) | i1-IQ2_M | 0.3 | | +| [GGUF](https://huggingface.co/mradermacher/Zeta-2-i1-GGUF/resolve/main/Zeta-2.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 0.3 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/Zeta-2-i1-GGUF/resolve/main/Zeta-2.i1-Q2_K_S.gguf) | i1-Q2_K_S | 0.3 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/Zeta-2-i1-GGUF/resolve/main/Zeta-2.i1-Q2_K.gguf) | i1-Q2_K | 0.3 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/Zeta-2-i1-GGUF/resolve/main/Zeta-2.i1-IQ3_XS.gguf) | i1-IQ3_XS | 0.4 | | +| [GGUF](https://huggingface.co/mradermacher/Zeta-2-i1-GGUF/resolve/main/Zeta-2.i1-IQ3_S.gguf) | i1-IQ3_S | 0.4 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/Zeta-2-i1-GGUF/resolve/main/Zeta-2.i1-Q3_K_S.gguf) | i1-Q3_K_S | 0.4 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/Zeta-2-i1-GGUF/resolve/main/Zeta-2.i1-IQ3_M.gguf) | i1-IQ3_M | 
0.4 | | +| [GGUF](https://huggingface.co/mradermacher/Zeta-2-i1-GGUF/resolve/main/Zeta-2.i1-Q3_K_M.gguf) | i1-Q3_K_M | 0.4 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/Zeta-2-i1-GGUF/resolve/main/Zeta-2.i1-Q3_K_L.gguf) | i1-Q3_K_L | 0.4 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/Zeta-2-i1-GGUF/resolve/main/Zeta-2.i1-IQ4_XS.gguf) | i1-IQ4_XS | 0.4 | | +| [GGUF](https://huggingface.co/mradermacher/Zeta-2-i1-GGUF/resolve/main/Zeta-2.i1-IQ4_NL.gguf) | i1-IQ4_NL | 0.4 | prefer IQ4_XS | +| [GGUF](https://huggingface.co/mradermacher/Zeta-2-i1-GGUF/resolve/main/Zeta-2.i1-Q4_0.gguf) | i1-Q4_0 | 0.4 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/Zeta-2-i1-GGUF/resolve/main/Zeta-2.i1-Q4_K_S.gguf) | i1-Q4_K_S | 0.4 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/Zeta-2-i1-GGUF/resolve/main/Zeta-2.i1-Q4_K_M.gguf) | i1-Q4_K_M | 0.4 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/Zeta-2-i1-GGUF/resolve/main/Zeta-2.i1-Q4_1.gguf) | i1-Q4_1 | 0.4 | | +| [GGUF](https://huggingface.co/mradermacher/Zeta-2-i1-GGUF/resolve/main/Zeta-2.i1-Q5_K_S.gguf) | i1-Q5_K_S | 0.4 | | +| [GGUF](https://huggingface.co/mradermacher/Zeta-2-i1-GGUF/resolve/main/Zeta-2.i1-Q5_K_M.gguf) | i1-Q5_K_M | 0.5 | | +| [GGUF](https://huggingface.co/mradermacher/Zeta-2-i1-GGUF/resolve/main/Zeta-2.i1-Q6_K.gguf) | i1-Q6_K | 0.5 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. 
+ +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/Zeta-2.i1-IQ1_M.gguf b/Zeta-2.i1-IQ1_M.gguf new file mode 100644 index 0000000..9594e5c --- /dev/null +++ b/Zeta-2.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:925d564316350bb818e5a0fd9d191e3766beb3db1c891ac3fb2586888c2c8142 +size 185523680 diff --git a/Zeta-2.i1-IQ1_S.gguf b/Zeta-2.i1-IQ1_S.gguf new file mode 100644 index 0000000..d7049f6 --- /dev/null +++ b/Zeta-2.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60d8d02b018e8aeea3251d2ba6edb121bc2b87213055dee2a6e3df91edc1cc08 +size 179680736 diff --git a/Zeta-2.i1-IQ2_M.gguf b/Zeta-2.i1-IQ2_M.gguf new file mode 100644 index 0000000..c61a2bb --- /dev/null +++ b/Zeta-2.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26b44f2de51b500371b8adcfa209b3f892a97b28a83dd5cbaf705f18be1c31cf +size 218602976 diff --git a/Zeta-2.i1-IQ2_S.gguf b/Zeta-2.i1-IQ2_S.gguf new file mode 100644 index 0000000..3fa14a1 --- /dev/null +++ b/Zeta-2.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aad15c08bbeb8a44cea2cdb1266be9767fd4ab13729cfc7ce33e0766a799a6e8 +size 210812384 diff --git a/Zeta-2.i1-IQ2_XS.gguf b/Zeta-2.i1-IQ2_XS.gguf new file mode 100644 index 0000000..ac0e89f --- /dev/null +++ b/Zeta-2.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f81010d27b269ee631ab27dd255e8b7669a5f88e2d8c1d3246e9302d01a0d5ed +size 203838944 diff --git a/Zeta-2.i1-IQ2_XXS.gguf b/Zeta-2.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..b507aa4 
--- /dev/null +++ b/Zeta-2.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3e6c0d7ecb26f2c8974d472f96fe35677664a1f1c8ca01914a5a9072bd239a2 +size 195261920 diff --git a/Zeta-2.i1-IQ3_M.gguf b/Zeta-2.i1-IQ3_M.gguf new file mode 100644 index 0000000..7fa8f3f --- /dev/null +++ b/Zeta-2.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff277c16537d6315676a8a88ca661eddda352190c43615d29a86294c866fb4cf +size 274366944 diff --git a/Zeta-2.i1-IQ3_S.gguf b/Zeta-2.i1-IQ3_S.gguf new file mode 100644 index 0000000..5008ce0 --- /dev/null +++ b/Zeta-2.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ab33bb5ead360c2b28ff6d88821c8db003f815ea6a1adc484086f14167e7aed +size 266533344 diff --git a/Zeta-2.i1-IQ3_XS.gguf b/Zeta-2.i1-IQ3_XS.gguf new file mode 100644 index 0000000..b959134 --- /dev/null +++ b/Zeta-2.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9437d6686159599f7a15c0ce7cf4e134933e1831e4d16bb0059c40ed8fdfffa7 +size 259308000 diff --git a/Zeta-2.i1-IQ3_XXS.gguf b/Zeta-2.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..9d3cb3a --- /dev/null +++ b/Zeta-2.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28eeb5d3018296a8a1e0ddc139468761b18e23f1426cd839399a6b746fdc9d15 +size 229453280 diff --git a/Zeta-2.i1-IQ4_NL.gguf b/Zeta-2.i1-IQ4_NL.gguf new file mode 100644 index 0000000..65752b9 --- /dev/null +++ b/Zeta-2.i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:513e98e9eeefe4f845ccafdbd66b373a3c0d30850055da5ad191ea81da2e8bad +size 307476960 diff --git a/Zeta-2.i1-IQ4_XS.gguf b/Zeta-2.i1-IQ4_XS.gguf new file mode 100644 index 0000000..e6a0a01 --- /dev/null +++ b/Zeta-2.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73d0e4d10919ef29c980200228751feeb13dab816ff07d80b208bcd652718982 +size 297843168 diff --git 
a/Zeta-2.i1-Q2_K.gguf b/Zeta-2.i1-Q2_K.gguf new file mode 100644 index 0000000..0f20a16 --- /dev/null +++ b/Zeta-2.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3fa67a10f855107573befb4d833587f3ed1e3a925536cf514fcaf9bbc9b13f6 +size 247364064 diff --git a/Zeta-2.i1-Q2_K_S.gguf b/Zeta-2.i1-Q2_K_S.gguf new file mode 100644 index 0000000..418c557 --- /dev/null +++ b/Zeta-2.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:184bc76bc7076ac556bd44d08e12a714c2493c2eb559793bed645c45a488ffe1 +size 237251040 diff --git a/Zeta-2.i1-Q3_K_L.gguf b/Zeta-2.i1-Q3_K_L.gguf new file mode 100644 index 0000000..bb20c78 --- /dev/null +++ b/Zeta-2.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f29014f8a31ed56506f7217dc9a5d5e1d01fae577aa1aa0c947be6a46848393 +size 297351648 diff --git a/Zeta-2.i1-Q3_K_M.gguf b/Zeta-2.i1-Q3_K_M.gguf new file mode 100644 index 0000000..8550ee7 --- /dev/null +++ b/Zeta-2.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d18db52b201fecdd9f437f7bbd851f0cdae86097a1ad9d76ce81d48a41f8ccb1 +size 283032032 diff --git a/Zeta-2.i1-Q3_K_S.gguf b/Zeta-2.i1-Q3_K_S.gguf new file mode 100644 index 0000000..3515bd4 --- /dev/null +++ b/Zeta-2.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f25ff3e54c3dd37c11966e2490e7e4d73f33932b3aac0eeda97f32ed71e245d +size 266533344 diff --git a/Zeta-2.i1-Q4_0.gguf b/Zeta-2.i1-Q4_0.gguf new file mode 100644 index 0000000..f77f03d --- /dev/null +++ b/Zeta-2.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54c0483131c45224a2e7b79360d545edb6973a5bca03801516074187b29339c7 +size 308017632 diff --git a/Zeta-2.i1-Q4_1.gguf b/Zeta-2.i1-Q4_1.gguf new file mode 100644 index 0000000..50ce340 --- /dev/null +++ b/Zeta-2.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:e53ad14bfc8dc0ab731cd27ec66818f0314283ad05e8c6f3e40d3ff0add0be9d +size 326744544 diff --git a/Zeta-2.i1-Q4_K_M.gguf b/Zeta-2.i1-Q4_K_M.gguf new file mode 100644 index 0000000..e607a1a --- /dev/null +++ b/Zeta-2.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0700487f9cbfc6b205a51d44d1b3f6febab1b9d76342af42d0213f0a2dd65f75 +size 319642080 diff --git a/Zeta-2.i1-Q4_K_S.gguf b/Zeta-2.i1-Q4_K_S.gguf new file mode 100644 index 0000000..ee30635 --- /dev/null +++ b/Zeta-2.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e9593b931a95ba1a8274ff39f832e6aae9e044ba7463005a8b45a0426b679c5 +size 309082592 diff --git a/Zeta-2.i1-Q5_K_M.gguf b/Zeta-2.i1-Q5_K_M.gguf new file mode 100644 index 0000000..21b65c1 --- /dev/null +++ b/Zeta-2.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e87d7d262c5be6c1a18ec74f28b7cfcea63e1282707ab89cb096277fa41f7df +size 352279008 diff --git a/Zeta-2.i1-Q5_K_S.gguf b/Zeta-2.i1-Q5_K_S.gguf new file mode 100644 index 0000000..662df08 --- /dev/null +++ b/Zeta-2.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff2c8a97389a4cbc57a38914aeb54b0b9a1ae70395c89804bf74a034c1b5e208 +size 346012128 diff --git a/Zeta-2.i1-Q6_K.gguf b/Zeta-2.i1-Q6_K.gguf new file mode 100644 index 0000000..8ac8c68 --- /dev/null +++ b/Zeta-2.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1385fe7aa80aec186575f3284b6f288bc5f39d53f014d30953574f60bb63e77b +size 386955744 diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..fa1bd0d --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f78479323630416c06a676af705c239fcf912187a65f53fafa7413be5751285 +size 865717