commit 29fbc80af1d799758f10286aad38f71473bf2fd6 Author: ModelHub XC Date: Mon May 4 17:14:44 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/zephyr-dpo-v2-i1-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..b1b7a57 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,58 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +zephyr-dpo-v2.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs 
-text +zephyr-dpo-v2.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +zephyr-dpo-v2.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +zephyr-dpo-v2.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +zephyr-dpo-v2.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +zephyr-dpo-v2.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +zephyr-dpo-v2.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +zephyr-dpo-v2.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text +zephyr-dpo-v2.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +zephyr-dpo-v2.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +zephyr-dpo-v2.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +zephyr-dpo-v2.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +zephyr-dpo-v2.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +zephyr-dpo-v2.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +zephyr-dpo-v2.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +zephyr-dpo-v2.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +zephyr-dpo-v2.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +zephyr-dpo-v2.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +zephyr-dpo-v2.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +zephyr-dpo-v2.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +zephyr-dpo-v2.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +zephyr-dpo-v2.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..e38f82f --- /dev/null +++ b/README.md @@ -0,0 +1,84 @@ +--- +base_model: BarraHome/zephyr-dpo-v2 +datasets: +- jondurbin/truthy-dpo-v0.1 +- BarraHome/ultrafeedback_binarized +language: +- en +- es +library_name: transformers +license: mit +quantized_by: mradermacher +tags: +- text-generation-inference +- transformers +- unsloth +- mistral +- trl +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/BarraHome/zephyr-dpo-v2 + + +static quants are available at https://huggingface.co/mradermacher/zephyr-dpo-v2-GGUF +## 
Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similar-sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/zephyr-dpo-v2-i1-GGUF/resolve/main/zephyr-dpo-v2.i1-IQ1_S.gguf) | i1-IQ1_S | 1.7 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/zephyr-dpo-v2-i1-GGUF/resolve/main/zephyr-dpo-v2.i1-IQ1_M.gguf) | i1-IQ1_M | 1.9 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/zephyr-dpo-v2-i1-GGUF/resolve/main/zephyr-dpo-v2.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 2.1 | | +| [GGUF](https://huggingface.co/mradermacher/zephyr-dpo-v2-i1-GGUF/resolve/main/zephyr-dpo-v2.i1-IQ2_XS.gguf) | i1-IQ2_XS | 2.3 | | +| [GGUF](https://huggingface.co/mradermacher/zephyr-dpo-v2-i1-GGUF/resolve/main/zephyr-dpo-v2.i1-IQ2_S.gguf) | i1-IQ2_S | 2.4 | | +| [GGUF](https://huggingface.co/mradermacher/zephyr-dpo-v2-i1-GGUF/resolve/main/zephyr-dpo-v2.i1-IQ2_M.gguf) | i1-IQ2_M | 2.6 | | +| [GGUF](https://huggingface.co/mradermacher/zephyr-dpo-v2-i1-GGUF/resolve/main/zephyr-dpo-v2.i1-Q2_K_S.gguf) | i1-Q2_K_S | 2.6 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/zephyr-dpo-v2-i1-GGUF/resolve/main/zephyr-dpo-v2.i1-Q2_K.gguf) | i1-Q2_K | 2.8 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/zephyr-dpo-v2-i1-GGUF/resolve/main/zephyr-dpo-v2.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 2.9 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/zephyr-dpo-v2-i1-GGUF/resolve/main/zephyr-dpo-v2.i1-IQ3_XS.gguf) | i1-IQ3_XS | 3.1 | | +| [GGUF](https://huggingface.co/mradermacher/zephyr-dpo-v2-i1-GGUF/resolve/main/zephyr-dpo-v2.i1-Q3_K_S.gguf) | i1-Q3_K_S | 3.3 | IQ3_XS probably better | +| 
[GGUF](https://huggingface.co/mradermacher/zephyr-dpo-v2-i1-GGUF/resolve/main/zephyr-dpo-v2.i1-IQ3_S.gguf) | i1-IQ3_S | 3.3 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/zephyr-dpo-v2-i1-GGUF/resolve/main/zephyr-dpo-v2.i1-IQ3_M.gguf) | i1-IQ3_M | 3.4 | | +| [GGUF](https://huggingface.co/mradermacher/zephyr-dpo-v2-i1-GGUF/resolve/main/zephyr-dpo-v2.i1-Q3_K_M.gguf) | i1-Q3_K_M | 3.6 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/zephyr-dpo-v2-i1-GGUF/resolve/main/zephyr-dpo-v2.i1-Q3_K_L.gguf) | i1-Q3_K_L | 3.9 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/zephyr-dpo-v2-i1-GGUF/resolve/main/zephyr-dpo-v2.i1-IQ4_XS.gguf) | i1-IQ4_XS | 4.0 | | +| [GGUF](https://huggingface.co/mradermacher/zephyr-dpo-v2-i1-GGUF/resolve/main/zephyr-dpo-v2.i1-Q4_0.gguf) | i1-Q4_0 | 4.2 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/zephyr-dpo-v2-i1-GGUF/resolve/main/zephyr-dpo-v2.i1-Q4_K_S.gguf) | i1-Q4_K_S | 4.2 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/zephyr-dpo-v2-i1-GGUF/resolve/main/zephyr-dpo-v2.i1-Q4_K_M.gguf) | i1-Q4_K_M | 4.5 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/zephyr-dpo-v2-i1-GGUF/resolve/main/zephyr-dpo-v2.i1-Q5_K_S.gguf) | i1-Q5_K_S | 5.1 | | +| [GGUF](https://huggingface.co/mradermacher/zephyr-dpo-v2-i1-GGUF/resolve/main/zephyr-dpo-v2.i1-Q5_K_M.gguf) | i1-Q5_K_M | 5.2 | | +| [GGUF](https://huggingface.co/mradermacher/zephyr-dpo-v2-i1-GGUF/resolve/main/zephyr-dpo-v2.i1-Q6_K.gguf) | i1-Q6_K | 6.0 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to 
+questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..6831e42 --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cf85b25f74b3d0b4339931cf68d646ff66cd0ecbbb81936c47010a8bd30ad4f +size 4988157 diff --git a/zephyr-dpo-v2.i1-IQ1_M.gguf b/zephyr-dpo-v2.i1-IQ1_M.gguf new file mode 100644 index 0000000..69b3145 --- /dev/null +++ b/zephyr-dpo-v2.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:255160c09be4c5b795946a6188f27a973b0bd4c44495012965bf81330f6e74a2 +size 1754448064 diff --git a/zephyr-dpo-v2.i1-IQ1_S.gguf b/zephyr-dpo-v2.i1-IQ1_S.gguf new file mode 100644 index 0000000..25ee3b5 --- /dev/null +++ b/zephyr-dpo-v2.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a07f105b384752aae6db2bd9735ce10c5e5689ff339112d658decc835a8d9c4 +size 1612103872 diff --git a/zephyr-dpo-v2.i1-IQ2_M.gguf b/zephyr-dpo-v2.i1-IQ2_M.gguf new file mode 100644 index 0000000..4bd045e --- /dev/null +++ b/zephyr-dpo-v2.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c36f8a442dd34d4bfeebc54c49b787a0dc12de41f870ead070e2906a11d64305 +size 2500714688 diff --git a/zephyr-dpo-v2.i1-IQ2_S.gguf b/zephyr-dpo-v2.i1-IQ2_S.gguf new file mode 100644 index 0000000..cf063be --- /dev/null +++ b/zephyr-dpo-v2.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:63da66fbb4008ba16d6c5ed06e3cc9e447d084a4ca72c255dba3efcaaac7435c +size 2310922432 diff --git a/zephyr-dpo-v2.i1-IQ2_XS.gguf b/zephyr-dpo-v2.i1-IQ2_XS.gguf new file mode 100644 index 0000000..4135b03 --- /dev/null +++ b/zephyr-dpo-v2.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecd5cc6d318b6f4ea5c38de3e3edd31d41f54ef2c224723dd6178a8c5d1393f9 +size 2198257856 diff --git a/zephyr-dpo-v2.i1-IQ2_XXS.gguf b/zephyr-dpo-v2.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..30446aa --- /dev/null +++ b/zephyr-dpo-v2.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c070ad1886a7c1d6edb4f3ea2fff5837a3fa5a95fbf780807115dce548657d81 +size 1991688384 diff --git a/zephyr-dpo-v2.i1-IQ3_M.gguf b/zephyr-dpo-v2.i1-IQ3_M.gguf new file mode 100644 index 0000000..3aa2f41 --- /dev/null +++ b/zephyr-dpo-v2.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ad255502f649bcb066bb04f13bc3098859c28c37c2a6be6d83bea7c723e084d +size 3284893888 diff --git a/zephyr-dpo-v2.i1-IQ3_S.gguf b/zephyr-dpo-v2.i1-IQ3_S.gguf new file mode 100644 index 0000000..7ed2e0e --- /dev/null +++ b/zephyr-dpo-v2.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99097dd25d90fc76bbc5de0363d570a2d9d16d1b73dc78ace33f37ba7ac2ce65 +size 3182395584 diff --git a/zephyr-dpo-v2.i1-IQ3_XS.gguf b/zephyr-dpo-v2.i1-IQ3_XS.gguf new file mode 100644 index 0000000..fbe096a --- /dev/null +++ b/zephyr-dpo-v2.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bf479736b0f5932a264a048d6702da0f826c6e99bc60c66eefee06187f52067 +size 3018817728 diff --git a/zephyr-dpo-v2.i1-IQ3_XXS.gguf b/zephyr-dpo-v2.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..560cd31 --- /dev/null +++ b/zephyr-dpo-v2.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cff84d87645fff54c9fa96e047c9ffd8710142ac80568fd24b08cf7475be91d9 +size 
2827346112 diff --git a/zephyr-dpo-v2.i1-IQ4_XS.gguf b/zephyr-dpo-v2.i1-IQ4_XS.gguf new file mode 100644 index 0000000..dbfff9d --- /dev/null +++ b/zephyr-dpo-v2.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f555c194d0600e6bceee57d0669a45831138708e9e27c0c288aa77906d7b3068 +size 3907690688 diff --git a/zephyr-dpo-v2.i1-Q2_K.gguf b/zephyr-dpo-v2.i1-Q2_K.gguf new file mode 100644 index 0000000..e7089f9 --- /dev/null +++ b/zephyr-dpo-v2.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ce3bb5d2ec45b937eeb47af5de643a806e6330d3761cbe218ac20927c0d33d9 +size 2719244480 diff --git a/zephyr-dpo-v2.i1-Q2_K_S.gguf b/zephyr-dpo-v2.i1-Q2_K_S.gguf new file mode 100644 index 0000000..8b5bf0e --- /dev/null +++ b/zephyr-dpo-v2.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6383780c7c2b9364a583bd247eeef96c2e0e3283a9a62ff6d66a3350b1d446be +size 2528927936 diff --git a/zephyr-dpo-v2.i1-Q3_K_L.gguf b/zephyr-dpo-v2.i1-Q3_K_L.gguf new file mode 100644 index 0000000..c68ab47 --- /dev/null +++ b/zephyr-dpo-v2.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ad61cbf93ea9881e7fad3e40873d66cf91858d46bbc74d629133ef3d6e44322 +size 3822026944 diff --git a/zephyr-dpo-v2.i1-Q3_K_M.gguf b/zephyr-dpo-v2.i1-Q3_K_M.gguf new file mode 100644 index 0000000..794592b --- /dev/null +++ b/zephyr-dpo-v2.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87e7e94db344888bb073618f25c2d83497cc26e2d378984acbd70479e33076b4 +size 3518988480 diff --git a/zephyr-dpo-v2.i1-Q3_K_S.gguf b/zephyr-dpo-v2.i1-Q3_K_S.gguf new file mode 100644 index 0000000..b24a7c7 --- /dev/null +++ b/zephyr-dpo-v2.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5ed0184d510c0c67ff5c162d760e0ddbde0257de5c15580db8c5036f618e58b +size 3164569792 diff --git a/zephyr-dpo-v2.i1-Q4_0.gguf b/zephyr-dpo-v2.i1-Q4_0.gguf new 
file mode 100644 index 0000000..51c93de --- /dev/null +++ b/zephyr-dpo-v2.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b238006664f81d039f66f6eeccadee5eab14f384b2b1d5490c22d7f1a308938 +size 4123599040 diff --git a/zephyr-dpo-v2.i1-Q4_K_M.gguf b/zephyr-dpo-v2.i1-Q4_K_M.gguf new file mode 100644 index 0000000..701351a --- /dev/null +++ b/zephyr-dpo-v2.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:229f919e90b2df93fe6785ed08063faed7122c740260812f7e700903dc0ef5be +size 4368441536 diff --git a/zephyr-dpo-v2.i1-Q4_K_S.gguf b/zephyr-dpo-v2.i1-Q4_K_S.gguf new file mode 100644 index 0000000..82e14f1 --- /dev/null +++ b/zephyr-dpo-v2.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:658e6f5094f26ea39bc53932c1aba13e397e82faf6f89f4b8e94279bc16ce1af +size 4140376256 diff --git a/zephyr-dpo-v2.i1-Q5_K_M.gguf b/zephyr-dpo-v2.i1-Q5_K_M.gguf new file mode 100644 index 0000000..7368116 --- /dev/null +++ b/zephyr-dpo-v2.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fabb572d2bce2fc10824718113a74aff6aa6951111a7486440f19be83f9e45de +size 5131411648 diff --git a/zephyr-dpo-v2.i1-Q5_K_S.gguf b/zephyr-dpo-v2.i1-Q5_K_S.gguf new file mode 100644 index 0000000..7b13089 --- /dev/null +++ b/zephyr-dpo-v2.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2022f6eb9cc73c328458b4d6fb16eced43b187c81714d4b4b00fad7b5f49639b +size 4997718208 diff --git a/zephyr-dpo-v2.i1-Q6_K.gguf b/zephyr-dpo-v2.i1-Q6_K.gguf new file mode 100644 index 0000000..7fab280 --- /dev/null +++ b/zephyr-dpo-v2.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ca58186a015a2eb88dfa2e5b17df84f03bb788216de837602d435e7119ac144 +size 5942067392