From d782287a7025c782938d7645bd24195397d5de81 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Sat, 11 Apr 2026 11:39:02 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mradermacher/Qwen2-0.5B-DPO-i1-GGUF Source: Original Platform --- .gitattributes | 60 ++++++++++++++++++++++++ Qwen2-0.5B-DPO.i1-IQ1_M.gguf | 3 ++ Qwen2-0.5B-DPO.i1-IQ1_S.gguf | 3 ++ Qwen2-0.5B-DPO.i1-IQ2_M.gguf | 3 ++ Qwen2-0.5B-DPO.i1-IQ2_S.gguf | 3 ++ Qwen2-0.5B-DPO.i1-IQ2_XS.gguf | 3 ++ Qwen2-0.5B-DPO.i1-IQ2_XXS.gguf | 3 ++ Qwen2-0.5B-DPO.i1-IQ3_M.gguf | 3 ++ Qwen2-0.5B-DPO.i1-IQ3_S.gguf | 3 ++ Qwen2-0.5B-DPO.i1-IQ3_XS.gguf | 3 ++ Qwen2-0.5B-DPO.i1-IQ3_XXS.gguf | 3 ++ Qwen2-0.5B-DPO.i1-IQ4_NL.gguf | 3 ++ Qwen2-0.5B-DPO.i1-IQ4_XS.gguf | 3 ++ Qwen2-0.5B-DPO.i1-Q2_K.gguf | 3 ++ Qwen2-0.5B-DPO.i1-Q2_K_S.gguf | 3 ++ Qwen2-0.5B-DPO.i1-Q3_K_L.gguf | 3 ++ Qwen2-0.5B-DPO.i1-Q3_K_M.gguf | 3 ++ Qwen2-0.5B-DPO.i1-Q3_K_S.gguf | 3 ++ Qwen2-0.5B-DPO.i1-Q4_0.gguf | 3 ++ Qwen2-0.5B-DPO.i1-Q4_1.gguf | 3 ++ Qwen2-0.5B-DPO.i1-Q4_K_M.gguf | 3 ++ Qwen2-0.5B-DPO.i1-Q4_K_S.gguf | 3 ++ Qwen2-0.5B-DPO.i1-Q5_K_M.gguf | 3 ++ Qwen2-0.5B-DPO.i1-Q5_K_S.gguf | 3 ++ Qwen2-0.5B-DPO.i1-Q6_K.gguf | 3 ++ README.md | 86 ++++++++++++++++++++++++++++++++++ imatrix.dat | 3 ++ 27 files changed, 221 insertions(+) create mode 100644 .gitattributes create mode 100644 Qwen2-0.5B-DPO.i1-IQ1_M.gguf create mode 100644 Qwen2-0.5B-DPO.i1-IQ1_S.gguf create mode 100644 Qwen2-0.5B-DPO.i1-IQ2_M.gguf create mode 100644 Qwen2-0.5B-DPO.i1-IQ2_S.gguf create mode 100644 Qwen2-0.5B-DPO.i1-IQ2_XS.gguf create mode 100644 Qwen2-0.5B-DPO.i1-IQ2_XXS.gguf create mode 100644 Qwen2-0.5B-DPO.i1-IQ3_M.gguf create mode 100644 Qwen2-0.5B-DPO.i1-IQ3_S.gguf create mode 100644 Qwen2-0.5B-DPO.i1-IQ3_XS.gguf create mode 100644 Qwen2-0.5B-DPO.i1-IQ3_XXS.gguf create mode 100644 Qwen2-0.5B-DPO.i1-IQ4_NL.gguf create mode 100644 Qwen2-0.5B-DPO.i1-IQ4_XS.gguf create mode 100644 Qwen2-0.5B-DPO.i1-Q2_K.gguf create mode 100644 Qwen2-0.5B-DPO.i1-Q2_K_S.gguf create mode 100644 Qwen2-0.5B-DPO.i1-Q3_K_L.gguf create mode 100644 Qwen2-0.5B-DPO.i1-Q3_K_M.gguf create mode 100644 Qwen2-0.5B-DPO.i1-Q3_K_S.gguf create mode 100644 Qwen2-0.5B-DPO.i1-Q4_0.gguf create mode 100644 Qwen2-0.5B-DPO.i1-Q4_1.gguf create mode 100644 Qwen2-0.5B-DPO.i1-Q4_K_M.gguf create mode 100644 Qwen2-0.5B-DPO.i1-Q4_K_S.gguf create mode 100644 Qwen2-0.5B-DPO.i1-Q5_K_M.gguf create mode 100644 Qwen2-0.5B-DPO.i1-Q5_K_S.gguf create mode 100644 Qwen2-0.5B-DPO.i1-Q6_K.gguf create mode 100644 README.md create mode 100644 imatrix.dat diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..1a9d51e --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +Qwen2-0.5B-DPO.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +Qwen2-0.5B-DPO.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +Qwen2-0.5B-DPO.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +Qwen2-0.5B-DPO.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +Qwen2-0.5B-DPO.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +Qwen2-0.5B-DPO.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Qwen2-0.5B-DPO.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +Qwen2-0.5B-DPO.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text +Qwen2-0.5B-DPO.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +Qwen2-0.5B-DPO.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Qwen2-0.5B-DPO.i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +Qwen2-0.5B-DPO.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +Qwen2-0.5B-DPO.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +Qwen2-0.5B-DPO.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Qwen2-0.5B-DPO.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Qwen2-0.5B-DPO.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Qwen2-0.5B-DPO.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Qwen2-0.5B-DPO.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +Qwen2-0.5B-DPO.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +Qwen2-0.5B-DPO.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Qwen2-0.5B-DPO.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Qwen2-0.5B-DPO.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Qwen2-0.5B-DPO.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Qwen2-0.5B-DPO.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/Qwen2-0.5B-DPO.i1-IQ1_M.gguf b/Qwen2-0.5B-DPO.i1-IQ1_M.gguf new file mode 100644 index 0000000..8e429cd --- /dev/null +++ b/Qwen2-0.5B-DPO.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfdeb96baa10e06acafba4fa7a5cd3dd8f5a070438c1948e25027ba6db7e3862 +size 317972832 diff --git a/Qwen2-0.5B-DPO.i1-IQ1_S.gguf b/Qwen2-0.5B-DPO.i1-IQ1_S.gguf new file mode 100644 index 0000000..6768eca --- /dev/null +++ b/Qwen2-0.5B-DPO.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a4d980ef93ba2000ccd7a4baa95a0bee005a1448bb48e7b5dce33e32f167d6e +size 315827808 diff --git a/Qwen2-0.5B-DPO.i1-IQ2_M.gguf b/Qwen2-0.5B-DPO.i1-IQ2_M.gguf new file mode 100644 index 0000000..30f7eda --- /dev/null +++ b/Qwen2-0.5B-DPO.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0a307339655d4419f2f19ebd479d14bf33ea40d87a4ab6c867e675bbf6c66b4 +size 328595808 diff --git a/Qwen2-0.5B-DPO.i1-IQ2_S.gguf b/Qwen2-0.5B-DPO.i1-IQ2_S.gguf new file mode 100644 index 0000000..265374e --- /dev/null +++ b/Qwen2-0.5B-DPO.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9f245feb88ec9584ed4dc2bae910878e889da0ed98ba7886a72898977cf375d +size 325735776 diff --git a/Qwen2-0.5B-DPO.i1-IQ2_XS.gguf b/Qwen2-0.5B-DPO.i1-IQ2_XS.gguf new file mode 100644 index 0000000..eb30781 --- /dev/null +++ b/Qwen2-0.5B-DPO.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd8c356e19c544096cb042a59181b317e70a28dd310c91368bb230ea3c86ba0d +size 324407904 diff --git a/Qwen2-0.5B-DPO.i1-IQ2_XXS.gguf b/Qwen2-0.5B-DPO.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..4983db7 --- /dev/null +++ b/Qwen2-0.5B-DPO.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20ee8e4f89c984f7889f06bc5d3851b709929fab0f818f7b52f7077f74fb516d +size 321547872 diff --git a/Qwen2-0.5B-DPO.i1-IQ3_M.gguf b/Qwen2-0.5B-DPO.i1-IQ3_M.gguf new file mode 100644 index 0000000..f2616d2 --- /dev/null +++ b/Qwen2-0.5B-DPO.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ccba3859f406bc8a4230e51ad5250b2caf33f2058e31b9361fe8ae5b5a37851 +size 342750816 diff --git a/Qwen2-0.5B-DPO.i1-IQ3_S.gguf b/Qwen2-0.5B-DPO.i1-IQ3_S.gguf new file mode 100644 index 0000000..8c2c8dd --- /dev/null +++ b/Qwen2-0.5B-DPO.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:574e4794ad707c7297fa18c47b39c009be0f14f894b37427036cae702f2e1f7a +size 338605920 diff --git a/Qwen2-0.5B-DPO.i1-IQ3_XS.gguf b/Qwen2-0.5B-DPO.i1-IQ3_XS.gguf new file mode 100644 index 0000000..11b001b --- /dev/null +++ b/Qwen2-0.5B-DPO.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9e5b6aef95b96bcda8b9e70ced6315eaa6f83d08c80e598675d2f5df0345e4c +size 338605920 diff --git a/Qwen2-0.5B-DPO.i1-IQ3_XXS.gguf b/Qwen2-0.5B-DPO.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..8867494 --- /dev/null +++ b/Qwen2-0.5B-DPO.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1924f9f58fd5c6330b98c254434a84e7f9fa287828010889b01450e185e517b5 +size 333703008 diff --git a/Qwen2-0.5B-DPO.i1-IQ4_NL.gguf b/Qwen2-0.5B-DPO.i1-IQ4_NL.gguf new file mode 100644 index 0000000..8a4c1e8 --- /dev/null +++ b/Qwen2-0.5B-DPO.i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e64711ad0513f313f504a57dd29bbe6f0777c58d571232cd4824f321da7b646 +size 352669536 diff --git a/Qwen2-0.5B-DPO.i1-IQ4_XS.gguf b/Qwen2-0.5B-DPO.i1-IQ4_XS.gguf new file mode 100644 index 0000000..806f3de --- /dev/null +++ b/Qwen2-0.5B-DPO.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d031295ba091835ad1e72e588c5845105cf8a48f13b227edcb422a61a176a996 +size 349400928 diff --git a/Qwen2-0.5B-DPO.i1-Q2_K.gguf b/Qwen2-0.5B-DPO.i1-Q2_K.gguf new file mode 100644 index 0000000..6930601 --- /dev/null +++ b/Qwen2-0.5B-DPO.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da3ee15fb07b7329de2d21b2b25b6c975a273338953929f7fbd8b3ace8ea7f11 +size 338605920 diff --git a/Qwen2-0.5B-DPO.i1-Q2_K_S.gguf b/Qwen2-0.5B-DPO.i1-Q2_K_S.gguf new file mode 100644 index 0000000..7063b11 --- /dev/null +++ b/Qwen2-0.5B-DPO.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f83f0beacd3dc7bd7cd8bfa2ff0a4d7aeb4528a006cb495b5a433496ca007f73 +size 331047264 diff --git a/Qwen2-0.5B-DPO.i1-Q3_K_L.gguf b/Qwen2-0.5B-DPO.i1-Q3_K_L.gguf new file mode 100644 index 0000000..24a98a5 --- /dev/null +++ b/Qwen2-0.5B-DPO.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1cf812d067ef9273bb50edcb1555d2cc94d87375e692e0d3f957cd88cbc3081 +size 369356640 diff --git a/Qwen2-0.5B-DPO.i1-Q3_K_M.gguf b/Qwen2-0.5B-DPO.i1-Q3_K_M.gguf new file mode 100644 index 0000000..97851c9 --- /dev/null +++ b/Qwen2-0.5B-DPO.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2fa508ea5f1bf26ab77aa93ee104d3448c88ee3ec7514dadb55233601c71037 +size 355465056 diff --git a/Qwen2-0.5B-DPO.i1-Q3_K_S.gguf b/Qwen2-0.5B-DPO.i1-Q3_K_S.gguf new file mode 100644 index 0000000..137186f --- /dev/null +++ b/Qwen2-0.5B-DPO.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2061ac355128fc5e60747739319599376193dca0dcc1728a6973bd6f4ff1e435 +size 338261856 diff --git a/Qwen2-0.5B-DPO.i1-Q4_0.gguf b/Qwen2-0.5B-DPO.i1-Q4_0.gguf new file mode 100644 index 0000000..2e4a33b --- /dev/null +++ b/Qwen2-0.5B-DPO.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:118889acb2e19d251e9786b1a9281a86eef2218dff26559e2d8cc25780b87d1f +size 352970592 diff --git a/Qwen2-0.5B-DPO.i1-Q4_1.gguf b/Qwen2-0.5B-DPO.i1-Q4_1.gguf new file mode 100644 index 0000000..14a21e1 --- /dev/null +++ b/Qwen2-0.5B-DPO.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cc6b551fdf8757fac91d7a1a024684c49ac49dea9697201b571b5f72465295d +size 374517600 diff --git a/Qwen2-0.5B-DPO.i1-Q4_K_M.gguf b/Qwen2-0.5B-DPO.i1-Q4_K_M.gguf new file mode 100644 index 0000000..a96a481 --- /dev/null +++ b/Qwen2-0.5B-DPO.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2065e4b83fca2128020834afedbc810e4a182227de9ab5fbde74377cba4b901 +size 397806432 diff --git a/Qwen2-0.5B-DPO.i1-Q4_K_S.gguf b/Qwen2-0.5B-DPO.i1-Q4_K_S.gguf new file mode 100644 index 0000000..ea19e81 --- /dev/null +++ b/Qwen2-0.5B-DPO.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed79b2bde4290fcb2febc559283fa185dbdc83b77246e5f0fca863a82b9fbe2f +size 385470304 diff --git a/Qwen2-0.5B-DPO.i1-Q5_K_M.gguf b/Qwen2-0.5B-DPO.i1-Q5_K_M.gguf new file mode 100644 index 0000000..4e90573 --- /dev/null +++ b/Qwen2-0.5B-DPO.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6de263bfcd8ff05328714926459d44829da014ee7c1f5c5c3607340697de630e +size 420084576 diff --git a/Qwen2-0.5B-DPO.i1-Q5_K_S.gguf b/Qwen2-0.5B-DPO.i1-Q5_K_S.gguf new file mode 100644 index 0000000..7199083 --- /dev/null +++ b/Qwen2-0.5B-DPO.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a12e0b524412894e1964e6ab7a3785ae47ed956f7644b4fde76ae6bddefbb94 +size 412708704 diff --git a/Qwen2-0.5B-DPO.i1-Q6_K.gguf b/Qwen2-0.5B-DPO.i1-Q6_K.gguf new file mode 100644 index 0000000..5039437 --- /dev/null +++ b/Qwen2-0.5B-DPO.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba1299445745223ab7144886f5d35a7ae85c28c59ba395edb56b83ec4aecc6ba +size 505735008 diff --git a/README.md b/README.md new file mode 100644 index 0000000..95da9c7 --- /dev/null +++ b/README.md @@ -0,0 +1,86 @@ +--- +base_model: trl-lib/Qwen2-0.5B-DPO +datasets: trl-lib/Capybara-Preferences +language: +- en +library_name: transformers +model_name: dpo-qwen2 +mradermacher: + readme_rev: 1 +quantized_by: mradermacher +tags: +- generated_from_trainer +- trl +- dpo +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/trl-lib/Qwen2-0.5B-DPO + + + +***For a convenient overview and download list, visit our [model page for this model](https://hf.tst.eu/model#Qwen2-0.5B-DPO-i1-GGUF).*** + +static quants are available at https://huggingface.co/mradermacher/Qwen2-0.5B-DPO-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/Qwen2-0.5B-DPO-i1-GGUF/resolve/main/Qwen2-0.5B-DPO.i1-IQ1_S.gguf) | i1-IQ1_S | 0.4 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/Qwen2-0.5B-DPO-i1-GGUF/resolve/main/Qwen2-0.5B-DPO.i1-IQ1_M.gguf) | i1-IQ1_M | 0.4 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/Qwen2-0.5B-DPO-i1-GGUF/resolve/main/Qwen2-0.5B-DPO.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 0.4 | | +| [GGUF](https://huggingface.co/mradermacher/Qwen2-0.5B-DPO-i1-GGUF/resolve/main/Qwen2-0.5B-DPO.i1-IQ2_XS.gguf) | i1-IQ2_XS | 0.4 | | +| [GGUF](https://huggingface.co/mradermacher/Qwen2-0.5B-DPO-i1-GGUF/resolve/main/Qwen2-0.5B-DPO.i1-IQ2_S.gguf) | i1-IQ2_S | 0.4 | | +| [GGUF](https://huggingface.co/mradermacher/Qwen2-0.5B-DPO-i1-GGUF/resolve/main/Qwen2-0.5B-DPO.i1-IQ2_M.gguf) | i1-IQ2_M | 0.4 | | +| [GGUF](https://huggingface.co/mradermacher/Qwen2-0.5B-DPO-i1-GGUF/resolve/main/Qwen2-0.5B-DPO.i1-Q2_K_S.gguf) | i1-Q2_K_S | 0.4 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/Qwen2-0.5B-DPO-i1-GGUF/resolve/main/Qwen2-0.5B-DPO.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 0.4 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/Qwen2-0.5B-DPO-i1-GGUF/resolve/main/Qwen2-0.5B-DPO.i1-Q3_K_S.gguf) | i1-Q3_K_S | 0.4 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/Qwen2-0.5B-DPO-i1-GGUF/resolve/main/Qwen2-0.5B-DPO.i1-IQ3_S.gguf) | i1-IQ3_S | 0.4 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/Qwen2-0.5B-DPO-i1-GGUF/resolve/main/Qwen2-0.5B-DPO.i1-IQ3_XS.gguf) | i1-IQ3_XS | 0.4 | | +| [GGUF](https://huggingface.co/mradermacher/Qwen2-0.5B-DPO-i1-GGUF/resolve/main/Qwen2-0.5B-DPO.i1-Q2_K.gguf) | i1-Q2_K | 0.4 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/Qwen2-0.5B-DPO-i1-GGUF/resolve/main/Qwen2-0.5B-DPO.i1-IQ3_M.gguf) | i1-IQ3_M | 0.4 | | +| [GGUF](https://huggingface.co/mradermacher/Qwen2-0.5B-DPO-i1-GGUF/resolve/main/Qwen2-0.5B-DPO.i1-IQ4_XS.gguf) | i1-IQ4_XS | 0.4 | | +| [GGUF](https://huggingface.co/mradermacher/Qwen2-0.5B-DPO-i1-GGUF/resolve/main/Qwen2-0.5B-DPO.i1-IQ4_NL.gguf) | i1-IQ4_NL | 0.5 | prefer IQ4_XS | +| [GGUF](https://huggingface.co/mradermacher/Qwen2-0.5B-DPO-i1-GGUF/resolve/main/Qwen2-0.5B-DPO.i1-Q4_0.gguf) | i1-Q4_0 | 0.5 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/Qwen2-0.5B-DPO-i1-GGUF/resolve/main/Qwen2-0.5B-DPO.i1-Q3_K_M.gguf) | i1-Q3_K_M | 0.5 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/Qwen2-0.5B-DPO-i1-GGUF/resolve/main/Qwen2-0.5B-DPO.i1-Q3_K_L.gguf) | i1-Q3_K_L | 0.5 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/Qwen2-0.5B-DPO-i1-GGUF/resolve/main/Qwen2-0.5B-DPO.i1-Q4_1.gguf) | i1-Q4_1 | 0.5 | | +| [GGUF](https://huggingface.co/mradermacher/Qwen2-0.5B-DPO-i1-GGUF/resolve/main/Qwen2-0.5B-DPO.i1-Q4_K_S.gguf) | i1-Q4_K_S | 0.5 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/Qwen2-0.5B-DPO-i1-GGUF/resolve/main/Qwen2-0.5B-DPO.i1-Q4_K_M.gguf) | i1-Q4_K_M | 0.5 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/Qwen2-0.5B-DPO-i1-GGUF/resolve/main/Qwen2-0.5B-DPO.i1-Q5_K_S.gguf) | i1-Q5_K_S | 0.5 | | +| [GGUF](https://huggingface.co/mradermacher/Qwen2-0.5B-DPO-i1-GGUF/resolve/main/Qwen2-0.5B-DPO.i1-Q5_K_M.gguf) | i1-Q5_K_M | 0.5 | | +| [GGUF](https://huggingface.co/mradermacher/Qwen2-0.5B-DPO-i1-GGUF/resolve/main/Qwen2-0.5B-DPO.i1-Q6_K.gguf) | i1-Q6_K | 0.6 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..53ef704 --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4115e0a1c7c25b495c9fb9dbdb6f6b3ad2a6ad308b382768569931f303ee0bb1 +size 988597