From f6d609f092fe1c2d0635a544a28cf83fa592fb7b Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Wed, 6 May 2026 15:01:10 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mradermacher/MagpieLM-8B-Chat-v0.1-i1-GGUF Source: Original Platform --- .gitattributes | 60 ++++++++++++++++++ MagpieLM-8B-Chat-v0.1.i1-IQ1_M.gguf | 3 + MagpieLM-8B-Chat-v0.1.i1-IQ1_S.gguf | 3 + MagpieLM-8B-Chat-v0.1.i1-IQ2_M.gguf | 3 + MagpieLM-8B-Chat-v0.1.i1-IQ2_S.gguf | 3 + MagpieLM-8B-Chat-v0.1.i1-IQ2_XS.gguf | 3 + MagpieLM-8B-Chat-v0.1.i1-IQ2_XXS.gguf | 3 + MagpieLM-8B-Chat-v0.1.i1-IQ3_M.gguf | 3 + MagpieLM-8B-Chat-v0.1.i1-IQ3_S.gguf | 3 + MagpieLM-8B-Chat-v0.1.i1-IQ3_XS.gguf | 3 + MagpieLM-8B-Chat-v0.1.i1-IQ3_XXS.gguf | 3 + MagpieLM-8B-Chat-v0.1.i1-IQ4_XS.gguf | 3 + MagpieLM-8B-Chat-v0.1.i1-Q2_K.gguf | 3 + MagpieLM-8B-Chat-v0.1.i1-Q3_K_L.gguf | 3 + MagpieLM-8B-Chat-v0.1.i1-Q3_K_M.gguf | 3 + MagpieLM-8B-Chat-v0.1.i1-Q3_K_S.gguf | 3 + MagpieLM-8B-Chat-v0.1.i1-Q4_0.gguf | 3 + MagpieLM-8B-Chat-v0.1.i1-Q4_0_4_4.gguf | 3 + MagpieLM-8B-Chat-v0.1.i1-Q4_0_4_8.gguf | 3 + MagpieLM-8B-Chat-v0.1.i1-Q4_0_8_8.gguf | 3 + MagpieLM-8B-Chat-v0.1.i1-Q4_K_M.gguf | 3 + MagpieLM-8B-Chat-v0.1.i1-Q4_K_S.gguf | 3 + MagpieLM-8B-Chat-v0.1.i1-Q5_K_M.gguf | 3 + MagpieLM-8B-Chat-v0.1.i1-Q5_K_S.gguf | 3 + MagpieLM-8B-Chat-v0.1.i1-Q6_K.gguf | 3 + README.md | 84 ++++++++++++++++++++++++++ imatrix.dat | 3 + 27 files changed, 219 insertions(+) create mode 100644 .gitattributes create mode 100644 MagpieLM-8B-Chat-v0.1.i1-IQ1_M.gguf create mode 100644 MagpieLM-8B-Chat-v0.1.i1-IQ1_S.gguf create mode 100644 MagpieLM-8B-Chat-v0.1.i1-IQ2_M.gguf create mode 100644 MagpieLM-8B-Chat-v0.1.i1-IQ2_S.gguf create mode 100644 MagpieLM-8B-Chat-v0.1.i1-IQ2_XS.gguf create mode 100644 MagpieLM-8B-Chat-v0.1.i1-IQ2_XXS.gguf create mode 100644 MagpieLM-8B-Chat-v0.1.i1-IQ3_M.gguf create mode 100644 MagpieLM-8B-Chat-v0.1.i1-IQ3_S.gguf create mode 100644 MagpieLM-8B-Chat-v0.1.i1-IQ3_XS.gguf create mode 100644 MagpieLM-8B-Chat-v0.1.i1-IQ3_XXS.gguf create mode 100644 MagpieLM-8B-Chat-v0.1.i1-IQ4_XS.gguf create mode 100644 MagpieLM-8B-Chat-v0.1.i1-Q2_K.gguf create mode 100644 MagpieLM-8B-Chat-v0.1.i1-Q3_K_L.gguf create mode 100644 MagpieLM-8B-Chat-v0.1.i1-Q3_K_M.gguf create mode 100644 MagpieLM-8B-Chat-v0.1.i1-Q3_K_S.gguf create mode 100644 MagpieLM-8B-Chat-v0.1.i1-Q4_0.gguf create mode 100644 MagpieLM-8B-Chat-v0.1.i1-Q4_0_4_4.gguf create mode 100644 MagpieLM-8B-Chat-v0.1.i1-Q4_0_4_8.gguf create mode 100644 MagpieLM-8B-Chat-v0.1.i1-Q4_0_8_8.gguf create mode 100644 MagpieLM-8B-Chat-v0.1.i1-Q4_K_M.gguf create mode 100644 MagpieLM-8B-Chat-v0.1.i1-Q4_K_S.gguf create mode 100644 MagpieLM-8B-Chat-v0.1.i1-Q5_K_M.gguf create mode 100644 MagpieLM-8B-Chat-v0.1.i1-Q5_K_S.gguf create mode 100644 MagpieLM-8B-Chat-v0.1.i1-Q6_K.gguf create mode 100644 README.md create mode 100644 imatrix.dat diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..1d82754 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +MagpieLM-8B-Chat-v0.1.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +MagpieLM-8B-Chat-v0.1.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +MagpieLM-8B-Chat-v0.1.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +MagpieLM-8B-Chat-v0.1.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +MagpieLM-8B-Chat-v0.1.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +MagpieLM-8B-Chat-v0.1.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +MagpieLM-8B-Chat-v0.1.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +MagpieLM-8B-Chat-v0.1.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +MagpieLM-8B-Chat-v0.1.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +MagpieLM-8B-Chat-v0.1.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +MagpieLM-8B-Chat-v0.1.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +MagpieLM-8B-Chat-v0.1.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +MagpieLM-8B-Chat-v0.1.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +MagpieLM-8B-Chat-v0.1.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +MagpieLM-8B-Chat-v0.1.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +MagpieLM-8B-Chat-v0.1.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +MagpieLM-8B-Chat-v0.1.i1-Q4_0_4_4.gguf filter=lfs diff=lfs merge=lfs -text +MagpieLM-8B-Chat-v0.1.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +MagpieLM-8B-Chat-v0.1.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +MagpieLM-8B-Chat-v0.1.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +MagpieLM-8B-Chat-v0.1.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +MagpieLM-8B-Chat-v0.1.i1-Q4_0_4_8.gguf filter=lfs diff=lfs merge=lfs -text +MagpieLM-8B-Chat-v0.1.i1-Q4_0_8_8.gguf filter=lfs diff=lfs merge=lfs -text +MagpieLM-8B-Chat-v0.1.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/MagpieLM-8B-Chat-v0.1.i1-IQ1_M.gguf b/MagpieLM-8B-Chat-v0.1.i1-IQ1_M.gguf new file mode 100644 index 0000000..e036e8c --- /dev/null +++ b/MagpieLM-8B-Chat-v0.1.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef4be8e92857319395ad417789248cca076893caf2f7408b9f79f56fef07b9da +size 2161973568 diff --git a/MagpieLM-8B-Chat-v0.1.i1-IQ1_S.gguf b/MagpieLM-8B-Chat-v0.1.i1-IQ1_S.gguf new file mode 100644 index 0000000..74a463f --- /dev/null +++ b/MagpieLM-8B-Chat-v0.1.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cffff25dde960bb902ebb9d53ed9478c340813db2a9a9e9629e37e53daea4a52 +size 2019629376 diff --git a/MagpieLM-8B-Chat-v0.1.i1-IQ2_M.gguf b/MagpieLM-8B-Chat-v0.1.i1-IQ2_M.gguf new file mode 100644 index 0000000..da81161 --- /dev/null +++ b/MagpieLM-8B-Chat-v0.1.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1c1cca038b42879f5eb12bdb5f24cbf8374002136a8913eedf887e475a5ca53 +size 2948282688 diff --git a/MagpieLM-8B-Chat-v0.1.i1-IQ2_S.gguf b/MagpieLM-8B-Chat-v0.1.i1-IQ2_S.gguf new file mode 100644 index 0000000..5187b46 --- /dev/null +++ b/MagpieLM-8B-Chat-v0.1.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:177df02553c6eb100fd1c8792d2d3425732dcc2c465181516344c4bfb7e30aa9 +size 2758490432 diff --git a/MagpieLM-8B-Chat-v0.1.i1-IQ2_XS.gguf b/MagpieLM-8B-Chat-v0.1.i1-IQ2_XS.gguf new file mode 100644 index 0000000..1a82ffb --- /dev/null +++ b/MagpieLM-8B-Chat-v0.1.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:672916696c6f9fba1ce7e8612832e11eeb0337e47eb38a01d141632e57937c7f +size 2605783360 diff --git a/MagpieLM-8B-Chat-v0.1.i1-IQ2_XXS.gguf b/MagpieLM-8B-Chat-v0.1.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..fd91ce0 --- /dev/null +++ b/MagpieLM-8B-Chat-v0.1.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd350b0c23ecb2702ae6ce611684443b0d391b4c2f9cd63dd0d430a9f2a97900 +size 2399213888 diff --git a/MagpieLM-8B-Chat-v0.1.i1-IQ3_M.gguf b/MagpieLM-8B-Chat-v0.1.i1-IQ3_M.gguf new file mode 100644 index 0000000..686495f --- /dev/null +++ b/MagpieLM-8B-Chat-v0.1.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edf6a6ed1202093401115d70c8a0c689fddb4c7a6e87155844bf5fe7cee78404 +size 3784825152 diff --git a/MagpieLM-8B-Chat-v0.1.i1-IQ3_S.gguf b/MagpieLM-8B-Chat-v0.1.i1-IQ3_S.gguf new file mode 100644 index 0000000..d3b755f --- /dev/null +++ b/MagpieLM-8B-Chat-v0.1.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab0055202512f8c5f065aa2ded615051c695222ba516f1a3a4377a59b17524be +size 3682326848 diff --git a/MagpieLM-8B-Chat-v0.1.i1-IQ3_XS.gguf b/MagpieLM-8B-Chat-v0.1.i1-IQ3_XS.gguf new file mode 100644 index 0000000..a7b69c8 --- /dev/null +++ b/MagpieLM-8B-Chat-v0.1.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91693a9a48156541a9e2fc6ef744b8930e89ceef990393341c4dfd6c969a8c29 +size 3518748992 diff --git a/MagpieLM-8B-Chat-v0.1.i1-IQ3_XXS.gguf b/MagpieLM-8B-Chat-v0.1.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..b8cba58 --- /dev/null +++ b/MagpieLM-8B-Chat-v0.1.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b454a410ef16bc27c39a7086bdb8a2a0483b99cecb2a3e54acec9dce2000cd3 +size 3274914112 diff --git a/MagpieLM-8B-Chat-v0.1.i1-IQ4_XS.gguf b/MagpieLM-8B-Chat-v0.1.i1-IQ4_XS.gguf new file mode 100644 index 0000000..e7e923e --- /dev/null +++ b/MagpieLM-8B-Chat-v0.1.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43656866424cf0678a9c1d1a2b60fc03c0866172184bf01c42affe46787c8aff +size 4447664448 diff --git a/MagpieLM-8B-Chat-v0.1.i1-Q2_K.gguf b/MagpieLM-8B-Chat-v0.1.i1-Q2_K.gguf new file mode 100644 index 0000000..0af58fd --- /dev/null +++ b/MagpieLM-8B-Chat-v0.1.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f82325b0e2f540ef81f60ccc4b340fdfe51b6fe66b75455563e508dfc413d650 +size 3179133248 diff --git a/MagpieLM-8B-Chat-v0.1.i1-Q3_K_L.gguf b/MagpieLM-8B-Chat-v0.1.i1-Q3_K_L.gguf new file mode 100644 index 0000000..02c37e8 --- /dev/null +++ b/MagpieLM-8B-Chat-v0.1.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e7769eb32244df780f9c551bcb9d3fe15caba43632f47d04575c8255289eacd +size 4321958208 diff --git a/MagpieLM-8B-Chat-v0.1.i1-Q3_K_M.gguf b/MagpieLM-8B-Chat-v0.1.i1-Q3_K_M.gguf new file mode 100644 index 0000000..17022c9 --- /dev/null +++ b/MagpieLM-8B-Chat-v0.1.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9ba638e980495e3bb372dbb99654e56db7e0d5c8f1de6ae5e73428a0c81f3b7 +size 4018919744 diff --git a/MagpieLM-8B-Chat-v0.1.i1-Q3_K_S.gguf b/MagpieLM-8B-Chat-v0.1.i1-Q3_K_S.gguf new file mode 100644 index 0000000..6e37ae5 --- /dev/null +++ b/MagpieLM-8B-Chat-v0.1.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab5138f82b8660e741c8a4b44b5dce43f5b5efb4f7c8f8d75f53eb3c5d4f921c +size 3664501056 diff --git a/MagpieLM-8B-Chat-v0.1.i1-Q4_0.gguf b/MagpieLM-8B-Chat-v0.1.i1-Q4_0.gguf new file mode 100644 index 0000000..d946092 --- /dev/null +++ b/MagpieLM-8B-Chat-v0.1.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d21d9f7e917ea264685dd3abc0b39e1f7d41086116ccdbcc083be05ad1d7edaf +size 4675893568 diff --git a/MagpieLM-8B-Chat-v0.1.i1-Q4_0_4_4.gguf b/MagpieLM-8B-Chat-v0.1.i1-Q4_0_4_4.gguf new file mode 100644 index 0000000..0e355cb --- /dev/null +++ b/MagpieLM-8B-Chat-v0.1.i1-Q4_0_4_4.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:464b34d649cb3d0fb822e2cd876d4b48df609f156bb4daa3d8538f0071f74dd3 +size 4661213504 diff --git a/MagpieLM-8B-Chat-v0.1.i1-Q4_0_4_8.gguf b/MagpieLM-8B-Chat-v0.1.i1-Q4_0_4_8.gguf new file mode 100644 index 0000000..872a701 --- /dev/null +++ b/MagpieLM-8B-Chat-v0.1.i1-Q4_0_4_8.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:273dd86f3e7ee5f8ff05b90e44a25ae7cf0d4205ad67b8e82d3b52173b27ff24 +size 4661213504 diff --git a/MagpieLM-8B-Chat-v0.1.i1-Q4_0_8_8.gguf b/MagpieLM-8B-Chat-v0.1.i1-Q4_0_8_8.gguf new file mode 100644 index 0000000..41edc3a --- /dev/null +++ b/MagpieLM-8B-Chat-v0.1.i1-Q4_0_8_8.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db6637a91bdaff722dd1d0b3300a2fb32f97689177f1423e5066d41621f4635f +size 4661213504 diff --git a/MagpieLM-8B-Chat-v0.1.i1-Q4_K_M.gguf b/MagpieLM-8B-Chat-v0.1.i1-Q4_K_M.gguf new file mode 100644 index 0000000..2ebcf4f --- /dev/null +++ b/MagpieLM-8B-Chat-v0.1.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd2ffc47dc7b64ca408c225fa8ca324a5ae5c75fb016a51f022d396ee3057d65 +size 4920736064 diff --git a/MagpieLM-8B-Chat-v0.1.i1-Q4_K_S.gguf b/MagpieLM-8B-Chat-v0.1.i1-Q4_K_S.gguf new file mode 100644 index 0000000..5d26f72 --- /dev/null +++ b/MagpieLM-8B-Chat-v0.1.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5d7493c98bbea9dd1059413c3606f1af4c13339868348a501f090c7ef1f90ea +size 4692670784 diff --git a/MagpieLM-8B-Chat-v0.1.i1-Q5_K_M.gguf b/MagpieLM-8B-Chat-v0.1.i1-Q5_K_M.gguf new file mode 100644 index 0000000..91a596f --- /dev/null +++ b/MagpieLM-8B-Chat-v0.1.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e93257983b782f4b31a9b60483e0e790dc17d5c9c00d77b23528af76d4500e7 +size 5732989248 diff --git a/MagpieLM-8B-Chat-v0.1.i1-Q5_K_S.gguf b/MagpieLM-8B-Chat-v0.1.i1-Q5_K_S.gguf new file mode 100644 index 0000000..6551c64 --- /dev/null +++ b/MagpieLM-8B-Chat-v0.1.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17cc3b0ea2689c304b13f39c21633affd82ffd1134c6ca8c76aadbb8de423de0 +size 5599295808 diff --git a/MagpieLM-8B-Chat-v0.1.i1-Q6_K.gguf b/MagpieLM-8B-Chat-v0.1.i1-Q6_K.gguf new file mode 100644 index 0000000..2ab939e --- /dev/null +++ b/MagpieLM-8B-Chat-v0.1.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbcb3fa75de6100aa663844ee16ef88b24ecd279951d3b7e831b50e250893b0f +size 6596008256 diff --git a/README.md b/README.md new file mode 100644 index 0000000..2d0216a --- /dev/null +++ b/README.md @@ -0,0 +1,84 @@ +--- +base_model: Magpie-Align/MagpieLM-8B-Chat-v0.1 +datasets: +- Magpie-Align/MagpieLM-SFT-Data-v0.1 +- Magpie-Align/MagpieLM-DPO-Data-v0.1 +language: +- en +library_name: transformers +license: llama3.1 +quantized_by: mradermacher +tags: +- alignment-handbook +- trl +- dpo +- generated_from_trainer +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/Magpie-Align/MagpieLM-8B-Chat-v0.1 + + +static quants are available at https://huggingface.co/mradermacher/MagpieLM-8B-Chat-v0.1-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/MagpieLM-8B-Chat-v0.1-i1-GGUF/resolve/main/MagpieLM-8B-Chat-v0.1.i1-IQ1_S.gguf) | i1-IQ1_S | 2.1 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/MagpieLM-8B-Chat-v0.1-i1-GGUF/resolve/main/MagpieLM-8B-Chat-v0.1.i1-IQ1_M.gguf) | i1-IQ1_M | 2.3 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/MagpieLM-8B-Chat-v0.1-i1-GGUF/resolve/main/MagpieLM-8B-Chat-v0.1.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 2.5 | | +| [GGUF](https://huggingface.co/mradermacher/MagpieLM-8B-Chat-v0.1-i1-GGUF/resolve/main/MagpieLM-8B-Chat-v0.1.i1-IQ2_XS.gguf) | i1-IQ2_XS | 2.7 | | +| [GGUF](https://huggingface.co/mradermacher/MagpieLM-8B-Chat-v0.1-i1-GGUF/resolve/main/MagpieLM-8B-Chat-v0.1.i1-IQ2_S.gguf) | i1-IQ2_S | 2.9 | | +| [GGUF](https://huggingface.co/mradermacher/MagpieLM-8B-Chat-v0.1-i1-GGUF/resolve/main/MagpieLM-8B-Chat-v0.1.i1-IQ2_M.gguf) | i1-IQ2_M | 3.0 | | +| [GGUF](https://huggingface.co/mradermacher/MagpieLM-8B-Chat-v0.1-i1-GGUF/resolve/main/MagpieLM-8B-Chat-v0.1.i1-Q2_K.gguf) | i1-Q2_K | 3.3 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/MagpieLM-8B-Chat-v0.1-i1-GGUF/resolve/main/MagpieLM-8B-Chat-v0.1.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 3.4 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/MagpieLM-8B-Chat-v0.1-i1-GGUF/resolve/main/MagpieLM-8B-Chat-v0.1.i1-IQ3_XS.gguf) | i1-IQ3_XS | 3.6 | | +| [GGUF](https://huggingface.co/mradermacher/MagpieLM-8B-Chat-v0.1-i1-GGUF/resolve/main/MagpieLM-8B-Chat-v0.1.i1-Q3_K_S.gguf) | i1-Q3_K_S | 3.8 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/MagpieLM-8B-Chat-v0.1-i1-GGUF/resolve/main/MagpieLM-8B-Chat-v0.1.i1-IQ3_S.gguf) | i1-IQ3_S | 3.8 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/MagpieLM-8B-Chat-v0.1-i1-GGUF/resolve/main/MagpieLM-8B-Chat-v0.1.i1-IQ3_M.gguf) | i1-IQ3_M | 3.9 | | +| [GGUF](https://huggingface.co/mradermacher/MagpieLM-8B-Chat-v0.1-i1-GGUF/resolve/main/MagpieLM-8B-Chat-v0.1.i1-Q3_K_M.gguf) | i1-Q3_K_M | 4.1 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/MagpieLM-8B-Chat-v0.1-i1-GGUF/resolve/main/MagpieLM-8B-Chat-v0.1.i1-Q3_K_L.gguf) | i1-Q3_K_L | 4.4 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/MagpieLM-8B-Chat-v0.1-i1-GGUF/resolve/main/MagpieLM-8B-Chat-v0.1.i1-IQ4_XS.gguf) | i1-IQ4_XS | 4.5 | | +| [GGUF](https://huggingface.co/mradermacher/MagpieLM-8B-Chat-v0.1-i1-GGUF/resolve/main/MagpieLM-8B-Chat-v0.1.i1-Q4_0_4_4.gguf) | i1-Q4_0_4_4 | 4.8 | fast on arm, low quality | +| [GGUF](https://huggingface.co/mradermacher/MagpieLM-8B-Chat-v0.1-i1-GGUF/resolve/main/MagpieLM-8B-Chat-v0.1.i1-Q4_0_4_8.gguf) | i1-Q4_0_4_8 | 4.8 | fast on arm+i8mm, low quality | +| [GGUF](https://huggingface.co/mradermacher/MagpieLM-8B-Chat-v0.1-i1-GGUF/resolve/main/MagpieLM-8B-Chat-v0.1.i1-Q4_0_8_8.gguf) | i1-Q4_0_8_8 | 4.8 | fast on arm+sve, low quality | +| [GGUF](https://huggingface.co/mradermacher/MagpieLM-8B-Chat-v0.1-i1-GGUF/resolve/main/MagpieLM-8B-Chat-v0.1.i1-Q4_0.gguf) | i1-Q4_0 | 4.8 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/MagpieLM-8B-Chat-v0.1-i1-GGUF/resolve/main/MagpieLM-8B-Chat-v0.1.i1-Q4_K_S.gguf) | i1-Q4_K_S | 4.8 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/MagpieLM-8B-Chat-v0.1-i1-GGUF/resolve/main/MagpieLM-8B-Chat-v0.1.i1-Q4_K_M.gguf) | i1-Q4_K_M | 5.0 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/MagpieLM-8B-Chat-v0.1-i1-GGUF/resolve/main/MagpieLM-8B-Chat-v0.1.i1-Q5_K_S.gguf) | i1-Q5_K_S | 5.7 | | +| [GGUF](https://huggingface.co/mradermacher/MagpieLM-8B-Chat-v0.1-i1-GGUF/resolve/main/MagpieLM-8B-Chat-v0.1.i1-Q5_K_M.gguf) | i1-Q5_K_M | 5.8 | | +| [GGUF](https://huggingface.co/mradermacher/MagpieLM-8B-Chat-v0.1-i1-GGUF/resolve/main/MagpieLM-8B-Chat-v0.1.i1-Q6_K.gguf) | i1-Q6_K | 6.7 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..43443e6 --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:289f934d00c4e01a7fe2241b7d8dc7ed3eb753ce157392c3a144f402f58c1333 +size 4988157