From a43299a6d80e6f490d8604acaef356a048e89af2 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Tue, 5 May 2026 10:36:21 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mradermacher/DPOB-INMTOB-7B-i1-GGUF Source: Original Platform --- .gitattributes | 60 ++++++++++++++++++++++++ DPOB-INMTOB-7B.i1-IQ1_M.gguf | 3 ++ DPOB-INMTOB-7B.i1-IQ1_S.gguf | 3 ++ DPOB-INMTOB-7B.i1-IQ2_M.gguf | 3 ++ DPOB-INMTOB-7B.i1-IQ2_S.gguf | 3 ++ DPOB-INMTOB-7B.i1-IQ2_XS.gguf | 3 ++ DPOB-INMTOB-7B.i1-IQ2_XXS.gguf | 3 ++ DPOB-INMTOB-7B.i1-IQ3_M.gguf | 3 ++ DPOB-INMTOB-7B.i1-IQ3_S.gguf | 3 ++ DPOB-INMTOB-7B.i1-IQ3_XS.gguf | 3 ++ DPOB-INMTOB-7B.i1-IQ3_XXS.gguf | 3 ++ DPOB-INMTOB-7B.i1-IQ4_XS.gguf | 3 ++ DPOB-INMTOB-7B.i1-Q2_K.gguf | 3 ++ DPOB-INMTOB-7B.i1-Q3_K_L.gguf | 3 ++ DPOB-INMTOB-7B.i1-Q3_K_M.gguf | 3 ++ DPOB-INMTOB-7B.i1-Q3_K_S.gguf | 3 ++ DPOB-INMTOB-7B.i1-Q4_0.gguf | 3 ++ DPOB-INMTOB-7B.i1-Q4_0_4_4.gguf | 3 ++ DPOB-INMTOB-7B.i1-Q4_0_4_8.gguf | 3 ++ DPOB-INMTOB-7B.i1-Q4_0_8_8.gguf | 3 ++ DPOB-INMTOB-7B.i1-Q4_K_M.gguf | 3 ++ DPOB-INMTOB-7B.i1-Q4_K_S.gguf | 3 ++ DPOB-INMTOB-7B.i1-Q5_K_M.gguf | 3 ++ DPOB-INMTOB-7B.i1-Q5_K_S.gguf | 3 ++ DPOB-INMTOB-7B.i1-Q6_K.gguf | 3 ++ README.md | 82 +++++++++++++++++++++++++++++++++ imatrix.dat | 3 ++ 27 files changed, 217 insertions(+) create mode 100644 .gitattributes create mode 100644 DPOB-INMTOB-7B.i1-IQ1_M.gguf create mode 100644 DPOB-INMTOB-7B.i1-IQ1_S.gguf create mode 100644 DPOB-INMTOB-7B.i1-IQ2_M.gguf create mode 100644 DPOB-INMTOB-7B.i1-IQ2_S.gguf create mode 100644 DPOB-INMTOB-7B.i1-IQ2_XS.gguf create mode 100644 DPOB-INMTOB-7B.i1-IQ2_XXS.gguf create mode 100644 DPOB-INMTOB-7B.i1-IQ3_M.gguf create mode 100644 DPOB-INMTOB-7B.i1-IQ3_S.gguf create mode 100644 DPOB-INMTOB-7B.i1-IQ3_XS.gguf create mode 100644 DPOB-INMTOB-7B.i1-IQ3_XXS.gguf create mode 100644 DPOB-INMTOB-7B.i1-IQ4_XS.gguf create mode 100644 DPOB-INMTOB-7B.i1-Q2_K.gguf create mode 100644 DPOB-INMTOB-7B.i1-Q3_K_L.gguf create mode 100644 DPOB-INMTOB-7B.i1-Q3_K_M.gguf create mode 100644 DPOB-INMTOB-7B.i1-Q3_K_S.gguf create mode 100644 DPOB-INMTOB-7B.i1-Q4_0.gguf create mode 100644 DPOB-INMTOB-7B.i1-Q4_0_4_4.gguf create mode 100644 DPOB-INMTOB-7B.i1-Q4_0_4_8.gguf create mode 100644 DPOB-INMTOB-7B.i1-Q4_0_8_8.gguf create mode 100644 DPOB-INMTOB-7B.i1-Q4_K_M.gguf create mode 100644 DPOB-INMTOB-7B.i1-Q4_K_S.gguf create mode 100644 DPOB-INMTOB-7B.i1-Q5_K_M.gguf create mode 100644 DPOB-INMTOB-7B.i1-Q5_K_S.gguf create mode 100644 DPOB-INMTOB-7B.i1-Q6_K.gguf create mode 100644 README.md create mode 100644 imatrix.dat diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..16f36a0 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +DPOB-INMTOB-7B.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +DPOB-INMTOB-7B.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +DPOB-INMTOB-7B.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +DPOB-INMTOB-7B.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +DPOB-INMTOB-7B.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +DPOB-INMTOB-7B.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +DPOB-INMTOB-7B.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +DPOB-INMTOB-7B.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +DPOB-INMTOB-7B.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +DPOB-INMTOB-7B.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +DPOB-INMTOB-7B.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +DPOB-INMTOB-7B.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +DPOB-INMTOB-7B.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +DPOB-INMTOB-7B.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +DPOB-INMTOB-7B.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +DPOB-INMTOB-7B.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +DPOB-INMTOB-7B.i1-Q4_0_4_4.gguf filter=lfs diff=lfs merge=lfs -text +DPOB-INMTOB-7B.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +DPOB-INMTOB-7B.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +DPOB-INMTOB-7B.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +DPOB-INMTOB-7B.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +DPOB-INMTOB-7B.i1-Q4_0_4_8.gguf filter=lfs diff=lfs merge=lfs -text +DPOB-INMTOB-7B.i1-Q4_0_8_8.gguf filter=lfs diff=lfs merge=lfs -text +DPOB-INMTOB-7B.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/DPOB-INMTOB-7B.i1-IQ1_M.gguf b/DPOB-INMTOB-7B.i1-IQ1_M.gguf new file mode 100644 index 0000000..b78fe05 --- /dev/null +++ b/DPOB-INMTOB-7B.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95ce49fc9145afdaa4bf2faf22184d8b6f8c2e234b79e9df1030dab37ffaea03 +size 1754447232 diff --git a/DPOB-INMTOB-7B.i1-IQ1_S.gguf b/DPOB-INMTOB-7B.i1-IQ1_S.gguf new file mode 100644 index 0000000..08f7e15 --- /dev/null +++ b/DPOB-INMTOB-7B.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abc7b22358e105609a960a16578a69e4c7636c3d210db091d235aeaa72994844 +size 1612103040 diff --git a/DPOB-INMTOB-7B.i1-IQ2_M.gguf b/DPOB-INMTOB-7B.i1-IQ2_M.gguf new file mode 100644 index 0000000..5d2455c --- /dev/null +++ b/DPOB-INMTOB-7B.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b7e07e7041789030ad00c802372b03e1deb37dcd70121adea59daac803604ec +size 2500713856 diff --git a/DPOB-INMTOB-7B.i1-IQ2_S.gguf b/DPOB-INMTOB-7B.i1-IQ2_S.gguf new file mode 100644 index 0000000..e1aca6e --- /dev/null +++ b/DPOB-INMTOB-7B.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8681d2426347af9b19c51874900e78ce3126f4d7388f6f83f219ec4833032d94 +size 2310921600 diff --git a/DPOB-INMTOB-7B.i1-IQ2_XS.gguf b/DPOB-INMTOB-7B.i1-IQ2_XS.gguf new file mode 100644 index 0000000..b5f898c --- /dev/null +++ b/DPOB-INMTOB-7B.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:563ea7a056dc148d8af10248749a337977fdb349560e1acd1a020636f9d45828 +size 2198257024 diff --git a/DPOB-INMTOB-7B.i1-IQ2_XXS.gguf b/DPOB-INMTOB-7B.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..3299847 --- /dev/null +++ b/DPOB-INMTOB-7B.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8180b5ef5330292cb92f04309c39f4bdef367c40c341eb76a3aa7d08334646a6 +size 1991687552 diff --git a/DPOB-INMTOB-7B.i1-IQ3_M.gguf b/DPOB-INMTOB-7B.i1-IQ3_M.gguf new file mode 100644 index 0000000..1c225d5 --- /dev/null +++ b/DPOB-INMTOB-7B.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27daa7408755c8bc3c74753a9a705dc4124a984d4567285024546f6244b94f97 +size 3284893056 diff --git a/DPOB-INMTOB-7B.i1-IQ3_S.gguf b/DPOB-INMTOB-7B.i1-IQ3_S.gguf new file mode 100644 index 0000000..c5dcc94 --- /dev/null +++ b/DPOB-INMTOB-7B.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83f9925ca36f4ec0b10e865bd0359659d3249f6bca54f851a4932672c45c2d70 +size 3182394752 diff --git a/DPOB-INMTOB-7B.i1-IQ3_XS.gguf b/DPOB-INMTOB-7B.i1-IQ3_XS.gguf new file mode 100644 index 0000000..5b296ac --- /dev/null +++ b/DPOB-INMTOB-7B.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8731e6dc85baa4aef749d34d7629f06319a5226b6f4be07dd39e321d1c17ef36 +size 3018816896 diff --git a/DPOB-INMTOB-7B.i1-IQ3_XXS.gguf b/DPOB-INMTOB-7B.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..9ac7a3c --- /dev/null +++ b/DPOB-INMTOB-7B.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34a59aae37ffe816c50ff335a6f736babe4227ee7a87f50253f1936367a090aa +size 2827345280 diff --git a/DPOB-INMTOB-7B.i1-IQ4_XS.gguf b/DPOB-INMTOB-7B.i1-IQ4_XS.gguf new file mode 100644 index 0000000..d780b0a --- /dev/null +++ b/DPOB-INMTOB-7B.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a360e7a48d04e455d9ec725f9d31c804e25551a5c48d57ecaf3718d93d75c8c +size 3907689856 diff --git a/DPOB-INMTOB-7B.i1-Q2_K.gguf b/DPOB-INMTOB-7B.i1-Q2_K.gguf new file mode 100644 index 0000000..be322b4 --- /dev/null +++ b/DPOB-INMTOB-7B.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99aed707e8a169124f712d1621017e6608f918869c18bb1d25a4468b614ab7a3 +size 2719243648 diff --git a/DPOB-INMTOB-7B.i1-Q3_K_L.gguf b/DPOB-INMTOB-7B.i1-Q3_K_L.gguf new file mode 100644 index 0000000..ddd25d8 --- /dev/null +++ b/DPOB-INMTOB-7B.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2d49a482933b020339f6a4d872e1c429c180d669712f37e7ae587eb61a6027a +size 3822026112 diff --git a/DPOB-INMTOB-7B.i1-Q3_K_M.gguf b/DPOB-INMTOB-7B.i1-Q3_K_M.gguf new file mode 100644 index 0000000..c20fea1 --- /dev/null +++ b/DPOB-INMTOB-7B.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b993f3bc5c994f0cc99ba9cc70af0a1a2a1d2dca326206fa37a1ac41122733d0 +size 3518987648 diff --git a/DPOB-INMTOB-7B.i1-Q3_K_S.gguf b/DPOB-INMTOB-7B.i1-Q3_K_S.gguf new file mode 100644 index 0000000..9cb3c91 --- /dev/null +++ b/DPOB-INMTOB-7B.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:749116fcf7e69b89ec90faf7ba0db0f9e2b7f77e15842f62350cd4b18c1a1089 +size 3164568960 diff --git a/DPOB-INMTOB-7B.i1-Q4_0.gguf b/DPOB-INMTOB-7B.i1-Q4_0.gguf new file mode 100644 index 0000000..afbe131 --- /dev/null +++ b/DPOB-INMTOB-7B.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdd627332d863b7f6d31158d5d808159276db14e50340c8ea3648cf54631fc19 +size 4123598208 diff --git a/DPOB-INMTOB-7B.i1-Q4_0_4_4.gguf b/DPOB-INMTOB-7B.i1-Q4_0_4_4.gguf new file mode 100644 index 0000000..b5180b8 --- /dev/null +++ b/DPOB-INMTOB-7B.i1-Q4_0_4_4.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8967362cdbb7abddf235163d606f893a477d4e52d670d7c06aeea0c3a731bd58 +size 4108918144 diff --git a/DPOB-INMTOB-7B.i1-Q4_0_4_8.gguf b/DPOB-INMTOB-7B.i1-Q4_0_4_8.gguf new file mode 100644 index 0000000..de97b2f --- /dev/null +++ b/DPOB-INMTOB-7B.i1-Q4_0_4_8.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b49ebbc8ac113b8e4c1a8406876e6a09c92a19b201241240a213b096b526f01 +size 4108918144 diff --git a/DPOB-INMTOB-7B.i1-Q4_0_8_8.gguf b/DPOB-INMTOB-7B.i1-Q4_0_8_8.gguf new file mode 100644 index 0000000..9d62887 --- /dev/null +++ b/DPOB-INMTOB-7B.i1-Q4_0_8_8.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2eece360a10ea300cfa58f51a0029c1e43461a756906176027f55834944eb677 +size 4108918144 diff --git a/DPOB-INMTOB-7B.i1-Q4_K_M.gguf b/DPOB-INMTOB-7B.i1-Q4_K_M.gguf new file mode 100644 index 0000000..a3452ce --- /dev/null +++ b/DPOB-INMTOB-7B.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99adc8f083f41ca6e763c363dfb7813785e05ae51f7c5767571a87d11a902452 +size 4368440704 diff --git a/DPOB-INMTOB-7B.i1-Q4_K_S.gguf b/DPOB-INMTOB-7B.i1-Q4_K_S.gguf new file mode 100644 index 0000000..d2089b2 --- /dev/null +++ b/DPOB-INMTOB-7B.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a89a869a0c4bc0b122306f8fdea5e2a5742da8ee45e6ed1a9110b40188c4e3a0 +size 4140375424 diff --git a/DPOB-INMTOB-7B.i1-Q5_K_M.gguf b/DPOB-INMTOB-7B.i1-Q5_K_M.gguf new file mode 100644 index 0000000..e4e46ce --- /dev/null +++ b/DPOB-INMTOB-7B.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2996dac4d76b5d903e66187179d0d1ba34b6b23c1b5e8ea8e1f4d064b72b0d7 +size 5131410816 diff --git a/DPOB-INMTOB-7B.i1-Q5_K_S.gguf b/DPOB-INMTOB-7B.i1-Q5_K_S.gguf new file mode 100644 index 0000000..48520df --- /dev/null +++ b/DPOB-INMTOB-7B.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ad69c301df20c81c654c104008155bbda8926bd5bb2f78777776f17ab5104d4 +size 4997717376 diff --git a/DPOB-INMTOB-7B.i1-Q6_K.gguf b/DPOB-INMTOB-7B.i1-Q6_K.gguf new file mode 100644 index 0000000..e592847 --- /dev/null +++ b/DPOB-INMTOB-7B.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed70459ffb5640bfae2f0e0cbeb3fa142cb97ff0ed3521af01d473e7717932f0 +size 5942066560 diff --git a/README.md b/README.md new file mode 100644 index 0000000..d382ae2 --- /dev/null +++ b/README.md @@ -0,0 +1,82 @@ +--- +base_model: paulml/DPOB-INMTOB-7B +language: +- en +library_name: transformers +license: cc-by-nc-4.0 +quantized_by: mradermacher +tags: +- merge +- mergekit +- lazymergekit +- liminerity/Omningotex-7b-slerp +- eren23/merged-dpo-binarized-NeutrixOmnibe-7B +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/paulml/DPOB-INMTOB-7B + + +static quants are available at https://huggingface.co/mradermacher/DPOB-INMTOB-7B-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/DPOB-INMTOB-7B-i1-GGUF/resolve/main/DPOB-INMTOB-7B.i1-IQ1_S.gguf) | i1-IQ1_S | 1.7 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/DPOB-INMTOB-7B-i1-GGUF/resolve/main/DPOB-INMTOB-7B.i1-IQ1_M.gguf) | i1-IQ1_M | 1.9 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/DPOB-INMTOB-7B-i1-GGUF/resolve/main/DPOB-INMTOB-7B.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 2.1 | | +| [GGUF](https://huggingface.co/mradermacher/DPOB-INMTOB-7B-i1-GGUF/resolve/main/DPOB-INMTOB-7B.i1-IQ2_XS.gguf) | i1-IQ2_XS | 2.3 | | +| [GGUF](https://huggingface.co/mradermacher/DPOB-INMTOB-7B-i1-GGUF/resolve/main/DPOB-INMTOB-7B.i1-IQ2_S.gguf) | i1-IQ2_S | 2.4 | | +| [GGUF](https://huggingface.co/mradermacher/DPOB-INMTOB-7B-i1-GGUF/resolve/main/DPOB-INMTOB-7B.i1-IQ2_M.gguf) | i1-IQ2_M | 2.6 | | +| [GGUF](https://huggingface.co/mradermacher/DPOB-INMTOB-7B-i1-GGUF/resolve/main/DPOB-INMTOB-7B.i1-Q2_K.gguf) | i1-Q2_K | 2.8 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/DPOB-INMTOB-7B-i1-GGUF/resolve/main/DPOB-INMTOB-7B.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 2.9 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/DPOB-INMTOB-7B-i1-GGUF/resolve/main/DPOB-INMTOB-7B.i1-IQ3_XS.gguf) | i1-IQ3_XS | 3.1 | | +| [GGUF](https://huggingface.co/mradermacher/DPOB-INMTOB-7B-i1-GGUF/resolve/main/DPOB-INMTOB-7B.i1-Q3_K_S.gguf) | i1-Q3_K_S | 3.3 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/DPOB-INMTOB-7B-i1-GGUF/resolve/main/DPOB-INMTOB-7B.i1-IQ3_S.gguf) | i1-IQ3_S | 3.3 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/DPOB-INMTOB-7B-i1-GGUF/resolve/main/DPOB-INMTOB-7B.i1-IQ3_M.gguf) | i1-IQ3_M | 3.4 | | +| [GGUF](https://huggingface.co/mradermacher/DPOB-INMTOB-7B-i1-GGUF/resolve/main/DPOB-INMTOB-7B.i1-Q3_K_M.gguf) | i1-Q3_K_M | 3.6 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/DPOB-INMTOB-7B-i1-GGUF/resolve/main/DPOB-INMTOB-7B.i1-Q3_K_L.gguf) | i1-Q3_K_L | 3.9 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/DPOB-INMTOB-7B-i1-GGUF/resolve/main/DPOB-INMTOB-7B.i1-IQ4_XS.gguf) | i1-IQ4_XS | 4.0 | | +| [GGUF](https://huggingface.co/mradermacher/DPOB-INMTOB-7B-i1-GGUF/resolve/main/DPOB-INMTOB-7B.i1-Q4_0_4_4.gguf) | i1-Q4_0_4_4 | 4.2 | fast on arm, low quality | +| [GGUF](https://huggingface.co/mradermacher/DPOB-INMTOB-7B-i1-GGUF/resolve/main/DPOB-INMTOB-7B.i1-Q4_0_4_8.gguf) | i1-Q4_0_4_8 | 4.2 | fast on arm+i8mm, low quality | +| [GGUF](https://huggingface.co/mradermacher/DPOB-INMTOB-7B-i1-GGUF/resolve/main/DPOB-INMTOB-7B.i1-Q4_0_8_8.gguf) | i1-Q4_0_8_8 | 4.2 | fast on arm+sve, low quality | +| [GGUF](https://huggingface.co/mradermacher/DPOB-INMTOB-7B-i1-GGUF/resolve/main/DPOB-INMTOB-7B.i1-Q4_0.gguf) | i1-Q4_0 | 4.2 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/DPOB-INMTOB-7B-i1-GGUF/resolve/main/DPOB-INMTOB-7B.i1-Q4_K_S.gguf) | i1-Q4_K_S | 4.2 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/DPOB-INMTOB-7B-i1-GGUF/resolve/main/DPOB-INMTOB-7B.i1-Q4_K_M.gguf) | i1-Q4_K_M | 4.5 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/DPOB-INMTOB-7B-i1-GGUF/resolve/main/DPOB-INMTOB-7B.i1-Q5_K_S.gguf) | i1-Q5_K_S | 5.1 | | +| [GGUF](https://huggingface.co/mradermacher/DPOB-INMTOB-7B-i1-GGUF/resolve/main/DPOB-INMTOB-7B.i1-Q5_K_M.gguf) | i1-Q5_K_M | 5.2 | | +| [GGUF](https://huggingface.co/mradermacher/DPOB-INMTOB-7B-i1-GGUF/resolve/main/DPOB-INMTOB-7B.i1-Q6_K.gguf) | i1-Q6_K | 6.0 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..16d3e57 --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e476c6c9dd5a055d182d12c0a39b601fc6b19d1df5715cb39932fa3541cec2e +size 4988157