From 3d1fdaa52024b8c7b54c8b65b8454d8325e06a65 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Mon, 8 Jun 2026 00:59:17 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mradermacher/An4-7Bv2-i1-GGUF Source: Original Platform --- .gitattributes | 60 +++++++++++++++++++++++++++++ An4-7Bv2.i1-IQ1_M.gguf | 3 ++ An4-7Bv2.i1-IQ1_S.gguf | 3 ++ An4-7Bv2.i1-IQ2_M.gguf | 3 ++ An4-7Bv2.i1-IQ2_S.gguf | 3 ++ An4-7Bv2.i1-IQ2_XS.gguf | 3 ++ An4-7Bv2.i1-IQ2_XXS.gguf | 3 ++ An4-7Bv2.i1-IQ3_M.gguf | 3 ++ An4-7Bv2.i1-IQ3_S.gguf | 3 ++ An4-7Bv2.i1-IQ3_XS.gguf | 3 ++ An4-7Bv2.i1-IQ3_XXS.gguf | 3 ++ An4-7Bv2.i1-IQ4_NL.gguf | 3 ++ An4-7Bv2.i1-IQ4_XS.gguf | 3 ++ An4-7Bv2.i1-Q2_K.gguf | 3 ++ An4-7Bv2.i1-Q2_K_S.gguf | 3 ++ An4-7Bv2.i1-Q3_K_L.gguf | 3 ++ An4-7Bv2.i1-Q3_K_M.gguf | 3 ++ An4-7Bv2.i1-Q3_K_S.gguf | 3 ++ An4-7Bv2.i1-Q4_0.gguf | 3 ++ An4-7Bv2.i1-Q4_1.gguf | 3 ++ An4-7Bv2.i1-Q4_K_M.gguf | 3 ++ An4-7Bv2.i1-Q4_K_S.gguf | 3 ++ An4-7Bv2.i1-Q5_K_M.gguf | 3 ++ An4-7Bv2.i1-Q5_K_S.gguf | 3 ++ An4-7Bv2.i1-Q6_K.gguf | 3 ++ README.md | 83 ++++++++++++++++++++++++++++++++++++++++ imatrix.dat | 3 ++ 27 files changed, 218 insertions(+) create mode 100644 .gitattributes create mode 100644 An4-7Bv2.i1-IQ1_M.gguf create mode 100644 An4-7Bv2.i1-IQ1_S.gguf create mode 100644 An4-7Bv2.i1-IQ2_M.gguf create mode 100644 An4-7Bv2.i1-IQ2_S.gguf create mode 100644 An4-7Bv2.i1-IQ2_XS.gguf create mode 100644 An4-7Bv2.i1-IQ2_XXS.gguf create mode 100644 An4-7Bv2.i1-IQ3_M.gguf create mode 100644 An4-7Bv2.i1-IQ3_S.gguf create mode 100644 An4-7Bv2.i1-IQ3_XS.gguf create mode 100644 An4-7Bv2.i1-IQ3_XXS.gguf create mode 100644 An4-7Bv2.i1-IQ4_NL.gguf create mode 100644 An4-7Bv2.i1-IQ4_XS.gguf create mode 100644 An4-7Bv2.i1-Q2_K.gguf create mode 100644 An4-7Bv2.i1-Q2_K_S.gguf create mode 100644 An4-7Bv2.i1-Q3_K_L.gguf create mode 100644 An4-7Bv2.i1-Q3_K_M.gguf create mode 100644 An4-7Bv2.i1-Q3_K_S.gguf create mode 100644 An4-7Bv2.i1-Q4_0.gguf create mode 100644 An4-7Bv2.i1-Q4_1.gguf create mode 100644 An4-7Bv2.i1-Q4_K_M.gguf create mode 100644 An4-7Bv2.i1-Q4_K_S.gguf create mode 100644 An4-7Bv2.i1-Q5_K_M.gguf create mode 100644 An4-7Bv2.i1-Q5_K_S.gguf create mode 100644 An4-7Bv2.i1-Q6_K.gguf create mode 100644 README.md create mode 100644 imatrix.dat diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..8794466 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +An4-7Bv2.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +An4-7Bv2.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +An4-7Bv2.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +An4-7Bv2.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +An4-7Bv2.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +An4-7Bv2.i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +An4-7Bv2.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +An4-7Bv2.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +An4-7Bv2.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +An4-7Bv2.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +An4-7Bv2.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +An4-7Bv2.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +An4-7Bv2.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +An4-7Bv2.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +An4-7Bv2.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +An4-7Bv2.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +An4-7Bv2.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +An4-7Bv2.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +An4-7Bv2.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +An4-7Bv2.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +An4-7Bv2.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +An4-7Bv2.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +An4-7Bv2.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +An4-7Bv2.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/An4-7Bv2.i1-IQ1_M.gguf b/An4-7Bv2.i1-IQ1_M.gguf new file mode 100644 index 0000000..c3cc4b9 --- /dev/null +++ b/An4-7Bv2.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8b0bf3e90e77f958b3ca443f3278b5290656d86d2f1985898cf41cd0f228a9c +size 1754447168 diff --git a/An4-7Bv2.i1-IQ1_S.gguf b/An4-7Bv2.i1-IQ1_S.gguf new file mode 100644 index 0000000..e4c88db --- /dev/null +++ b/An4-7Bv2.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd13cc9770ac591a69b9bb1ba58bcf5acb7bb09129735d04120a3326aed059ff +size 1612102976 diff --git a/An4-7Bv2.i1-IQ2_M.gguf b/An4-7Bv2.i1-IQ2_M.gguf new file mode 100644 index 0000000..3129e73 --- /dev/null +++ b/An4-7Bv2.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc531ca2d4ccd5cac3bc0c2e492cb3bde2d8468ab2438f79d3d2ca1a72ae02ca +size 2500713792 diff --git a/An4-7Bv2.i1-IQ2_S.gguf b/An4-7Bv2.i1-IQ2_S.gguf new file mode 100644 index 0000000..9de4279 --- /dev/null +++ b/An4-7Bv2.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5340c7c2f868426e3cd40802adaa2cda8af9b4a0d4a94cbcc27c94cb76c8fa84 +size 2310921536 diff --git a/An4-7Bv2.i1-IQ2_XS.gguf b/An4-7Bv2.i1-IQ2_XS.gguf new file mode 100644 index 0000000..b56c337 --- /dev/null +++ b/An4-7Bv2.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bb46d20ff6bc52ccb553bbad68f55e2b31d5c804806c75318d76acce35ca870 +size 2198256960 diff --git a/An4-7Bv2.i1-IQ2_XXS.gguf b/An4-7Bv2.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..918215c --- /dev/null +++ b/An4-7Bv2.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:110507a65b736ccc216e40a1bb9a6a1a8556cbcfd343ef304ee1b343aef2048d +size 1991687488 diff --git a/An4-7Bv2.i1-IQ3_M.gguf b/An4-7Bv2.i1-IQ3_M.gguf new file mode 100644 index 0000000..dd4891f --- /dev/null +++ b/An4-7Bv2.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94b1f2673372e5aba9494518de3794c94ddc9d7260beee4b0323e29fff05631c +size 3284892992 diff --git a/An4-7Bv2.i1-IQ3_S.gguf b/An4-7Bv2.i1-IQ3_S.gguf new file mode 100644 index 0000000..416456d --- /dev/null +++ b/An4-7Bv2.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30961b03b8f1eb38734ce16c310d13946556d2ac8a4c55f0c7b61ec6f9209a88 +size 3182394688 diff --git a/An4-7Bv2.i1-IQ3_XS.gguf b/An4-7Bv2.i1-IQ3_XS.gguf new file mode 100644 index 0000000..d0bad68 --- /dev/null +++ b/An4-7Bv2.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d03f547add0af6c07ddab52f32caf9d79438f7a2a5a777a2a53856df95ce1c0 +size 3018816832 diff --git a/An4-7Bv2.i1-IQ3_XXS.gguf b/An4-7Bv2.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..866646d --- /dev/null +++ b/An4-7Bv2.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a09285b9014411b3d0907d43c3f07ee6fde6c67c3bb2ee14875d3bb11fdecbdc +size 2827345216 diff --git a/An4-7Bv2.i1-IQ4_NL.gguf b/An4-7Bv2.i1-IQ4_NL.gguf new file mode 100644 index 0000000..aee2176 --- /dev/null +++ b/An4-7Bv2.i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:178117c4a280fcca5ab53324eb3be0e8cc65e19410d5c5c65e6eb2cba1fe0c10 +size 4125695296 diff --git a/An4-7Bv2.i1-IQ4_XS.gguf b/An4-7Bv2.i1-IQ4_XS.gguf new file mode 100644 index 0000000..7c32aa0 --- /dev/null +++ b/An4-7Bv2.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56ae718cf9f964964b020e591b055fbd5138185efcdb8a52d922180099544cc9 +size 3907689792 diff --git a/An4-7Bv2.i1-Q2_K.gguf b/An4-7Bv2.i1-Q2_K.gguf new file mode 100644 index 0000000..5959a3d --- /dev/null +++ b/An4-7Bv2.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a11e97c3660379f625bd92c70fb514257c405bf989056d4736e94813c0b79779 +size 2719243584 diff --git a/An4-7Bv2.i1-Q2_K_S.gguf b/An4-7Bv2.i1-Q2_K_S.gguf new file mode 100644 index 0000000..7536e6c --- /dev/null +++ b/An4-7Bv2.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:126c3d99ca5b5ba48e495b83eb21fd242155ccd634431a4c0601a35b6ddcaef3 +size 2528927040 diff --git a/An4-7Bv2.i1-Q3_K_L.gguf b/An4-7Bv2.i1-Q3_K_L.gguf new file mode 100644 index 0000000..6136fff --- /dev/null +++ b/An4-7Bv2.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4141b84c28a4c50b6aac5baec24423f1b52e1f6224bb0cafe737f5867fdce78 +size 3822026048 diff --git a/An4-7Bv2.i1-Q3_K_M.gguf b/An4-7Bv2.i1-Q3_K_M.gguf new file mode 100644 index 0000000..a57dfd9 --- /dev/null +++ b/An4-7Bv2.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be4afc52d44f3bd1c192c3969dbea904d5c66a4a54ea40571f3762e6cea1d170 +size 3518987584 diff --git a/An4-7Bv2.i1-Q3_K_S.gguf b/An4-7Bv2.i1-Q3_K_S.gguf new file mode 100644 index 0000000..c6412b7 --- /dev/null +++ b/An4-7Bv2.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fef925a825b6197b54e78a68c5b3e11383ca71de04b2ce835709426b09789b0 +size 3164568896 diff --git a/An4-7Bv2.i1-Q4_0.gguf b/An4-7Bv2.i1-Q4_0.gguf new file mode 100644 index 0000000..9f863b1 --- /dev/null +++ b/An4-7Bv2.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3155f6432505c48934b69bdadab5a1222321d3614622f48db4401805e41f19d2 +size 4123598144 diff --git a/An4-7Bv2.i1-Q4_1.gguf b/An4-7Bv2.i1-Q4_1.gguf new file mode 100644 index 0000000..4c4e4fd --- /dev/null +++ b/An4-7Bv2.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f72b89ea717076d93d7638590b45af8e725320ba96610254c43d4ea5484bef8 +size 4553317696 diff --git a/An4-7Bv2.i1-Q4_K_M.gguf b/An4-7Bv2.i1-Q4_K_M.gguf new file mode 100644 index 0000000..b4a9222 --- /dev/null +++ b/An4-7Bv2.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9ca36a390eafcfdaa973fbfbe6f62235d9df67ca5f1827bf20c6ec54a284130 +size 4368440640 diff --git a/An4-7Bv2.i1-Q4_K_S.gguf b/An4-7Bv2.i1-Q4_K_S.gguf new file mode 100644 index 0000000..5d62498 --- /dev/null +++ b/An4-7Bv2.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe2a4e75566cf3b979e09f240a914b032cf858c29c685d7d17b6b93614ef8cd1 +size 4140375360 diff --git a/An4-7Bv2.i1-Q5_K_M.gguf b/An4-7Bv2.i1-Q5_K_M.gguf new file mode 100644 index 0000000..abc9e0d --- /dev/null +++ b/An4-7Bv2.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd3107953c20467779e67d5f78891c5b732341a02c8da5b261c5c94c1ebdc6c2 +size 5131410752 diff --git a/An4-7Bv2.i1-Q5_K_S.gguf b/An4-7Bv2.i1-Q5_K_S.gguf new file mode 100644 index 0000000..29ae4b3 --- /dev/null +++ b/An4-7Bv2.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ada9b3b7ba51abf2a20fe2b3c7c45b21701b6907e3a9ae63bfe12309cdef63d0 +size 4997717312 diff --git a/An4-7Bv2.i1-Q6_K.gguf b/An4-7Bv2.i1-Q6_K.gguf new file mode 100644 index 0000000..3c8a064 --- /dev/null +++ b/An4-7Bv2.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7a0bb92dd37d3adb2d36444cd15b115e92b9f49af52f2a2381a455df94da399 +size 5942066496 diff --git a/README.md b/README.md new file mode 100644 index 0000000..c6114e3 --- /dev/null +++ b/README.md @@ -0,0 +1,83 @@ +--- +base_model: Smuggling1710/An4-7Bv2 +language: +- en +library_name: transformers +license: apache-2.0 +quantized_by: mradermacher +tags: +- text-generation-inference +- transformers +- unsloth +- mistral +- trl +- sft +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/Smuggling1710/An4-7Bv2 + + +static quants are available at https://huggingface.co/mradermacher/An4-7Bv2-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/An4-7Bv2-i1-GGUF/resolve/main/An4-7Bv2.i1-IQ1_S.gguf) | i1-IQ1_S | 1.7 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/An4-7Bv2-i1-GGUF/resolve/main/An4-7Bv2.i1-IQ1_M.gguf) | i1-IQ1_M | 1.9 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/An4-7Bv2-i1-GGUF/resolve/main/An4-7Bv2.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 2.1 | | +| [GGUF](https://huggingface.co/mradermacher/An4-7Bv2-i1-GGUF/resolve/main/An4-7Bv2.i1-IQ2_XS.gguf) | i1-IQ2_XS | 2.3 | | +| [GGUF](https://huggingface.co/mradermacher/An4-7Bv2-i1-GGUF/resolve/main/An4-7Bv2.i1-IQ2_S.gguf) | i1-IQ2_S | 2.4 | | +| [GGUF](https://huggingface.co/mradermacher/An4-7Bv2-i1-GGUF/resolve/main/An4-7Bv2.i1-IQ2_M.gguf) | i1-IQ2_M | 2.6 | | +| [GGUF](https://huggingface.co/mradermacher/An4-7Bv2-i1-GGUF/resolve/main/An4-7Bv2.i1-Q2_K_S.gguf) | i1-Q2_K_S | 2.6 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/An4-7Bv2-i1-GGUF/resolve/main/An4-7Bv2.i1-Q2_K.gguf) | i1-Q2_K | 2.8 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/An4-7Bv2-i1-GGUF/resolve/main/An4-7Bv2.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 2.9 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/An4-7Bv2-i1-GGUF/resolve/main/An4-7Bv2.i1-IQ3_XS.gguf) | i1-IQ3_XS | 3.1 | | +| [GGUF](https://huggingface.co/mradermacher/An4-7Bv2-i1-GGUF/resolve/main/An4-7Bv2.i1-Q3_K_S.gguf) | i1-Q3_K_S | 3.3 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/An4-7Bv2-i1-GGUF/resolve/main/An4-7Bv2.i1-IQ3_S.gguf) | i1-IQ3_S | 3.3 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/An4-7Bv2-i1-GGUF/resolve/main/An4-7Bv2.i1-IQ3_M.gguf) | i1-IQ3_M | 3.4 | | +| [GGUF](https://huggingface.co/mradermacher/An4-7Bv2-i1-GGUF/resolve/main/An4-7Bv2.i1-Q3_K_M.gguf) | i1-Q3_K_M | 3.6 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/An4-7Bv2-i1-GGUF/resolve/main/An4-7Bv2.i1-Q3_K_L.gguf) | i1-Q3_K_L | 3.9 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/An4-7Bv2-i1-GGUF/resolve/main/An4-7Bv2.i1-IQ4_XS.gguf) | i1-IQ4_XS | 4.0 | | +| [GGUF](https://huggingface.co/mradermacher/An4-7Bv2-i1-GGUF/resolve/main/An4-7Bv2.i1-Q4_0.gguf) | i1-Q4_0 | 4.2 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/An4-7Bv2-i1-GGUF/resolve/main/An4-7Bv2.i1-IQ4_NL.gguf) | i1-IQ4_NL | 4.2 | prefer IQ4_XS | +| [GGUF](https://huggingface.co/mradermacher/An4-7Bv2-i1-GGUF/resolve/main/An4-7Bv2.i1-Q4_K_S.gguf) | i1-Q4_K_S | 4.2 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/An4-7Bv2-i1-GGUF/resolve/main/An4-7Bv2.i1-Q4_K_M.gguf) | i1-Q4_K_M | 4.5 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/An4-7Bv2-i1-GGUF/resolve/main/An4-7Bv2.i1-Q4_1.gguf) | i1-Q4_1 | 4.7 | | +| [GGUF](https://huggingface.co/mradermacher/An4-7Bv2-i1-GGUF/resolve/main/An4-7Bv2.i1-Q5_K_S.gguf) | i1-Q5_K_S | 5.1 | | +| [GGUF](https://huggingface.co/mradermacher/An4-7Bv2-i1-GGUF/resolve/main/An4-7Bv2.i1-Q5_K_M.gguf) | i1-Q5_K_M | 5.2 | | +| [GGUF](https://huggingface.co/mradermacher/An4-7Bv2-i1-GGUF/resolve/main/An4-7Bv2.i1-Q6_K.gguf) | i1-Q6_K | 6.0 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..21987cb --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1b9a68e31b85a1a024ae596d1ff3d49a209ab41ef0abf6e79a0e6e8dc74f651 +size 4988157