From 47703cd15c1b75f43d58f34e1bd94fd9856fdb35 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Fri, 8 May 2026 16:05:47 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mradermacher/AceMath-RL-Nemotron-7B-i1-GGUF Source: Original Platform --- .gitattributes | 59 +++++++++++++++++ AceMath-RL-Nemotron-7B.i1-IQ1_M.gguf | 3 + AceMath-RL-Nemotron-7B.i1-IQ1_S.gguf | 3 + AceMath-RL-Nemotron-7B.i1-IQ2_M.gguf | 3 + AceMath-RL-Nemotron-7B.i1-IQ2_S.gguf | 3 + AceMath-RL-Nemotron-7B.i1-IQ2_XS.gguf | 3 + AceMath-RL-Nemotron-7B.i1-IQ2_XXS.gguf | 3 + AceMath-RL-Nemotron-7B.i1-IQ3_M.gguf | 3 + AceMath-RL-Nemotron-7B.i1-IQ3_S.gguf | 3 + AceMath-RL-Nemotron-7B.i1-IQ3_XS.gguf | 3 + AceMath-RL-Nemotron-7B.i1-IQ3_XXS.gguf | 3 + AceMath-RL-Nemotron-7B.i1-IQ4_NL.gguf | 3 + AceMath-RL-Nemotron-7B.i1-IQ4_XS.gguf | 3 + AceMath-RL-Nemotron-7B.i1-Q2_K.gguf | 3 + AceMath-RL-Nemotron-7B.i1-Q2_K_S.gguf | 3 + AceMath-RL-Nemotron-7B.i1-Q3_K_L.gguf | 3 + AceMath-RL-Nemotron-7B.i1-Q3_K_M.gguf | 3 + AceMath-RL-Nemotron-7B.i1-Q3_K_S.gguf | 3 + AceMath-RL-Nemotron-7B.i1-Q4_0.gguf | 3 + AceMath-RL-Nemotron-7B.i1-Q4_1.gguf | 3 + AceMath-RL-Nemotron-7B.i1-Q4_K_M.gguf | 3 + AceMath-RL-Nemotron-7B.i1-Q4_K_S.gguf | 3 + AceMath-RL-Nemotron-7B.i1-Q5_K_M.gguf | 3 + AceMath-RL-Nemotron-7B.i1-Q5_K_S.gguf | 3 + AceMath-RL-Nemotron-7B.i1-Q6_K.gguf | 3 + README.md | 89 ++++++++++++++++++++++++++ imatrix.dat | 3 + 27 files changed, 223 insertions(+) create mode 100644 .gitattributes create mode 100644 AceMath-RL-Nemotron-7B.i1-IQ1_M.gguf create mode 100644 AceMath-RL-Nemotron-7B.i1-IQ1_S.gguf create mode 100644 AceMath-RL-Nemotron-7B.i1-IQ2_M.gguf create mode 100644 AceMath-RL-Nemotron-7B.i1-IQ2_S.gguf create mode 100644 AceMath-RL-Nemotron-7B.i1-IQ2_XS.gguf create mode 100644 
AceMath-RL-Nemotron-7B.i1-IQ2_XXS.gguf create mode 100644 AceMath-RL-Nemotron-7B.i1-IQ3_M.gguf create mode 100644 AceMath-RL-Nemotron-7B.i1-IQ3_S.gguf create mode 100644 AceMath-RL-Nemotron-7B.i1-IQ3_XS.gguf create mode 100644 AceMath-RL-Nemotron-7B.i1-IQ3_XXS.gguf create mode 100644 AceMath-RL-Nemotron-7B.i1-IQ4_NL.gguf create mode 100644 AceMath-RL-Nemotron-7B.i1-IQ4_XS.gguf create mode 100644 AceMath-RL-Nemotron-7B.i1-Q2_K.gguf create mode 100644 AceMath-RL-Nemotron-7B.i1-Q2_K_S.gguf create mode 100644 AceMath-RL-Nemotron-7B.i1-Q3_K_L.gguf create mode 100644 AceMath-RL-Nemotron-7B.i1-Q3_K_M.gguf create mode 100644 AceMath-RL-Nemotron-7B.i1-Q3_K_S.gguf create mode 100644 AceMath-RL-Nemotron-7B.i1-Q4_0.gguf create mode 100644 AceMath-RL-Nemotron-7B.i1-Q4_1.gguf create mode 100644 AceMath-RL-Nemotron-7B.i1-Q4_K_M.gguf create mode 100644 AceMath-RL-Nemotron-7B.i1-Q4_K_S.gguf create mode 100644 AceMath-RL-Nemotron-7B.i1-Q5_K_M.gguf create mode 100644 AceMath-RL-Nemotron-7B.i1-Q5_K_S.gguf create mode 100644 AceMath-RL-Nemotron-7B.i1-Q6_K.gguf create mode 100644 README.md create mode 100644 imatrix.dat diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..e3b71c0 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,59 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs 
-text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +AceMath-RL-Nemotron-7B.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +AceMath-RL-Nemotron-7B.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +AceMath-RL-Nemotron-7B.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +AceMath-RL-Nemotron-7B.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +AceMath-RL-Nemotron-7B.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +AceMath-RL-Nemotron-7B.i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +AceMath-RL-Nemotron-7B.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +AceMath-RL-Nemotron-7B.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +AceMath-RL-Nemotron-7B.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +AceMath-RL-Nemotron-7B.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +AceMath-RL-Nemotron-7B.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +AceMath-RL-Nemotron-7B.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +AceMath-RL-Nemotron-7B.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +AceMath-RL-Nemotron-7B.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +AceMath-RL-Nemotron-7B.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text 
+AceMath-RL-Nemotron-7B.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +AceMath-RL-Nemotron-7B.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +AceMath-RL-Nemotron-7B.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +AceMath-RL-Nemotron-7B.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +AceMath-RL-Nemotron-7B.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +AceMath-RL-Nemotron-7B.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +AceMath-RL-Nemotron-7B.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +AceMath-RL-Nemotron-7B.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/AceMath-RL-Nemotron-7B.i1-IQ1_M.gguf b/AceMath-RL-Nemotron-7B.i1-IQ1_M.gguf new file mode 100644 index 0000000..9f90e0a --- /dev/null +++ b/AceMath-RL-Nemotron-7B.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96aac9b5e39e332e0247e85a3a9dc45a884b00e6f3990053d08a8a89ba29ba4a +size 2042196768 diff --git a/AceMath-RL-Nemotron-7B.i1-IQ1_S.gguf b/AceMath-RL-Nemotron-7B.i1-IQ1_S.gguf new file mode 100644 index 0000000..32d9e2e --- /dev/null +++ b/AceMath-RL-Nemotron-7B.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68840c5e705850123027b3472263b861e14dfe89e293d18359c9a587305b9ad3 +size 1903668000 diff --git a/AceMath-RL-Nemotron-7B.i1-IQ2_M.gguf b/AceMath-RL-Nemotron-7B.i1-IQ2_M.gguf new file mode 100644 index 0000000..a79d827 --- /dev/null +++ b/AceMath-RL-Nemotron-7B.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9e8185db26baab556b1fd891675178f5acb9c0a4516b3d9f19cafa1d6f5727f +size 2780343072 diff --git a/AceMath-RL-Nemotron-7B.i1-IQ2_S.gguf b/AceMath-RL-Nemotron-7B.i1-IQ2_S.gguf new file mode 100644 index 0000000..5c357e4 --- /dev/null +++ b/AceMath-RL-Nemotron-7B.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ddba921a5e7b4fe4d234747dadbcfd8171057f8daf663aa9b873173f100e8b1 +size 2595638048 diff --git 
a/AceMath-RL-Nemotron-7B.i1-IQ2_XS.gguf b/AceMath-RL-Nemotron-7B.i1-IQ2_XS.gguf new file mode 100644 index 0000000..b176a4a --- /dev/null +++ b/AceMath-RL-Nemotron-7B.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b216bcbaa38647b43a497c62d1ae742a3cf53e048c8a5704aef483cfbf7b983 +size 2469022496 diff --git a/AceMath-RL-Nemotron-7B.i1-IQ2_XXS.gguf b/AceMath-RL-Nemotron-7B.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..4b358cd --- /dev/null +++ b/AceMath-RL-Nemotron-7B.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:141da2011b1d2299af76616f4c1205bd56551ec370ea36630076aa8a57e14232 +size 2273078048 diff --git a/AceMath-RL-Nemotron-7B.i1-IQ3_M.gguf b/AceMath-RL-Nemotron-7B.i1-IQ3_M.gguf new file mode 100644 index 0000000..d8603b6 --- /dev/null +++ b/AceMath-RL-Nemotron-7B.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86f3cf95a0fb04d5376e2a7068b094bb5afc80e9155b9688079ab902aab4cca7 +size 3574012704 diff --git a/AceMath-RL-Nemotron-7B.i1-IQ3_S.gguf b/AceMath-RL-Nemotron-7B.i1-IQ3_S.gguf new file mode 100644 index 0000000..5b7f96b --- /dev/null +++ b/AceMath-RL-Nemotron-7B.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d8c345f6a0fbd850a8ff763cfae2dea2ada26e46607a6c95cc9ceeb3c5a73a4 +size 3499193120 diff --git a/AceMath-RL-Nemotron-7B.i1-IQ3_XS.gguf b/AceMath-RL-Nemotron-7B.i1-IQ3_XS.gguf new file mode 100644 index 0000000..f61ddb8 --- /dev/null +++ b/AceMath-RL-Nemotron-7B.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e55635e6b2c95c97bebdef3a80c89c37063e88bca7d835e538cb9e98393029a8 +size 3346256672 diff --git a/AceMath-RL-Nemotron-7B.i1-IQ3_XXS.gguf b/AceMath-RL-Nemotron-7B.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..b455ea2 --- /dev/null +++ b/AceMath-RL-Nemotron-7B.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:d55f36cb93ba72d045792bb1458e67077ac24bf9f1dfabc072e91a520e3fd701 +size 3114515232 diff --git a/AceMath-RL-Nemotron-7B.i1-IQ4_NL.gguf b/AceMath-RL-Nemotron-7B.i1-IQ4_NL.gguf new file mode 100644 index 0000000..c4ffad9 --- /dev/null +++ b/AceMath-RL-Nemotron-7B.i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41fa308aa387f98a4aa1a7dbf749ecb9af1ec187922a55710c4035acddefb3cb +size 4437814048 diff --git a/AceMath-RL-Nemotron-7B.i1-IQ4_XS.gguf b/AceMath-RL-Nemotron-7B.i1-IQ4_XS.gguf new file mode 100644 index 0000000..34f561f --- /dev/null +++ b/AceMath-RL-Nemotron-7B.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a63f9a1e8e2f906a47799532450b546733d8ab920ad577ea34976e94ed7424f5 +size 4218473248 diff --git a/AceMath-RL-Nemotron-7B.i1-Q2_K.gguf b/AceMath-RL-Nemotron-7B.i1-Q2_K.gguf new file mode 100644 index 0000000..130b0d8 --- /dev/null +++ b/AceMath-RL-Nemotron-7B.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:079b7a1cd00c0eaf9bd1081cd6e425bbd5a9d980f8e65f4366aafc057c955da5 +size 3015940896 diff --git a/AceMath-RL-Nemotron-7B.i1-Q2_K_S.gguf b/AceMath-RL-Nemotron-7B.i1-Q2_K_S.gguf new file mode 100644 index 0000000..1ea81b7 --- /dev/null +++ b/AceMath-RL-Nemotron-7B.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adf3847ddf02075cce5565d6c36c18cb46fd26bbdbc3b4153a1a96ea03e3c6c7 +size 2834074400 diff --git a/AceMath-RL-Nemotron-7B.i1-Q3_K_L.gguf b/AceMath-RL-Nemotron-7B.i1-Q3_K_L.gguf new file mode 100644 index 0000000..7d2e8bb --- /dev/null +++ b/AceMath-RL-Nemotron-7B.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb4016db66777310ec172391086e2aeb36fc723e59745d487d3b795ef3ea2ac8 +size 4088460064 diff --git a/AceMath-RL-Nemotron-7B.i1-Q3_K_M.gguf b/AceMath-RL-Nemotron-7B.i1-Q3_K_M.gguf new file mode 100644 index 0000000..fa99550 --- /dev/null +++ 
b/AceMath-RL-Nemotron-7B.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27050fd0eac3ae6b809a848fd67311941dd787b8a8999df61ef51247754c98aa +size 3808391968 diff --git a/AceMath-RL-Nemotron-7B.i1-Q3_K_S.gguf b/AceMath-RL-Nemotron-7B.i1-Q3_K_S.gguf new file mode 100644 index 0000000..c081cde --- /dev/null +++ b/AceMath-RL-Nemotron-7B.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88a9f0dfa4f172e109509190b1fe5435516568f9e4faa2359ce459a0931f485a +size 3492369184 diff --git a/AceMath-RL-Nemotron-7B.i1-Q4_0.gguf b/AceMath-RL-Nemotron-7B.i1-Q4_0.gguf new file mode 100644 index 0000000..bba975b --- /dev/null +++ b/AceMath-RL-Nemotron-7B.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ea5eba5e9c8743073143f11b3d15ff2622a4b9f13a00284c3f14fee157da4bf +size 4444121888 diff --git a/AceMath-RL-Nemotron-7B.i1-Q4_1.gguf b/AceMath-RL-Nemotron-7B.i1-Q4_1.gguf new file mode 100644 index 0000000..4961801 --- /dev/null +++ b/AceMath-RL-Nemotron-7B.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:966feb733e7f0136adee80ffe9469781220b2bd560198d3bb3b60f80049218b1 +size 4873284384 diff --git a/AceMath-RL-Nemotron-7B.i1-Q4_K_M.gguf b/AceMath-RL-Nemotron-7B.i1-Q4_K_M.gguf new file mode 100644 index 0000000..06992cd --- /dev/null +++ b/AceMath-RL-Nemotron-7B.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba004941db35a3d68f777acf163b3db232cda353023073a8f3599864976da35d +size 4683074336 diff --git a/AceMath-RL-Nemotron-7B.i1-Q4_K_S.gguf b/AceMath-RL-Nemotron-7B.i1-Q4_K_S.gguf new file mode 100644 index 0000000..a460d2b --- /dev/null +++ b/AceMath-RL-Nemotron-7B.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:886c6fdc9a34d8ad7ec1aa0af3e3c7f345de521f252725fb4e0975f9b6a0dbcc +size 4457769760 diff --git a/AceMath-RL-Nemotron-7B.i1-Q5_K_M.gguf 
b/AceMath-RL-Nemotron-7B.i1-Q5_K_M.gguf new file mode 100644 index 0000000..b8d785c --- /dev/null +++ b/AceMath-RL-Nemotron-7B.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd9341032440b4a527f72be8192d94b8dfa3c1f7b0d71129c1ba3db6aabb8d51 +size 5444832032 diff --git a/AceMath-RL-Nemotron-7B.i1-Q5_K_S.gguf b/AceMath-RL-Nemotron-7B.i1-Q5_K_S.gguf new file mode 100644 index 0000000..05310b0 --- /dev/null +++ b/AceMath-RL-Nemotron-7B.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15a3dcdf0601d1f628faad6ec0fd64364af7877d914c2f7d35345b897296e602 +size 5315177248 diff --git a/AceMath-RL-Nemotron-7B.i1-Q6_K.gguf b/AceMath-RL-Nemotron-7B.i1-Q6_K.gguf new file mode 100644 index 0000000..ca61e11 --- /dev/null +++ b/AceMath-RL-Nemotron-7B.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc84a0fdbc9aba8b68a7c5e3f886a602040eb2f123a9d3167aa46215c675ac2b +size 6254199584 diff --git a/README.md b/README.md new file mode 100644 index 0000000..db1f74a --- /dev/null +++ b/README.md @@ -0,0 +1,89 @@ +--- +base_model: nvidia/AceMath-RL-Nemotron-7B +language: +- en +library_name: transformers +license: other +license_link: https://www.nvidia.com/en-us/agreements/enterprise-software/nvidia-open-model-license/ +license_name: nvidia-open-model-license +mradermacher: + readme_rev: 1 +quantized_by: mradermacher +tags: +- nvidia +- reasoning +- math +- reinforcement learning +- pytorch +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/nvidia/AceMath-RL-Nemotron-7B + + + +***For a convenient overview and download list, visit our [model page for this model](https://hf.tst.eu/model#AceMath-RL-Nemotron-7B-i1-GGUF).*** + +static quants are available at https://huggingface.co/mradermacher/AceMath-RL-Nemotron-7B-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's 
+READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/AceMath-RL-Nemotron-7B-i1-GGUF/resolve/main/AceMath-RL-Nemotron-7B.i1-IQ1_S.gguf) | i1-IQ1_S | 2.0 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/AceMath-RL-Nemotron-7B-i1-GGUF/resolve/main/AceMath-RL-Nemotron-7B.i1-IQ1_M.gguf) | i1-IQ1_M | 2.1 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/AceMath-RL-Nemotron-7B-i1-GGUF/resolve/main/AceMath-RL-Nemotron-7B.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 2.4 | | +| [GGUF](https://huggingface.co/mradermacher/AceMath-RL-Nemotron-7B-i1-GGUF/resolve/main/AceMath-RL-Nemotron-7B.i1-IQ2_XS.gguf) | i1-IQ2_XS | 2.6 | | +| [GGUF](https://huggingface.co/mradermacher/AceMath-RL-Nemotron-7B-i1-GGUF/resolve/main/AceMath-RL-Nemotron-7B.i1-IQ2_S.gguf) | i1-IQ2_S | 2.7 | | +| [GGUF](https://huggingface.co/mradermacher/AceMath-RL-Nemotron-7B-i1-GGUF/resolve/main/AceMath-RL-Nemotron-7B.i1-IQ2_M.gguf) | i1-IQ2_M | 2.9 | | +| [GGUF](https://huggingface.co/mradermacher/AceMath-RL-Nemotron-7B-i1-GGUF/resolve/main/AceMath-RL-Nemotron-7B.i1-Q2_K_S.gguf) | i1-Q2_K_S | 2.9 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/AceMath-RL-Nemotron-7B-i1-GGUF/resolve/main/AceMath-RL-Nemotron-7B.i1-Q2_K.gguf) | i1-Q2_K | 3.1 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/AceMath-RL-Nemotron-7B-i1-GGUF/resolve/main/AceMath-RL-Nemotron-7B.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 3.2 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/AceMath-RL-Nemotron-7B-i1-GGUF/resolve/main/AceMath-RL-Nemotron-7B.i1-IQ3_XS.gguf) | i1-IQ3_XS | 3.4 | | +| 
[GGUF](https://huggingface.co/mradermacher/AceMath-RL-Nemotron-7B-i1-GGUF/resolve/main/AceMath-RL-Nemotron-7B.i1-Q3_K_S.gguf) | i1-Q3_K_S | 3.6 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/AceMath-RL-Nemotron-7B-i1-GGUF/resolve/main/AceMath-RL-Nemotron-7B.i1-IQ3_S.gguf) | i1-IQ3_S | 3.6 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/AceMath-RL-Nemotron-7B-i1-GGUF/resolve/main/AceMath-RL-Nemotron-7B.i1-IQ3_M.gguf) | i1-IQ3_M | 3.7 | | +| [GGUF](https://huggingface.co/mradermacher/AceMath-RL-Nemotron-7B-i1-GGUF/resolve/main/AceMath-RL-Nemotron-7B.i1-Q3_K_M.gguf) | i1-Q3_K_M | 3.9 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/AceMath-RL-Nemotron-7B-i1-GGUF/resolve/main/AceMath-RL-Nemotron-7B.i1-Q3_K_L.gguf) | i1-Q3_K_L | 4.2 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/AceMath-RL-Nemotron-7B-i1-GGUF/resolve/main/AceMath-RL-Nemotron-7B.i1-IQ4_XS.gguf) | i1-IQ4_XS | 4.3 | | +| [GGUF](https://huggingface.co/mradermacher/AceMath-RL-Nemotron-7B-i1-GGUF/resolve/main/AceMath-RL-Nemotron-7B.i1-IQ4_NL.gguf) | i1-IQ4_NL | 4.5 | prefer IQ4_XS | +| [GGUF](https://huggingface.co/mradermacher/AceMath-RL-Nemotron-7B-i1-GGUF/resolve/main/AceMath-RL-Nemotron-7B.i1-Q4_0.gguf) | i1-Q4_0 | 4.5 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/AceMath-RL-Nemotron-7B-i1-GGUF/resolve/main/AceMath-RL-Nemotron-7B.i1-Q4_K_S.gguf) | i1-Q4_K_S | 4.6 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/AceMath-RL-Nemotron-7B-i1-GGUF/resolve/main/AceMath-RL-Nemotron-7B.i1-Q4_K_M.gguf) | i1-Q4_K_M | 4.8 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/AceMath-RL-Nemotron-7B-i1-GGUF/resolve/main/AceMath-RL-Nemotron-7B.i1-Q4_1.gguf) | i1-Q4_1 | 5.0 | | +| [GGUF](https://huggingface.co/mradermacher/AceMath-RL-Nemotron-7B-i1-GGUF/resolve/main/AceMath-RL-Nemotron-7B.i1-Q5_K_S.gguf) | i1-Q5_K_S | 5.4 | | +| 
[GGUF](https://huggingface.co/mradermacher/AceMath-RL-Nemotron-7B-i1-GGUF/resolve/main/AceMath-RL-Nemotron-7B.i1-Q5_K_M.gguf) | i1-Q5_K_M | 5.5 | | +| [GGUF](https://huggingface.co/mradermacher/AceMath-RL-Nemotron-7B-i1-GGUF/resolve/main/AceMath-RL-Nemotron-7B.i1-Q6_K.gguf) | i1-Q6_K | 6.4 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for answers to +questions you might have, or to request that another model be quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and for providing upgrades to my workstation, which enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..9f4e36e --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8534588d5c462c6918ddd1b8e53d9836ead88d1113f9eed1c1967d2cf611a1d9 +size 4536665