commit 6cb363b53e6e160e9d4a428fde1155da411e98d6 Author: ModelHub XC Date: Wed Apr 22 11:50:37 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/DoublePotato-Mistral-Nemo-13B-i1-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..38dada5 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text 
+DoublePotato-Mistral-Nemo-13B.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +DoublePotato-Mistral-Nemo-13B.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +DoublePotato-Mistral-Nemo-13B.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +DoublePotato-Mistral-Nemo-13B.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +DoublePotato-Mistral-Nemo-13B.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +DoublePotato-Mistral-Nemo-13B.i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +DoublePotato-Mistral-Nemo-13B.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +DoublePotato-Mistral-Nemo-13B.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +DoublePotato-Mistral-Nemo-13B.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +DoublePotato-Mistral-Nemo-13B.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +DoublePotato-Mistral-Nemo-13B.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +DoublePotato-Mistral-Nemo-13B.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +DoublePotato-Mistral-Nemo-13B.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +DoublePotato-Mistral-Nemo-13B.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +DoublePotato-Mistral-Nemo-13B.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +DoublePotato-Mistral-Nemo-13B.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +DoublePotato-Mistral-Nemo-13B.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +DoublePotato-Mistral-Nemo-13B.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +DoublePotato-Mistral-Nemo-13B.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +DoublePotato-Mistral-Nemo-13B.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +DoublePotato-Mistral-Nemo-13B.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +DoublePotato-Mistral-Nemo-13B.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +DoublePotato-Mistral-Nemo-13B.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +DoublePotato-Mistral-Nemo-13B.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text diff --git 
a/DoublePotato-Mistral-Nemo-13B.i1-IQ1_M.gguf b/DoublePotato-Mistral-Nemo-13B.i1-IQ1_M.gguf new file mode 100644 index 0000000..ce279a7 --- /dev/null +++ b/DoublePotato-Mistral-Nemo-13B.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dc2fa9fa54790dad125d9e3d3910ba80cdb81c300567d38bc09973b64209393 +size 3470827456 diff --git a/DoublePotato-Mistral-Nemo-13B.i1-IQ1_S.gguf b/DoublePotato-Mistral-Nemo-13B.i1-IQ1_S.gguf new file mode 100644 index 0000000..df4bd3b --- /dev/null +++ b/DoublePotato-Mistral-Nemo-13B.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2346e01f601c588ef52fc89eafdb002732739d3556360a4b547fed694699aa4 +size 3225313216 diff --git a/DoublePotato-Mistral-Nemo-13B.i1-IQ2_M.gguf b/DoublePotato-Mistral-Nemo-13B.i1-IQ2_M.gguf new file mode 100644 index 0000000..ac9a090 --- /dev/null +++ b/DoublePotato-Mistral-Nemo-13B.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26c21962f55eb0fcc61cc3edb3b3b9068cccf6b340edc9822152f4599b8b0c93 +size 4798750656 diff --git a/DoublePotato-Mistral-Nemo-13B.i1-IQ2_S.gguf b/DoublePotato-Mistral-Nemo-13B.i1-IQ2_S.gguf new file mode 100644 index 0000000..bfc21ea --- /dev/null +++ b/DoublePotato-Mistral-Nemo-13B.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7cba8615b659dda4916a836c10f6764e783bdae860765e164ce429b3bffebcb +size 4471398336 diff --git a/DoublePotato-Mistral-Nemo-13B.i1-IQ2_XS.gguf b/DoublePotato-Mistral-Nemo-13B.i1-IQ2_XS.gguf new file mode 100644 index 0000000..6a6316c --- /dev/null +++ b/DoublePotato-Mistral-Nemo-13B.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:705710e1add9a6339da1edac26793e05f3eb2495ed0f237a12db592102acfeaf +size 4236206016 diff --git a/DoublePotato-Mistral-Nemo-13B.i1-IQ2_XXS.gguf b/DoublePotato-Mistral-Nemo-13B.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..469da1d --- /dev/null +++ 
b/DoublePotato-Mistral-Nemo-13B.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f23a1f385e08373be0cfa3756260218c858019aef76c3d18b9e0238872264a00 +size 3880017856 diff --git a/DoublePotato-Mistral-Nemo-13B.i1-IQ3_M.gguf b/DoublePotato-Mistral-Nemo-13B.i1-IQ3_M.gguf new file mode 100644 index 0000000..022dc83 --- /dev/null +++ b/DoublePotato-Mistral-Nemo-13B.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6eb094e6755a94364fbfc16342f45e8cdf091bdd9941c577db3a683ce688ca7 +size 6204907456 diff --git a/DoublePotato-Mistral-Nemo-13B.i1-IQ3_S.gguf b/DoublePotato-Mistral-Nemo-13B.i1-IQ3_S.gguf new file mode 100644 index 0000000..ce48485 --- /dev/null +++ b/DoublePotato-Mistral-Nemo-13B.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69cddf7470b1abd3a9786cd8aaf3f261d1cef406b90f9f6a91f489953ca3a88e +size 6033612736 diff --git a/DoublePotato-Mistral-Nemo-13B.i1-IQ3_XS.gguf b/DoublePotato-Mistral-Nemo-13B.i1-IQ3_XS.gguf new file mode 100644 index 0000000..a595e14 --- /dev/null +++ b/DoublePotato-Mistral-Nemo-13B.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d964a9779db4d87a21e4d228947c168df90afd39f44f72736930c3fbdaa4f0f3 +size 5752463296 diff --git a/DoublePotato-Mistral-Nemo-13B.i1-IQ3_XXS.gguf b/DoublePotato-Mistral-Nemo-13B.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..b6d308a --- /dev/null +++ b/DoublePotato-Mistral-Nemo-13B.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95d256f4e623bbf60068c72cc56b6b01c8f914e9dc8eb7940d58e4f0962087d6 +size 5364162496 diff --git a/DoublePotato-Mistral-Nemo-13B.i1-IQ4_NL.gguf b/DoublePotato-Mistral-Nemo-13B.i1-IQ4_NL.gguf new file mode 100644 index 0000000..0b55bb1 --- /dev/null +++ b/DoublePotato-Mistral-Nemo-13B.i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:b1521d888b7529e073e258630af68f435638443be8f9e9d9bd4143cdaed51e9f +size 7714119616 diff --git a/DoublePotato-Mistral-Nemo-13B.i1-IQ4_XS.gguf b/DoublePotato-Mistral-Nemo-13B.i1-IQ4_XS.gguf new file mode 100644 index 0000000..884a932 --- /dev/null +++ b/DoublePotato-Mistral-Nemo-13B.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:783510aef3b08bd931e0e1a0ce727763302b3cc9dc4d0b89097f09ae1c8ef8d4 +size 7325491136 diff --git a/DoublePotato-Mistral-Nemo-13B.i1-Q2_K.gguf b/DoublePotato-Mistral-Nemo-13B.i1-Q2_K.gguf new file mode 100644 index 0000000..94b80cf --- /dev/null +++ b/DoublePotato-Mistral-Nemo-13B.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a8b8cd64eea34b2f9b0e8886a3de0f031985695e4c71c1d6082c2e42a8207d3 +size 5192294336 diff --git a/DoublePotato-Mistral-Nemo-13B.i1-Q2_K_S.gguf b/DoublePotato-Mistral-Nemo-13B.i1-Q2_K_S.gguf new file mode 100644 index 0000000..2c705b0 --- /dev/null +++ b/DoublePotato-Mistral-Nemo-13B.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0d3705e108fbf5aa7c915d2061853b42d70ba0d8ce2eef6c76559bf9a700238 +size 4856586176 diff --git a/DoublePotato-Mistral-Nemo-13B.i1-Q3_K_L.gguf b/DoublePotato-Mistral-Nemo-13B.i1-Q3_K_L.gguf new file mode 100644 index 0000000..e6ea114 --- /dev/null +++ b/DoublePotato-Mistral-Nemo-13B.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b95f60eb647e6d47b0e4e71050e0ffdbd7d3fb8157018f0b778e1d80d00483c0 +size 7132979136 diff --git a/DoublePotato-Mistral-Nemo-13B.i1-Q3_K_M.gguf b/DoublePotato-Mistral-Nemo-13B.i1-Q3_K_M.gguf new file mode 100644 index 0000000..51b5b42 --- /dev/null +++ b/DoublePotato-Mistral-Nemo-13B.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5853dd8153e6088b90f9a7317630188baad19e2f24bc88a52fec782a445af982 +size 6604758976 diff --git a/DoublePotato-Mistral-Nemo-13B.i1-Q3_K_S.gguf 
b/DoublePotato-Mistral-Nemo-13B.i1-Q3_K_S.gguf new file mode 100644 index 0000000..b8bba76 --- /dev/null +++ b/DoublePotato-Mistral-Nemo-13B.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c42e84820d6872f3dc2f80896b3591cccb019039316f81ad0b2240904cf3484 +size 6002974656 diff --git a/DoublePotato-Mistral-Nemo-13B.i1-Q4_0.gguf b/DoublePotato-Mistral-Nemo-13B.i1-Q4_0.gguf new file mode 100644 index 0000000..ed30217 --- /dev/null +++ b/DoublePotato-Mistral-Nemo-13B.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a40df3fd072168adf184996aadb26d6cbf742bc03cd38e192a23b6f8405be37f +size 7708221376 diff --git a/DoublePotato-Mistral-Nemo-13B.i1-Q4_1.gguf b/DoublePotato-Mistral-Nemo-13B.i1-Q4_1.gguf new file mode 100644 index 0000000..4396502 --- /dev/null +++ b/DoublePotato-Mistral-Nemo-13B.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26e974bab59ce2cd7f00239eb0d03cea35b378ca80e60ecfec86e48fd58642e7 +size 8476958656 diff --git a/DoublePotato-Mistral-Nemo-13B.i1-Q4_K_M.gguf b/DoublePotato-Mistral-Nemo-13B.i1-Q4_K_M.gguf new file mode 100644 index 0000000..94e6372 --- /dev/null +++ b/DoublePotato-Mistral-Nemo-13B.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aaab120f5fd4a39c4384d6b477dd38730861b00794e816f88602e074f6c62915 +size 8131338176 diff --git a/DoublePotato-Mistral-Nemo-13B.i1-Q4_K_S.gguf b/DoublePotato-Mistral-Nemo-13B.i1-Q4_K_S.gguf new file mode 100644 index 0000000..eb612d5 --- /dev/null +++ b/DoublePotato-Mistral-Nemo-13B.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a59d45418200dbd5836ee5c85c1a1bfc50b7399d297ba1fab6a6445c4606b1ed +size 7733780416 diff --git a/DoublePotato-Mistral-Nemo-13B.i1-Q5_K_M.gguf b/DoublePotato-Mistral-Nemo-13B.i1-Q5_K_M.gguf new file mode 100644 index 0000000..e98865f --- /dev/null +++ b/DoublePotato-Mistral-Nemo-13B.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ 
+version https://git-lfs.github.com/spec/v1 +oid sha256:9780cf3917eb81423c9c6f8bcc236d71c31a473f68a9407e39c1099e3bdd5080 +size 9498419136 diff --git a/DoublePotato-Mistral-Nemo-13B.i1-Q5_K_S.gguf b/DoublePotato-Mistral-Nemo-13B.i1-Q5_K_S.gguf new file mode 100644 index 0000000..3a38d44 --- /dev/null +++ b/DoublePotato-Mistral-Nemo-13B.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e7d2d72a4876fe02de1e7127ccd23462011bc1d190c603cd163c6a60c81fba8 +size 9268633536 diff --git a/DoublePotato-Mistral-Nemo-13B.i1-Q6_K.gguf b/DoublePotato-Mistral-Nemo-13B.i1-Q6_K.gguf new file mode 100644 index 0000000..0905c37 --- /dev/null +++ b/DoublePotato-Mistral-Nemo-13B.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b533d3df7426de70c5f35435d2a616333dfe5a0212a77c6d1d0ed268300fb9ed +size 10950942656 diff --git a/README.md b/README.md new file mode 100644 index 0000000..ccf6ff2 --- /dev/null +++ b/README.md @@ -0,0 +1,78 @@ +--- +base_model: nbeerbower/DoublePotato-Mistral-Nemo-13B +language: +- en +library_name: transformers +quantized_by: mradermacher +tags: +- mergekit +- merge +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/nbeerbower/DoublePotato-Mistral-Nemo-13B + + +static quants are available at https://huggingface.co/mradermacher/DoublePotato-Mistral-Nemo-13B-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. 
IQ-quants are often preferable over similarly sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/DoublePotato-Mistral-Nemo-13B-i1-GGUF/resolve/main/DoublePotato-Mistral-Nemo-13B.i1-IQ1_S.gguf) | i1-IQ1_S | 3.3 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/DoublePotato-Mistral-Nemo-13B-i1-GGUF/resolve/main/DoublePotato-Mistral-Nemo-13B.i1-IQ1_M.gguf) | i1-IQ1_M | 3.6 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/DoublePotato-Mistral-Nemo-13B-i1-GGUF/resolve/main/DoublePotato-Mistral-Nemo-13B.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 4.0 | | +| [GGUF](https://huggingface.co/mradermacher/DoublePotato-Mistral-Nemo-13B-i1-GGUF/resolve/main/DoublePotato-Mistral-Nemo-13B.i1-IQ2_XS.gguf) | i1-IQ2_XS | 4.3 | | +| [GGUF](https://huggingface.co/mradermacher/DoublePotato-Mistral-Nemo-13B-i1-GGUF/resolve/main/DoublePotato-Mistral-Nemo-13B.i1-IQ2_S.gguf) | i1-IQ2_S | 4.6 | | +| [GGUF](https://huggingface.co/mradermacher/DoublePotato-Mistral-Nemo-13B-i1-GGUF/resolve/main/DoublePotato-Mistral-Nemo-13B.i1-IQ2_M.gguf) | i1-IQ2_M | 4.9 | | +| [GGUF](https://huggingface.co/mradermacher/DoublePotato-Mistral-Nemo-13B-i1-GGUF/resolve/main/DoublePotato-Mistral-Nemo-13B.i1-Q2_K_S.gguf) | i1-Q2_K_S | 5.0 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/DoublePotato-Mistral-Nemo-13B-i1-GGUF/resolve/main/DoublePotato-Mistral-Nemo-13B.i1-Q2_K.gguf) | i1-Q2_K | 5.3 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/DoublePotato-Mistral-Nemo-13B-i1-GGUF/resolve/main/DoublePotato-Mistral-Nemo-13B.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 5.5 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/DoublePotato-Mistral-Nemo-13B-i1-GGUF/resolve/main/DoublePotato-Mistral-Nemo-13B.i1-IQ3_XS.gguf) | i1-IQ3_XS | 5.9 | | +| 
[GGUF](https://huggingface.co/mradermacher/DoublePotato-Mistral-Nemo-13B-i1-GGUF/resolve/main/DoublePotato-Mistral-Nemo-13B.i1-Q3_K_S.gguf) | i1-Q3_K_S | 6.1 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/DoublePotato-Mistral-Nemo-13B-i1-GGUF/resolve/main/DoublePotato-Mistral-Nemo-13B.i1-IQ3_S.gguf) | i1-IQ3_S | 6.1 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/DoublePotato-Mistral-Nemo-13B-i1-GGUF/resolve/main/DoublePotato-Mistral-Nemo-13B.i1-IQ3_M.gguf) | i1-IQ3_M | 6.3 | | +| [GGUF](https://huggingface.co/mradermacher/DoublePotato-Mistral-Nemo-13B-i1-GGUF/resolve/main/DoublePotato-Mistral-Nemo-13B.i1-Q3_K_M.gguf) | i1-Q3_K_M | 6.7 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/DoublePotato-Mistral-Nemo-13B-i1-GGUF/resolve/main/DoublePotato-Mistral-Nemo-13B.i1-Q3_K_L.gguf) | i1-Q3_K_L | 7.2 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/DoublePotato-Mistral-Nemo-13B-i1-GGUF/resolve/main/DoublePotato-Mistral-Nemo-13B.i1-IQ4_XS.gguf) | i1-IQ4_XS | 7.4 | | +| [GGUF](https://huggingface.co/mradermacher/DoublePotato-Mistral-Nemo-13B-i1-GGUF/resolve/main/DoublePotato-Mistral-Nemo-13B.i1-Q4_0.gguf) | i1-Q4_0 | 7.8 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/DoublePotato-Mistral-Nemo-13B-i1-GGUF/resolve/main/DoublePotato-Mistral-Nemo-13B.i1-IQ4_NL.gguf) | i1-IQ4_NL | 7.8 | prefer IQ4_XS | +| [GGUF](https://huggingface.co/mradermacher/DoublePotato-Mistral-Nemo-13B-i1-GGUF/resolve/main/DoublePotato-Mistral-Nemo-13B.i1-Q4_K_S.gguf) | i1-Q4_K_S | 7.8 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/DoublePotato-Mistral-Nemo-13B-i1-GGUF/resolve/main/DoublePotato-Mistral-Nemo-13B.i1-Q4_K_M.gguf) | i1-Q4_K_M | 8.2 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/DoublePotato-Mistral-Nemo-13B-i1-GGUF/resolve/main/DoublePotato-Mistral-Nemo-13B.i1-Q4_1.gguf) | i1-Q4_1 | 8.6 | | +| 
[GGUF](https://huggingface.co/mradermacher/DoublePotato-Mistral-Nemo-13B-i1-GGUF/resolve/main/DoublePotato-Mistral-Nemo-13B.i1-Q5_K_S.gguf) | i1-Q5_K_S | 9.4 | | +| [GGUF](https://huggingface.co/mradermacher/DoublePotato-Mistral-Nemo-13B-i1-GGUF/resolve/main/DoublePotato-Mistral-Nemo-13B.i1-Q5_K_M.gguf) | i1-Q5_K_M | 9.6 | | +| [GGUF](https://huggingface.co/mradermacher/DoublePotato-Mistral-Nemo-13B-i1-GGUF/resolve/main/DoublePotato-Mistral-Nemo-13B.i1-Q6_K.gguf) | i1-Q6_K | 11.1 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..aa11daf --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c48c4ea5eb5ab10c1b91e4129cd6e36b5105098c86aa14876eab7ff50287b7b8 +size 7759849