commit a134882e8d91fb9fdd7d8f105c5f7593d3ad092f Author: ModelHub XC Date: Thu Apr 30 22:05:23 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/Mantella-Skyrim-Llama-3-8B-i1-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..e54bcd6 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +Mantella-Skyrim-Llama-3-8B.i1-Q2_K.gguf 
filter=lfs diff=lfs merge=lfs -text +Mantella-Skyrim-Llama-3-8B.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +Mantella-Skyrim-Llama-3-8B.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Mantella-Skyrim-Llama-3-8B.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Mantella-Skyrim-Llama-3-8B.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Mantella-Skyrim-Llama-3-8B.i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +Mantella-Skyrim-Llama-3-8B.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Mantella-Skyrim-Llama-3-8B.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +Mantella-Skyrim-Llama-3-8B.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Mantella-Skyrim-Llama-3-8B.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +Mantella-Skyrim-Llama-3-8B.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +Mantella-Skyrim-Llama-3-8B.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +Mantella-Skyrim-Llama-3-8B.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Mantella-Skyrim-Llama-3-8B.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Mantella-Skyrim-Llama-3-8B.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Mantella-Skyrim-Llama-3-8B.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +Mantella-Skyrim-Llama-3-8B.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Mantella-Skyrim-Llama-3-8B.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +Mantella-Skyrim-Llama-3-8B.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +Mantella-Skyrim-Llama-3-8B.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +Mantella-Skyrim-Llama-3-8B.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Mantella-Skyrim-Llama-3-8B.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +Mantella-Skyrim-Llama-3-8B.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +Mantella-Skyrim-Llama-3-8B.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/Mantella-Skyrim-Llama-3-8B.i1-IQ1_M.gguf b/Mantella-Skyrim-Llama-3-8B.i1-IQ1_M.gguf new file mode 100644 index 0000000..fe28dec --- /dev/null 
+++ b/Mantella-Skyrim-Llama-3-8B.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdcf268c367f28fa2f24d5530a9fb9228a3c1177cd26d409ae1a3e3b18ab902a +size 2161972992 diff --git a/Mantella-Skyrim-Llama-3-8B.i1-IQ1_S.gguf b/Mantella-Skyrim-Llama-3-8B.i1-IQ1_S.gguf new file mode 100644 index 0000000..1245ef5 --- /dev/null +++ b/Mantella-Skyrim-Llama-3-8B.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:619309076b94fc47b743a906da9e7c5bc370bf460e13159370784ef4411123d9 +size 2019628800 diff --git a/Mantella-Skyrim-Llama-3-8B.i1-IQ2_M.gguf b/Mantella-Skyrim-Llama-3-8B.i1-IQ2_M.gguf new file mode 100644 index 0000000..08f2808 --- /dev/null +++ b/Mantella-Skyrim-Llama-3-8B.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a66a6f2e5a7438583e3ec36d6f06f7d7aa56f8be0013746541a7e795210c26c8 +size 2948282112 diff --git a/Mantella-Skyrim-Llama-3-8B.i1-IQ2_S.gguf b/Mantella-Skyrim-Llama-3-8B.i1-IQ2_S.gguf new file mode 100644 index 0000000..c3d9a10 --- /dev/null +++ b/Mantella-Skyrim-Llama-3-8B.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5dc419212c2bce7b38ee1e8f9782e4a75cd76c1352e97b37b778a61931a39928 +size 2758489856 diff --git a/Mantella-Skyrim-Llama-3-8B.i1-IQ2_XS.gguf b/Mantella-Skyrim-Llama-3-8B.i1-IQ2_XS.gguf new file mode 100644 index 0000000..be7b1b9 --- /dev/null +++ b/Mantella-Skyrim-Llama-3-8B.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd18a984c6a22df5b3b6492e17683101a6dda5b45db35d8ae03d382c2854fed2 +size 2605782784 diff --git a/Mantella-Skyrim-Llama-3-8B.i1-IQ2_XXS.gguf b/Mantella-Skyrim-Llama-3-8B.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..f725f38 --- /dev/null +++ b/Mantella-Skyrim-Llama-3-8B.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8a9762d276cdd6a4316981c03102789443b2fb66ac84db172b545f005f29fc9 +size 2399213312 diff 
--git a/Mantella-Skyrim-Llama-3-8B.i1-IQ3_M.gguf b/Mantella-Skyrim-Llama-3-8B.i1-IQ3_M.gguf new file mode 100644 index 0000000..ec2ccf1 --- /dev/null +++ b/Mantella-Skyrim-Llama-3-8B.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d6c572a9d765de900685582baf4fc8db553d9b7a831777e7ea4383f98306588 +size 3784824576 diff --git a/Mantella-Skyrim-Llama-3-8B.i1-IQ3_S.gguf b/Mantella-Skyrim-Llama-3-8B.i1-IQ3_S.gguf new file mode 100644 index 0000000..35465e8 --- /dev/null +++ b/Mantella-Skyrim-Llama-3-8B.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:297a755f3a39ae7e3855249d31436f0ea5b7de5b621faa599774a4d5409a0996 +size 3682326272 diff --git a/Mantella-Skyrim-Llama-3-8B.i1-IQ3_XS.gguf b/Mantella-Skyrim-Llama-3-8B.i1-IQ3_XS.gguf new file mode 100644 index 0000000..7185e38 --- /dev/null +++ b/Mantella-Skyrim-Llama-3-8B.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dd8f80633c8a5db4e3083755a066a62b3ff716c4787dcf441e0c3da574b45dd +size 3518748416 diff --git a/Mantella-Skyrim-Llama-3-8B.i1-IQ3_XXS.gguf b/Mantella-Skyrim-Llama-3-8B.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..b1a98b9 --- /dev/null +++ b/Mantella-Skyrim-Llama-3-8B.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0aa0dc00faa37dcf46946e69e8854b29e87e8c127d6131b948319764a7624b11 +size 3274913536 diff --git a/Mantella-Skyrim-Llama-3-8B.i1-IQ4_NL.gguf b/Mantella-Skyrim-Llama-3-8B.i1-IQ4_NL.gguf new file mode 100644 index 0000000..e042932 --- /dev/null +++ b/Mantella-Skyrim-Llama-3-8B.i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf1dfbc25748c74bcbc295b9cc3c6bce59fb7b967ea7e7114b29d0503638fb2a +size 4677990144 diff --git a/Mantella-Skyrim-Llama-3-8B.i1-IQ4_XS.gguf b/Mantella-Skyrim-Llama-3-8B.i1-IQ4_XS.gguf new file mode 100644 index 0000000..5db99b9 --- /dev/null +++ b/Mantella-Skyrim-Llama-3-8B.i1-IQ4_XS.gguf @@ -0,0 
+1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b27c3b223df60ccde0aae51be8d59d0c41d6c43483e529a3441b4c864c55255 +size 4447663872 diff --git a/Mantella-Skyrim-Llama-3-8B.i1-Q2_K.gguf b/Mantella-Skyrim-Llama-3-8B.i1-Q2_K.gguf new file mode 100644 index 0000000..df81d40 --- /dev/null +++ b/Mantella-Skyrim-Llama-3-8B.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c03a2b99b517393b5dda213a86fd0775148feb7bade83408a55ffd0717e0e6db +size 3179132672 diff --git a/Mantella-Skyrim-Llama-3-8B.i1-Q2_K_S.gguf b/Mantella-Skyrim-Llama-3-8B.i1-Q2_K_S.gguf new file mode 100644 index 0000000..fdac5b4 --- /dev/null +++ b/Mantella-Skyrim-Llama-3-8B.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c226289c069b995c63f45016d18aad2fa8ebe03d74930786efc57ea048d7557e +size 2988816128 diff --git a/Mantella-Skyrim-Llama-3-8B.i1-Q3_K_L.gguf b/Mantella-Skyrim-Llama-3-8B.i1-Q3_K_L.gguf new file mode 100644 index 0000000..6529c54 --- /dev/null +++ b/Mantella-Skyrim-Llama-3-8B.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db51c1ad9b9bd3f1c947543c57ea5bd8f8093128fd1e1a9b6b6b5a200794d5e3 +size 4321957632 diff --git a/Mantella-Skyrim-Llama-3-8B.i1-Q3_K_M.gguf b/Mantella-Skyrim-Llama-3-8B.i1-Q3_K_M.gguf new file mode 100644 index 0000000..1f79580 --- /dev/null +++ b/Mantella-Skyrim-Llama-3-8B.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:798c5cc41a30608fdffd3490209cd2cd510afb6edb32ab6d0feec012e8978d24 +size 4018919168 diff --git a/Mantella-Skyrim-Llama-3-8B.i1-Q3_K_S.gguf b/Mantella-Skyrim-Llama-3-8B.i1-Q3_K_S.gguf new file mode 100644 index 0000000..c3513d4 --- /dev/null +++ b/Mantella-Skyrim-Llama-3-8B.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c1edb05d83bcc89614db5f2666d894a783d43ee07c06031ffb13d8966046fe5 +size 3664500480 diff --git a/Mantella-Skyrim-Llama-3-8B.i1-Q4_0.gguf 
b/Mantella-Skyrim-Llama-3-8B.i1-Q4_0.gguf new file mode 100644 index 0000000..94d226c --- /dev/null +++ b/Mantella-Skyrim-Llama-3-8B.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b5f58074eb3bb47cac3b572a6544c3a3e3d92472199f6fe609ee8cf0a26b6b2 +size 4675892992 diff --git a/Mantella-Skyrim-Llama-3-8B.i1-Q4_1.gguf b/Mantella-Skyrim-Llama-3-8B.i1-Q4_1.gguf new file mode 100644 index 0000000..16432e0 --- /dev/null +++ b/Mantella-Skyrim-Llama-3-8B.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:410f2c41cc53531a420bee927d8ad2eb6e6baf1be50434a44e182354d11a55c9 +size 5130254080 diff --git a/Mantella-Skyrim-Llama-3-8B.i1-Q4_K_M.gguf b/Mantella-Skyrim-Llama-3-8B.i1-Q4_K_M.gguf new file mode 100644 index 0000000..33f925b --- /dev/null +++ b/Mantella-Skyrim-Llama-3-8B.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7f255f9b8c43c92586fe13a86dfac59dfdf595dce6e2b078296bc70dce5f2a0 +size 4920735488 diff --git a/Mantella-Skyrim-Llama-3-8B.i1-Q4_K_S.gguf b/Mantella-Skyrim-Llama-3-8B.i1-Q4_K_S.gguf new file mode 100644 index 0000000..a2b179d --- /dev/null +++ b/Mantella-Skyrim-Llama-3-8B.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5100c2b9e339afa7b00edc492b69bd6924c89ca84d337e1d51fad09e60e8366f +size 4692670208 diff --git a/Mantella-Skyrim-Llama-3-8B.i1-Q5_K_M.gguf b/Mantella-Skyrim-Llama-3-8B.i1-Q5_K_M.gguf new file mode 100644 index 0000000..c0042d2 --- /dev/null +++ b/Mantella-Skyrim-Llama-3-8B.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c6137550ae17eba40ee558c4abc13bf97139bd2312655ba7893e5bd59634cce +size 5732988672 diff --git a/Mantella-Skyrim-Llama-3-8B.i1-Q5_K_S.gguf b/Mantella-Skyrim-Llama-3-8B.i1-Q5_K_S.gguf new file mode 100644 index 0000000..f165e16 --- /dev/null +++ b/Mantella-Skyrim-Llama-3-8B.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:3e39203740b2f2219e3120ddbed79ef0d61d956d9dc8ca752086c8b0690b0993 +size 5599295232 diff --git a/Mantella-Skyrim-Llama-3-8B.i1-Q6_K.gguf b/Mantella-Skyrim-Llama-3-8B.i1-Q6_K.gguf new file mode 100644 index 0000000..a22533d --- /dev/null +++ b/Mantella-Skyrim-Llama-3-8B.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:648452e7fbddbf073eb624df25add48fad8363bbec7c9eaa05cb0088e5a3a5a3 +size 6596007680 diff --git a/README.md b/README.md new file mode 100644 index 0000000..112ec40 --- /dev/null +++ b/README.md @@ -0,0 +1,82 @@ +--- +base_model: art-from-the-machine/Mantella-Skyrim-Llama-3-8B +language: +- en +library_name: transformers +license: apache-2.0 +quantized_by: mradermacher +tags: +- text-generation-inference +- transformers +- unsloth +- llama +- gguf +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/art-from-the-machine/Mantella-Skyrim-Llama-3-8B + + +static quants are available at https://huggingface.co/mradermacher/Mantella-Skyrim-Llama-3-8B-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. 
IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/Mantella-Skyrim-Llama-3-8B-i1-GGUF/resolve/main/Mantella-Skyrim-Llama-3-8B.i1-IQ1_S.gguf) | i1-IQ1_S | 2.1 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/Mantella-Skyrim-Llama-3-8B-i1-GGUF/resolve/main/Mantella-Skyrim-Llama-3-8B.i1-IQ1_M.gguf) | i1-IQ1_M | 2.3 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/Mantella-Skyrim-Llama-3-8B-i1-GGUF/resolve/main/Mantella-Skyrim-Llama-3-8B.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 2.5 | | +| [GGUF](https://huggingface.co/mradermacher/Mantella-Skyrim-Llama-3-8B-i1-GGUF/resolve/main/Mantella-Skyrim-Llama-3-8B.i1-IQ2_XS.gguf) | i1-IQ2_XS | 2.7 | | +| [GGUF](https://huggingface.co/mradermacher/Mantella-Skyrim-Llama-3-8B-i1-GGUF/resolve/main/Mantella-Skyrim-Llama-3-8B.i1-IQ2_S.gguf) | i1-IQ2_S | 2.9 | | +| [GGUF](https://huggingface.co/mradermacher/Mantella-Skyrim-Llama-3-8B-i1-GGUF/resolve/main/Mantella-Skyrim-Llama-3-8B.i1-IQ2_M.gguf) | i1-IQ2_M | 3.0 | | +| [GGUF](https://huggingface.co/mradermacher/Mantella-Skyrim-Llama-3-8B-i1-GGUF/resolve/main/Mantella-Skyrim-Llama-3-8B.i1-Q2_K_S.gguf) | i1-Q2_K_S | 3.1 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/Mantella-Skyrim-Llama-3-8B-i1-GGUF/resolve/main/Mantella-Skyrim-Llama-3-8B.i1-Q2_K.gguf) | i1-Q2_K | 3.3 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/Mantella-Skyrim-Llama-3-8B-i1-GGUF/resolve/main/Mantella-Skyrim-Llama-3-8B.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 3.4 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/Mantella-Skyrim-Llama-3-8B-i1-GGUF/resolve/main/Mantella-Skyrim-Llama-3-8B.i1-IQ3_XS.gguf) | i1-IQ3_XS | 3.6 | | +| [GGUF](https://huggingface.co/mradermacher/Mantella-Skyrim-Llama-3-8B-i1-GGUF/resolve/main/Mantella-Skyrim-Llama-3-8B.i1-Q3_K_S.gguf) | i1-Q3_K_S | 3.8 | IQ3_XS probably better | +| 
[GGUF](https://huggingface.co/mradermacher/Mantella-Skyrim-Llama-3-8B-i1-GGUF/resolve/main/Mantella-Skyrim-Llama-3-8B.i1-IQ3_S.gguf) | i1-IQ3_S | 3.8 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/Mantella-Skyrim-Llama-3-8B-i1-GGUF/resolve/main/Mantella-Skyrim-Llama-3-8B.i1-IQ3_M.gguf) | i1-IQ3_M | 3.9 | | +| [GGUF](https://huggingface.co/mradermacher/Mantella-Skyrim-Llama-3-8B-i1-GGUF/resolve/main/Mantella-Skyrim-Llama-3-8B.i1-Q3_K_M.gguf) | i1-Q3_K_M | 4.1 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/Mantella-Skyrim-Llama-3-8B-i1-GGUF/resolve/main/Mantella-Skyrim-Llama-3-8B.i1-Q3_K_L.gguf) | i1-Q3_K_L | 4.4 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/Mantella-Skyrim-Llama-3-8B-i1-GGUF/resolve/main/Mantella-Skyrim-Llama-3-8B.i1-IQ4_XS.gguf) | i1-IQ4_XS | 4.5 | | +| [GGUF](https://huggingface.co/mradermacher/Mantella-Skyrim-Llama-3-8B-i1-GGUF/resolve/main/Mantella-Skyrim-Llama-3-8B.i1-Q4_0.gguf) | i1-Q4_0 | 4.8 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/Mantella-Skyrim-Llama-3-8B-i1-GGUF/resolve/main/Mantella-Skyrim-Llama-3-8B.i1-IQ4_NL.gguf) | i1-IQ4_NL | 4.8 | prefer IQ4_XS | +| [GGUF](https://huggingface.co/mradermacher/Mantella-Skyrim-Llama-3-8B-i1-GGUF/resolve/main/Mantella-Skyrim-Llama-3-8B.i1-Q4_K_S.gguf) | i1-Q4_K_S | 4.8 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/Mantella-Skyrim-Llama-3-8B-i1-GGUF/resolve/main/Mantella-Skyrim-Llama-3-8B.i1-Q4_K_M.gguf) | i1-Q4_K_M | 5.0 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/Mantella-Skyrim-Llama-3-8B-i1-GGUF/resolve/main/Mantella-Skyrim-Llama-3-8B.i1-Q4_1.gguf) | i1-Q4_1 | 5.2 | | +| [GGUF](https://huggingface.co/mradermacher/Mantella-Skyrim-Llama-3-8B-i1-GGUF/resolve/main/Mantella-Skyrim-Llama-3-8B.i1-Q5_K_S.gguf) | i1-Q5_K_S | 5.7 | | +| 
[GGUF](https://huggingface.co/mradermacher/Mantella-Skyrim-Llama-3-8B-i1-GGUF/resolve/main/Mantella-Skyrim-Llama-3-8B.i1-Q5_K_M.gguf) | i1-Q5_K_M | 5.8 | | +| [GGUF](https://huggingface.co/mradermacher/Mantella-Skyrim-Llama-3-8B-i1-GGUF/resolve/main/Mantella-Skyrim-Llama-3-8B.i1-Q6_K.gguf) | i1-Q6_K | 6.7 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for answers to +questions you might have, or to request that another model be quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..a493f49 --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fef851b6bb2f7e75787529d918bd8fd249b12636450024526c6445b92ad2f146 +size 4988157