commit f8ab566490267874bae32bd57b9b3de7a7f453e2 Author: ModelHub XC Date: Thu Jun 18 07:24:17 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: mradermacher/llama3-8b-SlimHermes-i1-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..2fafb37 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +llama3-8b-SlimHermes.i1-Q2_K.gguf filter=lfs 
diff=lfs merge=lfs -text +llama3-8b-SlimHermes.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +llama3-8b-SlimHermes.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +llama3-8b-SlimHermes.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +llama3-8b-SlimHermes.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +llama3-8b-SlimHermes.i1-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +llama3-8b-SlimHermes.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +llama3-8b-SlimHermes.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +llama3-8b-SlimHermes.i1-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +llama3-8b-SlimHermes.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +llama3-8b-SlimHermes.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +llama3-8b-SlimHermes.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +llama3-8b-SlimHermes.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +llama3-8b-SlimHermes.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +llama3-8b-SlimHermes.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +llama3-8b-SlimHermes.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +llama3-8b-SlimHermes.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +llama3-8b-SlimHermes.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +llama3-8b-SlimHermes.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +llama3-8b-SlimHermes.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +llama3-8b-SlimHermes.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +llama3-8b-SlimHermes.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +llama3-8b-SlimHermes.i1-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +llama3-8b-SlimHermes.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..d1da46d --- /dev/null +++ b/README.md @@ -0,0 +1,78 @@ +--- +base_model: g-ronimo/llama3-8b-SlimHermes +language: +- en +library_name: transformers +license: other +license_name: llama3 +quantized_by: mradermacher +tags: [] +--- +## 
About + + + + + + +Weighted/imatrix quants of https://huggingface.co/g-ronimo/llama3-8b-SlimHermes + + +Static quants are available at https://huggingface.co/mradermacher/llama3-8b-SlimHermes-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including how to concatenate multi-part files. + +## Provided Quants + +(Sorted by size, not necessarily by quality. IQ-quants are often preferable to similarly sized non-IQ quants.) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/llama3-8b-SlimHermes-i1-GGUF/resolve/main/llama3-8b-SlimHermes.i1-IQ1_S.gguf) | i1-IQ1_S | 2.1 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/llama3-8b-SlimHermes-i1-GGUF/resolve/main/llama3-8b-SlimHermes.i1-IQ1_M.gguf) | i1-IQ1_M | 2.3 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/llama3-8b-SlimHermes-i1-GGUF/resolve/main/llama3-8b-SlimHermes.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 2.5 | | +| [GGUF](https://huggingface.co/mradermacher/llama3-8b-SlimHermes-i1-GGUF/resolve/main/llama3-8b-SlimHermes.i1-IQ2_XS.gguf) | i1-IQ2_XS | 2.7 | | +| [GGUF](https://huggingface.co/mradermacher/llama3-8b-SlimHermes-i1-GGUF/resolve/main/llama3-8b-SlimHermes.i1-IQ2_S.gguf) | i1-IQ2_S | 2.9 | | +| [GGUF](https://huggingface.co/mradermacher/llama3-8b-SlimHermes-i1-GGUF/resolve/main/llama3-8b-SlimHermes.i1-IQ2_M.gguf) | i1-IQ2_M | 3.0 | | +| [GGUF](https://huggingface.co/mradermacher/llama3-8b-SlimHermes-i1-GGUF/resolve/main/llama3-8b-SlimHermes.i1-Q2_K_S.gguf) | i1-Q2_K_S | 3.1 | very low quality | +| [GGUF](https://huggingface.co/mradermacher/llama3-8b-SlimHermes-i1-GGUF/resolve/main/llama3-8b-SlimHermes.i1-Q2_K.gguf) | i1-Q2_K | 3.3 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/llama3-8b-SlimHermes-i1-GGUF/resolve/main/llama3-8b-SlimHermes.i1-IQ3_XXS.gguf) | 
i1-IQ3_XXS | 3.4 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/llama3-8b-SlimHermes-i1-GGUF/resolve/main/llama3-8b-SlimHermes.i1-IQ3_XS.gguf) | i1-IQ3_XS | 3.6 | | +| [GGUF](https://huggingface.co/mradermacher/llama3-8b-SlimHermes-i1-GGUF/resolve/main/llama3-8b-SlimHermes.i1-Q3_K_S.gguf) | i1-Q3_K_S | 3.8 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/llama3-8b-SlimHermes-i1-GGUF/resolve/main/llama3-8b-SlimHermes.i1-IQ3_S.gguf) | i1-IQ3_S | 3.8 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/llama3-8b-SlimHermes-i1-GGUF/resolve/main/llama3-8b-SlimHermes.i1-IQ3_M.gguf) | i1-IQ3_M | 3.9 | | +| [GGUF](https://huggingface.co/mradermacher/llama3-8b-SlimHermes-i1-GGUF/resolve/main/llama3-8b-SlimHermes.i1-Q3_K_M.gguf) | i1-Q3_K_M | 4.1 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/llama3-8b-SlimHermes-i1-GGUF/resolve/main/llama3-8b-SlimHermes.i1-Q3_K_L.gguf) | i1-Q3_K_L | 4.4 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/llama3-8b-SlimHermes-i1-GGUF/resolve/main/llama3-8b-SlimHermes.i1-IQ4_XS.gguf) | i1-IQ4_XS | 4.5 | | +| [GGUF](https://huggingface.co/mradermacher/llama3-8b-SlimHermes-i1-GGUF/resolve/main/llama3-8b-SlimHermes.i1-Q4_0.gguf) | i1-Q4_0 | 4.8 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/llama3-8b-SlimHermes-i1-GGUF/resolve/main/llama3-8b-SlimHermes.i1-IQ4_NL.gguf) | i1-IQ4_NL | 4.8 | prefer IQ4_XS | +| [GGUF](https://huggingface.co/mradermacher/llama3-8b-SlimHermes-i1-GGUF/resolve/main/llama3-8b-SlimHermes.i1-Q4_K_S.gguf) | i1-Q4_K_S | 4.8 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/llama3-8b-SlimHermes-i1-GGUF/resolve/main/llama3-8b-SlimHermes.i1-Q4_K_M.gguf) | i1-Q4_K_M | 5.0 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/llama3-8b-SlimHermes-i1-GGUF/resolve/main/llama3-8b-SlimHermes.i1-Q4_1.gguf) | i1-Q4_1 | 5.2 | | +| 
[GGUF](https://huggingface.co/mradermacher/llama3-8b-SlimHermes-i1-GGUF/resolve/main/llama3-8b-SlimHermes.i1-Q5_K_S.gguf) | i1-Q5_K_S | 5.7 | | +| [GGUF](https://huggingface.co/mradermacher/llama3-8b-SlimHermes-i1-GGUF/resolve/main/llama3-8b-SlimHermes.i1-Q5_K_M.gguf) | i1-Q5_K_M | 5.8 | | +| [GGUF](https://huggingface.co/mradermacher/llama3-8b-SlimHermes-i1-GGUF/resolve/main/llama3-8b-SlimHermes.i1-Q6_K.gguf) | i1-Q6_K | 6.7 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for answers to +questions you might have, or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and for providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. 
+ + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..9ddac29 --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8a79055fd5e05f9310303db44bd805e1bb4d2a99c5cf72994e565344f69eb83 +size 4988157 diff --git a/llama3-8b-SlimHermes.i1-IQ1_M.gguf b/llama3-8b-SlimHermes.i1-IQ1_M.gguf new file mode 100644 index 0000000..afa3d25 --- /dev/null +++ b/llama3-8b-SlimHermes.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:990038a99c9058ef7181a615bda8cdb3a78f90a25e19062efbb25cbbf124baa3 +size 2161972288 diff --git a/llama3-8b-SlimHermes.i1-IQ1_S.gguf b/llama3-8b-SlimHermes.i1-IQ1_S.gguf new file mode 100644 index 0000000..ab00b86 --- /dev/null +++ b/llama3-8b-SlimHermes.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb81f5e05429f55bd018632d3f8ef3e965f6130b6625adefdc94df37faf16d1d +size 2019628096 diff --git a/llama3-8b-SlimHermes.i1-IQ2_M.gguf b/llama3-8b-SlimHermes.i1-IQ2_M.gguf new file mode 100644 index 0000000..8a4e872 --- /dev/null +++ b/llama3-8b-SlimHermes.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6572489e0d500ed5ba52030221446adedf21dfe010275b0391cf3d909d667916 +size 2948281408 diff --git a/llama3-8b-SlimHermes.i1-IQ2_S.gguf b/llama3-8b-SlimHermes.i1-IQ2_S.gguf new file mode 100644 index 0000000..7984725 --- /dev/null +++ b/llama3-8b-SlimHermes.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8855f67ba479c461bbb025f4166f32df991265e52b21cff186f2589c4b0dc81 +size 2758489152 diff --git a/llama3-8b-SlimHermes.i1-IQ2_XS.gguf b/llama3-8b-SlimHermes.i1-IQ2_XS.gguf new file mode 100644 index 0000000..e14806c --- /dev/null +++ b/llama3-8b-SlimHermes.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4334226060516962ca8166c5ee7cd284c0abc1b4e1e47ea15612f882339c963b +size 2605782080 diff --git 
a/llama3-8b-SlimHermes.i1-IQ2_XXS.gguf b/llama3-8b-SlimHermes.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..c20cde2 --- /dev/null +++ b/llama3-8b-SlimHermes.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d266baa0976c52623b8341d79a41d3b20205d9168551148e84dd00d479d7d5a +size 2399212608 diff --git a/llama3-8b-SlimHermes.i1-IQ3_M.gguf b/llama3-8b-SlimHermes.i1-IQ3_M.gguf new file mode 100644 index 0000000..59d26ca --- /dev/null +++ b/llama3-8b-SlimHermes.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:167507dfa4410c381bcade0c8e696c539750f65cd95ab815f84ca8485a2a74a9 +size 3784823872 diff --git a/llama3-8b-SlimHermes.i1-IQ3_S.gguf b/llama3-8b-SlimHermes.i1-IQ3_S.gguf new file mode 100644 index 0000000..0bcec80 --- /dev/null +++ b/llama3-8b-SlimHermes.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13963cae1a993d73e05a7d6e2f42a2890a1111be338b019c07908cfb445f20a5 +size 3682325568 diff --git a/llama3-8b-SlimHermes.i1-IQ3_XS.gguf b/llama3-8b-SlimHermes.i1-IQ3_XS.gguf new file mode 100644 index 0000000..0ce7022 --- /dev/null +++ b/llama3-8b-SlimHermes.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3875887f61e05619b78b8c658ef8afa49a5d360a552ed656e8058fe1184bba64 +size 3518747712 diff --git a/llama3-8b-SlimHermes.i1-IQ3_XXS.gguf b/llama3-8b-SlimHermes.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..e9dc138 --- /dev/null +++ b/llama3-8b-SlimHermes.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f443848205492fa476063c90886d32166f48e95b8c820673ba5ca989caa67900 +size 3274912832 diff --git a/llama3-8b-SlimHermes.i1-IQ4_NL.gguf b/llama3-8b-SlimHermes.i1-IQ4_NL.gguf new file mode 100644 index 0000000..f2a7104 --- /dev/null +++ b/llama3-8b-SlimHermes.i1-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:6acbde8f8628f7ac8d7c8c8cd162ad846ef15373eb6a581a38de1007a46724c1 +size 4677989440 diff --git a/llama3-8b-SlimHermes.i1-IQ4_XS.gguf b/llama3-8b-SlimHermes.i1-IQ4_XS.gguf new file mode 100644 index 0000000..ed297dc --- /dev/null +++ b/llama3-8b-SlimHermes.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d9eb0fe02024bfd02577c641c07992a826627972889030223a5cba54ff5da85 +size 4447663168 diff --git a/llama3-8b-SlimHermes.i1-Q2_K.gguf b/llama3-8b-SlimHermes.i1-Q2_K.gguf new file mode 100644 index 0000000..8e5260a --- /dev/null +++ b/llama3-8b-SlimHermes.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfd97ac0b6d8f7ea35e7520f741785bac83aa0db45acf8ded1b26971596fe9b2 +size 3179131968 diff --git a/llama3-8b-SlimHermes.i1-Q2_K_S.gguf b/llama3-8b-SlimHermes.i1-Q2_K_S.gguf new file mode 100644 index 0000000..1b1624d --- /dev/null +++ b/llama3-8b-SlimHermes.i1-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ffb174b245b2ef4519b3b86b8c0e42ed65c1817c466626e76e8d39d924858e3 +size 2988815424 diff --git a/llama3-8b-SlimHermes.i1-Q3_K_L.gguf b/llama3-8b-SlimHermes.i1-Q3_K_L.gguf new file mode 100644 index 0000000..07d0641 --- /dev/null +++ b/llama3-8b-SlimHermes.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a11d9cc8b4241a35b31e01a94260b2251c0799e88a2ccf2c38284355c3f9b5e +size 4321956928 diff --git a/llama3-8b-SlimHermes.i1-Q3_K_M.gguf b/llama3-8b-SlimHermes.i1-Q3_K_M.gguf new file mode 100644 index 0000000..5bd96c2 --- /dev/null +++ b/llama3-8b-SlimHermes.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89b04bd43a9a4c54e20264716c5facea8fe44f83ae8caaaae5fef8f6e04490a3 +size 4018918464 diff --git a/llama3-8b-SlimHermes.i1-Q3_K_S.gguf b/llama3-8b-SlimHermes.i1-Q3_K_S.gguf new file mode 100644 index 0000000..5a780c6 --- /dev/null +++ b/llama3-8b-SlimHermes.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:68059425a622e70fc55c839c9bb90da3edf300b42b54470326d00c8cffc67ca5 +size 3664499776 diff --git a/llama3-8b-SlimHermes.i1-Q4_0.gguf b/llama3-8b-SlimHermes.i1-Q4_0.gguf new file mode 100644 index 0000000..742c29d --- /dev/null +++ b/llama3-8b-SlimHermes.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d23c90ba7855d60568ac2124286c7efa91fc0fd57c8d6f2d43596fd94fe8cfc +size 4675892288 diff --git a/llama3-8b-SlimHermes.i1-Q4_1.gguf b/llama3-8b-SlimHermes.i1-Q4_1.gguf new file mode 100644 index 0000000..2507e45 --- /dev/null +++ b/llama3-8b-SlimHermes.i1-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8c65cbfe086486fd590f96250a1c7dbb233092683f4389eaf4b75cae9dab32e +size 5130253376 diff --git a/llama3-8b-SlimHermes.i1-Q4_K_M.gguf b/llama3-8b-SlimHermes.i1-Q4_K_M.gguf new file mode 100644 index 0000000..03fa1c6 --- /dev/null +++ b/llama3-8b-SlimHermes.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:088f5d665b2e87557a9511a9fbde7444741e8ef5bb7ed87f92d5232f87ba4858 +size 4920734784 diff --git a/llama3-8b-SlimHermes.i1-Q4_K_S.gguf b/llama3-8b-SlimHermes.i1-Q4_K_S.gguf new file mode 100644 index 0000000..562b386 --- /dev/null +++ b/llama3-8b-SlimHermes.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cab5dc1ccac9eb7f927306d3b598cff048ef7e7e90b2916378a63d445748fe92 +size 4692669504 diff --git a/llama3-8b-SlimHermes.i1-Q5_K_M.gguf b/llama3-8b-SlimHermes.i1-Q5_K_M.gguf new file mode 100644 index 0000000..1a84cbf --- /dev/null +++ b/llama3-8b-SlimHermes.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e6f1b1acef36c2513f2ab098172313d2f785f463aac66995d5b2e71684b8dc0 +size 5732987968 diff --git a/llama3-8b-SlimHermes.i1-Q5_K_S.gguf b/llama3-8b-SlimHermes.i1-Q5_K_S.gguf new file mode 100644 index 0000000..ee7644f --- /dev/null +++ 
b/llama3-8b-SlimHermes.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e044cfec67d52c4ab9e749410d211c358c37c2959752bf7a2df605b6beb56ac +size 5599294528 diff --git a/llama3-8b-SlimHermes.i1-Q6_K.gguf b/llama3-8b-SlimHermes.i1-Q6_K.gguf new file mode 100644 index 0000000..8d7cc67 --- /dev/null +++ b/llama3-8b-SlimHermes.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:368ebf8d63f92e9bfd688f5a92d3df5fb2dd1f4035efcd719debcf2ffcfa1c15 +size 6596006976