From 5bd78af0e35a0122b9b0e07e23e5c3bbc5385a97 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Wed, 17 Jun 2026 23:28:21 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mradermacher/ldm_soup_Llama-3.1-8B-Inst-i1-GGUF Source: Original Platform --- .gitattributes | 60 ++++++++++++++++ README.md | 76 +++++++++++++++++++++ imatrix.dat | 3 + ldm_soup_Llama-3.1-8B-Inst.i1-IQ1_M.gguf | 3 + ldm_soup_Llama-3.1-8B-Inst.i1-IQ1_S.gguf | 3 + ldm_soup_Llama-3.1-8B-Inst.i1-IQ2_M.gguf | 3 + ldm_soup_Llama-3.1-8B-Inst.i1-IQ2_S.gguf | 3 + ldm_soup_Llama-3.1-8B-Inst.i1-IQ2_XS.gguf | 3 + ldm_soup_Llama-3.1-8B-Inst.i1-IQ2_XXS.gguf | 3 + ldm_soup_Llama-3.1-8B-Inst.i1-IQ3_M.gguf | 3 + ldm_soup_Llama-3.1-8B-Inst.i1-IQ3_S.gguf | 3 + ldm_soup_Llama-3.1-8B-Inst.i1-IQ3_XS.gguf | 3 + ldm_soup_Llama-3.1-8B-Inst.i1-IQ3_XXS.gguf | 3 + ldm_soup_Llama-3.1-8B-Inst.i1-IQ4_XS.gguf | 3 + ldm_soup_Llama-3.1-8B-Inst.i1-Q2_K.gguf | 3 + ldm_soup_Llama-3.1-8B-Inst.i1-Q3_K_L.gguf | 3 + ldm_soup_Llama-3.1-8B-Inst.i1-Q3_K_M.gguf | 3 + ldm_soup_Llama-3.1-8B-Inst.i1-Q3_K_S.gguf | 3 + ldm_soup_Llama-3.1-8B-Inst.i1-Q4_0.gguf | 3 + ldm_soup_Llama-3.1-8B-Inst.i1-Q4_0_4_4.gguf | 3 + ldm_soup_Llama-3.1-8B-Inst.i1-Q4_0_4_8.gguf | 3 + ldm_soup_Llama-3.1-8B-Inst.i1-Q4_0_8_8.gguf | 3 + ldm_soup_Llama-3.1-8B-Inst.i1-Q4_K_M.gguf | 3 + ldm_soup_Llama-3.1-8B-Inst.i1-Q4_K_S.gguf | 3 + ldm_soup_Llama-3.1-8B-Inst.i1-Q5_K_M.gguf | 3 + ldm_soup_Llama-3.1-8B-Inst.i1-Q5_K_S.gguf | 3 + ldm_soup_Llama-3.1-8B-Inst.i1-Q6_K.gguf | 3 + 27 files changed, 211 insertions(+) create mode 100644 .gitattributes create mode 100644 README.md create mode 100644 imatrix.dat create mode 100644 ldm_soup_Llama-3.1-8B-Inst.i1-IQ1_M.gguf create mode 100644 ldm_soup_Llama-3.1-8B-Inst.i1-IQ1_S.gguf create mode 100644 ldm_soup_Llama-3.1-8B-Inst.i1-IQ2_M.gguf create mode 100644 ldm_soup_Llama-3.1-8B-Inst.i1-IQ2_S.gguf create mode 100644 ldm_soup_Llama-3.1-8B-Inst.i1-IQ2_XS.gguf create mode 100644 ldm_soup_Llama-3.1-8B-Inst.i1-IQ2_XXS.gguf create mode 100644 ldm_soup_Llama-3.1-8B-Inst.i1-IQ3_M.gguf create mode 100644 ldm_soup_Llama-3.1-8B-Inst.i1-IQ3_S.gguf create mode 100644 ldm_soup_Llama-3.1-8B-Inst.i1-IQ3_XS.gguf create mode 100644 ldm_soup_Llama-3.1-8B-Inst.i1-IQ3_XXS.gguf create mode 100644 ldm_soup_Llama-3.1-8B-Inst.i1-IQ4_XS.gguf create mode 100644 ldm_soup_Llama-3.1-8B-Inst.i1-Q2_K.gguf create mode 100644 ldm_soup_Llama-3.1-8B-Inst.i1-Q3_K_L.gguf create mode 100644 ldm_soup_Llama-3.1-8B-Inst.i1-Q3_K_M.gguf create mode 100644 ldm_soup_Llama-3.1-8B-Inst.i1-Q3_K_S.gguf create mode 100644 ldm_soup_Llama-3.1-8B-Inst.i1-Q4_0.gguf create mode 100644 ldm_soup_Llama-3.1-8B-Inst.i1-Q4_0_4_4.gguf create mode 100644 ldm_soup_Llama-3.1-8B-Inst.i1-Q4_0_4_8.gguf create mode 100644 ldm_soup_Llama-3.1-8B-Inst.i1-Q4_0_8_8.gguf create mode 100644 ldm_soup_Llama-3.1-8B-Inst.i1-Q4_K_M.gguf create mode 100644 ldm_soup_Llama-3.1-8B-Inst.i1-Q4_K_S.gguf create mode 100644 ldm_soup_Llama-3.1-8B-Inst.i1-Q5_K_M.gguf create mode 100644 ldm_soup_Llama-3.1-8B-Inst.i1-Q5_K_S.gguf create mode 100644 ldm_soup_Llama-3.1-8B-Inst.i1-Q6_K.gguf diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..71fca8c --- /dev/null +++ b/.gitattributes @@ -0,0 +1,60 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +imatrix.dat filter=lfs diff=lfs merge=lfs -text +ldm_soup_Llama-3.1-8B-Inst.i1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +ldm_soup_Llama-3.1-8B-Inst.i1-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +ldm_soup_Llama-3.1-8B-Inst.i1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +ldm_soup_Llama-3.1-8B-Inst.i1-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +ldm_soup_Llama-3.1-8B-Inst.i1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +ldm_soup_Llama-3.1-8B-Inst.i1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +ldm_soup_Llama-3.1-8B-Inst.i1-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +ldm_soup_Llama-3.1-8B-Inst.i1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +ldm_soup_Llama-3.1-8B-Inst.i1-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +ldm_soup_Llama-3.1-8B-Inst.i1-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +ldm_soup_Llama-3.1-8B-Inst.i1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +ldm_soup_Llama-3.1-8B-Inst.i1-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +ldm_soup_Llama-3.1-8B-Inst.i1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +ldm_soup_Llama-3.1-8B-Inst.i1-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +ldm_soup_Llama-3.1-8B-Inst.i1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +ldm_soup_Llama-3.1-8B-Inst.i1-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +ldm_soup_Llama-3.1-8B-Inst.i1-Q4_0_4_4.gguf filter=lfs diff=lfs merge=lfs -text +ldm_soup_Llama-3.1-8B-Inst.i1-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +ldm_soup_Llama-3.1-8B-Inst.i1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +ldm_soup_Llama-3.1-8B-Inst.i1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +ldm_soup_Llama-3.1-8B-Inst.i1-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +ldm_soup_Llama-3.1-8B-Inst.i1-Q4_0_4_8.gguf filter=lfs diff=lfs merge=lfs -text +ldm_soup_Llama-3.1-8B-Inst.i1-Q4_0_8_8.gguf filter=lfs diff=lfs merge=lfs -text +ldm_soup_Llama-3.1-8B-Inst.i1-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..2f80251 --- /dev/null +++ b/README.md @@ -0,0 +1,76 @@ +--- +base_model: DeepAuto-AI/ldm_soup_Llama-3.1-8B-Inst +language: +- en +library_name: transformers +license: apache-2.0 +quantized_by: mradermacher +--- +## About + + + + + + +weighted/imatrix quants of https://huggingface.co/DeepAuto-AI/ldm_soup_Llama-3.1-8B-Inst + + +static quants are available at https://huggingface.co/mradermacher/ldm_soup_Llama-3.1-8B-Inst-GGUF +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/ldm_soup_Llama-3.1-8B-Inst-i1-GGUF/resolve/main/ldm_soup_Llama-3.1-8B-Inst.i1-IQ1_S.gguf) | i1-IQ1_S | 2.1 | for the desperate | +| [GGUF](https://huggingface.co/mradermacher/ldm_soup_Llama-3.1-8B-Inst-i1-GGUF/resolve/main/ldm_soup_Llama-3.1-8B-Inst.i1-IQ1_M.gguf) | i1-IQ1_M | 2.3 | mostly desperate | +| [GGUF](https://huggingface.co/mradermacher/ldm_soup_Llama-3.1-8B-Inst-i1-GGUF/resolve/main/ldm_soup_Llama-3.1-8B-Inst.i1-IQ2_XXS.gguf) | i1-IQ2_XXS | 2.5 | | +| [GGUF](https://huggingface.co/mradermacher/ldm_soup_Llama-3.1-8B-Inst-i1-GGUF/resolve/main/ldm_soup_Llama-3.1-8B-Inst.i1-IQ2_XS.gguf) | i1-IQ2_XS | 2.7 | | +| [GGUF](https://huggingface.co/mradermacher/ldm_soup_Llama-3.1-8B-Inst-i1-GGUF/resolve/main/ldm_soup_Llama-3.1-8B-Inst.i1-IQ2_S.gguf) | i1-IQ2_S | 2.9 | | +| [GGUF](https://huggingface.co/mradermacher/ldm_soup_Llama-3.1-8B-Inst-i1-GGUF/resolve/main/ldm_soup_Llama-3.1-8B-Inst.i1-IQ2_M.gguf) | i1-IQ2_M | 3.0 | | +| [GGUF](https://huggingface.co/mradermacher/ldm_soup_Llama-3.1-8B-Inst-i1-GGUF/resolve/main/ldm_soup_Llama-3.1-8B-Inst.i1-Q2_K.gguf) | i1-Q2_K | 3.3 | IQ3_XXS probably better | +| [GGUF](https://huggingface.co/mradermacher/ldm_soup_Llama-3.1-8B-Inst-i1-GGUF/resolve/main/ldm_soup_Llama-3.1-8B-Inst.i1-IQ3_XXS.gguf) | i1-IQ3_XXS | 3.4 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/ldm_soup_Llama-3.1-8B-Inst-i1-GGUF/resolve/main/ldm_soup_Llama-3.1-8B-Inst.i1-IQ3_XS.gguf) | i1-IQ3_XS | 3.6 | | +| [GGUF](https://huggingface.co/mradermacher/ldm_soup_Llama-3.1-8B-Inst-i1-GGUF/resolve/main/ldm_soup_Llama-3.1-8B-Inst.i1-Q3_K_S.gguf) | i1-Q3_K_S | 3.8 | IQ3_XS probably better | +| [GGUF](https://huggingface.co/mradermacher/ldm_soup_Llama-3.1-8B-Inst-i1-GGUF/resolve/main/ldm_soup_Llama-3.1-8B-Inst.i1-IQ3_S.gguf) | i1-IQ3_S | 3.8 | beats Q3_K* | +| [GGUF](https://huggingface.co/mradermacher/ldm_soup_Llama-3.1-8B-Inst-i1-GGUF/resolve/main/ldm_soup_Llama-3.1-8B-Inst.i1-IQ3_M.gguf) | i1-IQ3_M | 3.9 | | +| [GGUF](https://huggingface.co/mradermacher/ldm_soup_Llama-3.1-8B-Inst-i1-GGUF/resolve/main/ldm_soup_Llama-3.1-8B-Inst.i1-Q3_K_M.gguf) | i1-Q3_K_M | 4.1 | IQ3_S probably better | +| [GGUF](https://huggingface.co/mradermacher/ldm_soup_Llama-3.1-8B-Inst-i1-GGUF/resolve/main/ldm_soup_Llama-3.1-8B-Inst.i1-Q3_K_L.gguf) | i1-Q3_K_L | 4.4 | IQ3_M probably better | +| [GGUF](https://huggingface.co/mradermacher/ldm_soup_Llama-3.1-8B-Inst-i1-GGUF/resolve/main/ldm_soup_Llama-3.1-8B-Inst.i1-IQ4_XS.gguf) | i1-IQ4_XS | 4.5 | | +| [GGUF](https://huggingface.co/mradermacher/ldm_soup_Llama-3.1-8B-Inst-i1-GGUF/resolve/main/ldm_soup_Llama-3.1-8B-Inst.i1-Q4_0_4_4.gguf) | i1-Q4_0_4_4 | 4.8 | fast on arm, low quality | +| [GGUF](https://huggingface.co/mradermacher/ldm_soup_Llama-3.1-8B-Inst-i1-GGUF/resolve/main/ldm_soup_Llama-3.1-8B-Inst.i1-Q4_0_4_8.gguf) | i1-Q4_0_4_8 | 4.8 | fast on arm+i8mm, low quality | +| [GGUF](https://huggingface.co/mradermacher/ldm_soup_Llama-3.1-8B-Inst-i1-GGUF/resolve/main/ldm_soup_Llama-3.1-8B-Inst.i1-Q4_0_8_8.gguf) | i1-Q4_0_8_8 | 4.8 | fast on arm+sve, low quality | +| [GGUF](https://huggingface.co/mradermacher/ldm_soup_Llama-3.1-8B-Inst-i1-GGUF/resolve/main/ldm_soup_Llama-3.1-8B-Inst.i1-Q4_0.gguf) | i1-Q4_0 | 4.8 | fast, low quality | +| [GGUF](https://huggingface.co/mradermacher/ldm_soup_Llama-3.1-8B-Inst-i1-GGUF/resolve/main/ldm_soup_Llama-3.1-8B-Inst.i1-Q4_K_S.gguf) | i1-Q4_K_S | 4.8 | optimal size/speed/quality | +| [GGUF](https://huggingface.co/mradermacher/ldm_soup_Llama-3.1-8B-Inst-i1-GGUF/resolve/main/ldm_soup_Llama-3.1-8B-Inst.i1-Q4_K_M.gguf) | i1-Q4_K_M | 5.0 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/ldm_soup_Llama-3.1-8B-Inst-i1-GGUF/resolve/main/ldm_soup_Llama-3.1-8B-Inst.i1-Q5_K_S.gguf) | i1-Q5_K_S | 5.7 | | +| [GGUF](https://huggingface.co/mradermacher/ldm_soup_Llama-3.1-8B-Inst-i1-GGUF/resolve/main/ldm_soup_Llama-3.1-8B-Inst.i1-Q5_K_M.gguf) | i1-Q5_K_M | 5.8 | | +| [GGUF](https://huggingface.co/mradermacher/ldm_soup_Llama-3.1-8B-Inst-i1-GGUF/resolve/main/ldm_soup_Llama-3.1-8B-Inst.i1-Q6_K.gguf) | i1-Q6_K | 6.7 | practically like static Q6_K | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for some answers to +questions you might have and/or if you want some other model quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. Additional thanks to [@nicoboss](https://huggingface.co/nicoboss) for giving me access to his private supercomputer, enabling me to provide many more imatrix quants, at much higher quality, than I would otherwise be able to. + + diff --git a/imatrix.dat b/imatrix.dat new file mode 100644 index 0000000..2b15bd5 --- /dev/null +++ b/imatrix.dat @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76e4a757e0ea6203e4cbbf76e6743a13d7bcd975ee8c5103f15fcdbc0032701a +size 4988157 diff --git a/ldm_soup_Llama-3.1-8B-Inst.i1-IQ1_M.gguf b/ldm_soup_Llama-3.1-8B-Inst.i1-IQ1_M.gguf new file mode 100644 index 0000000..c85d177 --- /dev/null +++ b/ldm_soup_Llama-3.1-8B-Inst.i1-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29c81ebfbde40d489d0ffdd4ad76070eb62f955cd1da084c3f83f98b0dcbe373 +size 2161973024 diff --git a/ldm_soup_Llama-3.1-8B-Inst.i1-IQ1_S.gguf b/ldm_soup_Llama-3.1-8B-Inst.i1-IQ1_S.gguf new file mode 100644 index 0000000..5a3b620 --- /dev/null +++ b/ldm_soup_Llama-3.1-8B-Inst.i1-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de081d05d6865c02b00a42f1b1e671d55f9316b96e8abb7ef19cb7e534480b99 +size 2019628832 diff --git a/ldm_soup_Llama-3.1-8B-Inst.i1-IQ2_M.gguf b/ldm_soup_Llama-3.1-8B-Inst.i1-IQ2_M.gguf new file mode 100644 index 0000000..c7c7c23 --- /dev/null +++ b/ldm_soup_Llama-3.1-8B-Inst.i1-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9edaba6283660284eab96ca57220f68c4f1864c9d0d647ef4e9071f094ed17f +size 2948282144 diff --git a/ldm_soup_Llama-3.1-8B-Inst.i1-IQ2_S.gguf b/ldm_soup_Llama-3.1-8B-Inst.i1-IQ2_S.gguf new file mode 100644 index 0000000..fcb3663 --- /dev/null +++ b/ldm_soup_Llama-3.1-8B-Inst.i1-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e477dcd13d4d981c11758165d93987524e8814f69a698f456001ae2fe0100582 +size 2758489888 diff --git a/ldm_soup_Llama-3.1-8B-Inst.i1-IQ2_XS.gguf b/ldm_soup_Llama-3.1-8B-Inst.i1-IQ2_XS.gguf new file mode 100644 index 0000000..8bb70e5 --- /dev/null +++ b/ldm_soup_Llama-3.1-8B-Inst.i1-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac270135a9e56ee009c5b0aec2d7babac2b03e5411fbb4c55a3ba5dfb3700954 +size 2605782816 diff --git a/ldm_soup_Llama-3.1-8B-Inst.i1-IQ2_XXS.gguf b/ldm_soup_Llama-3.1-8B-Inst.i1-IQ2_XXS.gguf new file mode 100644 index 0000000..139d59d --- /dev/null +++ b/ldm_soup_Llama-3.1-8B-Inst.i1-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15c01d0a5c3d7ed97e906a7385c5149179c71377346afa8d298a8a8482e6f3d5 +size 2399213344 diff --git a/ldm_soup_Llama-3.1-8B-Inst.i1-IQ3_M.gguf b/ldm_soup_Llama-3.1-8B-Inst.i1-IQ3_M.gguf new file mode 100644 index 0000000..282eda4 --- /dev/null +++ b/ldm_soup_Llama-3.1-8B-Inst.i1-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61881131320c8caf2608fe11644dbef3ea1fcac7fdbff54631ee035c23ce50d7 +size 3784824608 diff --git a/ldm_soup_Llama-3.1-8B-Inst.i1-IQ3_S.gguf b/ldm_soup_Llama-3.1-8B-Inst.i1-IQ3_S.gguf new file mode 100644 index 0000000..5ec2d3a --- /dev/null +++ b/ldm_soup_Llama-3.1-8B-Inst.i1-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d998e35e57f16fc93bda1d60da4563d24529b510548c80def4c199a1e16b1a8 +size 3682326304 diff --git a/ldm_soup_Llama-3.1-8B-Inst.i1-IQ3_XS.gguf b/ldm_soup_Llama-3.1-8B-Inst.i1-IQ3_XS.gguf new file mode 100644 index 0000000..c5d7ce3 --- /dev/null +++ b/ldm_soup_Llama-3.1-8B-Inst.i1-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03e2fcb034fccfe3b6964aea3b03c4490e1b6f949be0ebcce1e68d2f3b719ce7 +size 3518748448 diff --git a/ldm_soup_Llama-3.1-8B-Inst.i1-IQ3_XXS.gguf b/ldm_soup_Llama-3.1-8B-Inst.i1-IQ3_XXS.gguf new file mode 100644 index 0000000..0eb4fda --- /dev/null +++ b/ldm_soup_Llama-3.1-8B-Inst.i1-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8ab20780d3ce887a9e1d61b211bf5ff83b6a20800c1cd33617e8a8f5b3f3004 +size 3274913568 diff --git a/ldm_soup_Llama-3.1-8B-Inst.i1-IQ4_XS.gguf b/ldm_soup_Llama-3.1-8B-Inst.i1-IQ4_XS.gguf new file mode 100644 index 0000000..944d7fd --- /dev/null +++ b/ldm_soup_Llama-3.1-8B-Inst.i1-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30b052f9c0ec3a092dde2035be6dce2e30b2f412813ad3b61e0f03a9a1c6ab45 +size 4447663904 diff --git a/ldm_soup_Llama-3.1-8B-Inst.i1-Q2_K.gguf b/ldm_soup_Llama-3.1-8B-Inst.i1-Q2_K.gguf new file mode 100644 index 0000000..8ee3b0c --- /dev/null +++ b/ldm_soup_Llama-3.1-8B-Inst.i1-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:addd4126d48e9c33c1b7a9fdab1c976da44a5315d91c75548c900bb847cfdcf7 +size 3179132704 diff --git a/ldm_soup_Llama-3.1-8B-Inst.i1-Q3_K_L.gguf b/ldm_soup_Llama-3.1-8B-Inst.i1-Q3_K_L.gguf new file mode 100644 index 0000000..a5df77b --- /dev/null +++ b/ldm_soup_Llama-3.1-8B-Inst.i1-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5535a6f8e025f387498628e1fc7ac55b2b1d91609fcabec75e45441e5f068298 +size 4321957664 diff --git a/ldm_soup_Llama-3.1-8B-Inst.i1-Q3_K_M.gguf b/ldm_soup_Llama-3.1-8B-Inst.i1-Q3_K_M.gguf new file mode 100644 index 0000000..24d0431 --- /dev/null +++ b/ldm_soup_Llama-3.1-8B-Inst.i1-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:240910032e48041c6884e1cc114b9f7a0576c3b497af322541bddb7e9d9d69de +size 4018919200 diff --git a/ldm_soup_Llama-3.1-8B-Inst.i1-Q3_K_S.gguf b/ldm_soup_Llama-3.1-8B-Inst.i1-Q3_K_S.gguf new file mode 100644 index 0000000..7cc66d4 --- /dev/null +++ b/ldm_soup_Llama-3.1-8B-Inst.i1-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e03e0220074a48ae7c1fe7a7387be908def80e666ad3fb2ab80eb109a1ee917b +size 3664500512 diff --git a/ldm_soup_Llama-3.1-8B-Inst.i1-Q4_0.gguf b/ldm_soup_Llama-3.1-8B-Inst.i1-Q4_0.gguf new file mode 100644 index 0000000..15d39e0 --- /dev/null +++ b/ldm_soup_Llama-3.1-8B-Inst.i1-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cff7aea1a89b24d4324333372361110743b5d5c734f8bf46642666cf4a3121ea +size 4675893024 diff --git a/ldm_soup_Llama-3.1-8B-Inst.i1-Q4_0_4_4.gguf b/ldm_soup_Llama-3.1-8B-Inst.i1-Q4_0_4_4.gguf new file mode 100644 index 0000000..d89e524 --- /dev/null +++ b/ldm_soup_Llama-3.1-8B-Inst.i1-Q4_0_4_4.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7afdecc3c9f3ea74ae16ea3e7b3055dbb782be8638180ce9d389d71ad8cdacd9 +size 4661212960 diff --git a/ldm_soup_Llama-3.1-8B-Inst.i1-Q4_0_4_8.gguf b/ldm_soup_Llama-3.1-8B-Inst.i1-Q4_0_4_8.gguf new file mode 100644 index 0000000..a984a0e --- /dev/null +++ b/ldm_soup_Llama-3.1-8B-Inst.i1-Q4_0_4_8.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f58d3888846df3191ed934d6173dae8eb36eeb174c2cb9d7d1adededc4bb1ad +size 4661212960 diff --git a/ldm_soup_Llama-3.1-8B-Inst.i1-Q4_0_8_8.gguf b/ldm_soup_Llama-3.1-8B-Inst.i1-Q4_0_8_8.gguf new file mode 100644 index 0000000..42b379b --- /dev/null +++ b/ldm_soup_Llama-3.1-8B-Inst.i1-Q4_0_8_8.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:366a1b4eb862f9de167f48cb8b90eae3e07e0c9ca97a08b4e5f01413d4349b2a +size 4661212960 diff --git a/ldm_soup_Llama-3.1-8B-Inst.i1-Q4_K_M.gguf b/ldm_soup_Llama-3.1-8B-Inst.i1-Q4_K_M.gguf new file mode 100644 index 0000000..2fcfe5e --- /dev/null +++ b/ldm_soup_Llama-3.1-8B-Inst.i1-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b60e5aad62d738f0f731636d8ff4c090110f4671100964bf000e2d8c91a3b08d +size 4920735520 diff --git a/ldm_soup_Llama-3.1-8B-Inst.i1-Q4_K_S.gguf b/ldm_soup_Llama-3.1-8B-Inst.i1-Q4_K_S.gguf new file mode 100644 index 0000000..67103b3 --- /dev/null +++ b/ldm_soup_Llama-3.1-8B-Inst.i1-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88f62c72d06de52176382da9a00f9aaaa03fe56cc638a2b846416c71e3ea5013 +size 4692670240 diff --git a/ldm_soup_Llama-3.1-8B-Inst.i1-Q5_K_M.gguf b/ldm_soup_Llama-3.1-8B-Inst.i1-Q5_K_M.gguf new file mode 100644 index 0000000..db2be13 --- /dev/null +++ b/ldm_soup_Llama-3.1-8B-Inst.i1-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7ffb834aa7efd84a11de662300ce9a97d32bfb14747d2efab6bd8e63abbb4c1 +size 5732988704 diff --git a/ldm_soup_Llama-3.1-8B-Inst.i1-Q5_K_S.gguf b/ldm_soup_Llama-3.1-8B-Inst.i1-Q5_K_S.gguf new file mode 100644 index 0000000..8b98ef3 --- /dev/null +++ b/ldm_soup_Llama-3.1-8B-Inst.i1-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1123b73efc7504f9d9342829ad509f18a8f64e083be9e66176f9d1604640f0fc +size 5599295264 diff --git a/ldm_soup_Llama-3.1-8B-Inst.i1-Q6_K.gguf b/ldm_soup_Llama-3.1-8B-Inst.i1-Q6_K.gguf new file mode 100644 index 0000000..cacd958 --- /dev/null +++ b/ldm_soup_Llama-3.1-8B-Inst.i1-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bee8e7414ab48135308ff328b38e24dda526c6b3a9d7ab4f023e0b3faad4249e +size 6596007712