From 0d1c1b271adfbfdae387b83a86b89e848361de30 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Mon, 22 Jun 2026 22:20:18 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mradermacher/KnowSelf-Llama3.1-8B-ALFWorld-GGUF Source: Original Platform --- .gitattributes | 46 +++++++++++++++ KnowSelf-Llama3.1-8B-ALFWorld.IQ4_XS.gguf | 3 + KnowSelf-Llama3.1-8B-ALFWorld.Q2_K.gguf | 3 + KnowSelf-Llama3.1-8B-ALFWorld.Q3_K_L.gguf | 3 + KnowSelf-Llama3.1-8B-ALFWorld.Q3_K_M.gguf | 3 + KnowSelf-Llama3.1-8B-ALFWorld.Q3_K_S.gguf | 3 + KnowSelf-Llama3.1-8B-ALFWorld.Q4_K_M.gguf | 3 + KnowSelf-Llama3.1-8B-ALFWorld.Q4_K_S.gguf | 3 + KnowSelf-Llama3.1-8B-ALFWorld.Q5_K_M.gguf | 3 + KnowSelf-Llama3.1-8B-ALFWorld.Q5_K_S.gguf | 3 + KnowSelf-Llama3.1-8B-ALFWorld.Q6_K.gguf | 3 + KnowSelf-Llama3.1-8B-ALFWorld.Q8_0.gguf | 3 + KnowSelf-Llama3.1-8B-ALFWorld.f16.gguf | 3 + README.md | 69 +++++++++++++++++++++++ 14 files changed, 151 insertions(+) create mode 100644 .gitattributes create mode 100644 KnowSelf-Llama3.1-8B-ALFWorld.IQ4_XS.gguf create mode 100644 KnowSelf-Llama3.1-8B-ALFWorld.Q2_K.gguf create mode 100644 KnowSelf-Llama3.1-8B-ALFWorld.Q3_K_L.gguf create mode 100644 KnowSelf-Llama3.1-8B-ALFWorld.Q3_K_M.gguf create mode 100644 KnowSelf-Llama3.1-8B-ALFWorld.Q3_K_S.gguf create mode 100644 KnowSelf-Llama3.1-8B-ALFWorld.Q4_K_M.gguf create mode 100644 KnowSelf-Llama3.1-8B-ALFWorld.Q4_K_S.gguf create mode 100644 KnowSelf-Llama3.1-8B-ALFWorld.Q5_K_M.gguf create mode 100644 KnowSelf-Llama3.1-8B-ALFWorld.Q5_K_S.gguf create mode 100644 KnowSelf-Llama3.1-8B-ALFWorld.Q6_K.gguf create mode 100644 KnowSelf-Llama3.1-8B-ALFWorld.Q8_0.gguf create mode 100644 KnowSelf-Llama3.1-8B-ALFWorld.f16.gguf create mode 100644 README.md diff --git a/.gitattributes b/.gitattributes 
new file mode 100644 index 0000000..a75950f --- /dev/null +++ b/.gitattributes @@ -0,0 +1,46 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +KnowSelf-Llama3.1-8B-ALFWorld.Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +KnowSelf-Llama3.1-8B-ALFWorld.Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +KnowSelf-Llama3.1-8B-ALFWorld.Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +KnowSelf-Llama3.1-8B-ALFWorld.Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text 
+KnowSelf-Llama3.1-8B-ALFWorld.Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +KnowSelf-Llama3.1-8B-ALFWorld.Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +KnowSelf-Llama3.1-8B-ALFWorld.Q8_0.gguf filter=lfs diff=lfs merge=lfs -text +KnowSelf-Llama3.1-8B-ALFWorld.Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +KnowSelf-Llama3.1-8B-ALFWorld.Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +KnowSelf-Llama3.1-8B-ALFWorld.IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +KnowSelf-Llama3.1-8B-ALFWorld.f16.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/KnowSelf-Llama3.1-8B-ALFWorld.IQ4_XS.gguf b/KnowSelf-Llama3.1-8B-ALFWorld.IQ4_XS.gguf new file mode 100644 index 0000000..f98ce88 --- /dev/null +++ b/KnowSelf-Llama3.1-8B-ALFWorld.IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d348f63ef847edd08a6d110fadbf276e6c6ca9cc69bc47dda36479d6f1534f8 +size 4484406752 diff --git a/KnowSelf-Llama3.1-8B-ALFWorld.Q2_K.gguf b/KnowSelf-Llama3.1-8B-ALFWorld.Q2_K.gguf new file mode 100644 index 0000000..0a50033 --- /dev/null +++ b/KnowSelf-Llama3.1-8B-ALFWorld.Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97cced222dd896ff8705db8cb08ed556b94f32215774911e46affb6314bfddfa +size 3179169568 diff --git a/KnowSelf-Llama3.1-8B-ALFWorld.Q3_K_L.gguf b/KnowSelf-Llama3.1-8B-ALFWorld.Q3_K_L.gguf new file mode 100644 index 0000000..cbdb4a3 --- /dev/null +++ b/KnowSelf-Llama3.1-8B-ALFWorld.Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0b8d453fcdc1be905359eaf27634c3d95c9e501b226c9ce7b81752585b75edd +size 4321997440 diff --git a/KnowSelf-Llama3.1-8B-ALFWorld.Q3_K_M.gguf b/KnowSelf-Llama3.1-8B-ALFWorld.Q3_K_M.gguf new file mode 100644 index 0000000..5ed69b2 --- /dev/null +++ b/KnowSelf-Llama3.1-8B-ALFWorld.Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf71bcdaf9f0ec827455b3caac6f9824ed50e687d0f1b43007e6c251b3b3280f +size 4018958976 diff --git 
a/KnowSelf-Llama3.1-8B-ALFWorld.Q3_K_S.gguf b/KnowSelf-Llama3.1-8B-ALFWorld.Q3_K_S.gguf new file mode 100644 index 0000000..cf2ecde --- /dev/null +++ b/KnowSelf-Llama3.1-8B-ALFWorld.Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2e78f78b6078427e8d24645fc426cceb161c18ecb468301a868b17c05a8de4c +size 3664540288 diff --git a/KnowSelf-Llama3.1-8B-ALFWorld.Q4_K_M.gguf b/KnowSelf-Llama3.1-8B-ALFWorld.Q4_K_M.gguf new file mode 100644 index 0000000..3a3806c --- /dev/null +++ b/KnowSelf-Llama3.1-8B-ALFWorld.Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1476b11261602551ae0ca8656a6924813b3bfbb4cdef033cbd94a68c29950b6c +size 4920779104 diff --git a/KnowSelf-Llama3.1-8B-ALFWorld.Q4_K_S.gguf b/KnowSelf-Llama3.1-8B-ALFWorld.Q4_K_S.gguf new file mode 100644 index 0000000..656f575 --- /dev/null +++ b/KnowSelf-Llama3.1-8B-ALFWorld.Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ef1d437f94ef5b2340414c6a5b2588188544980095fa12f30d244d8e1811e8b +size 4692713824 diff --git a/KnowSelf-Llama3.1-8B-ALFWorld.Q5_K_M.gguf b/KnowSelf-Llama3.1-8B-ALFWorld.Q5_K_M.gguf new file mode 100644 index 0000000..95e4e56 --- /dev/null +++ b/KnowSelf-Llama3.1-8B-ALFWorld.Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd31df0abf3063daaa8afbb698eb8f81dfcfbbbda116ea0e5a5e5636bedfc1fd +size 5733035872 diff --git a/KnowSelf-Llama3.1-8B-ALFWorld.Q5_K_S.gguf b/KnowSelf-Llama3.1-8B-ALFWorld.Q5_K_S.gguf new file mode 100644 index 0000000..eaf602c --- /dev/null +++ b/KnowSelf-Llama3.1-8B-ALFWorld.Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0654c75eaff17a6ac5447404dc1ea191cfa5667e7629e173bc1c13261c7fd09 +size 5599342432 diff --git a/KnowSelf-Llama3.1-8B-ALFWorld.Q6_K.gguf b/KnowSelf-Llama3.1-8B-ALFWorld.Q6_K.gguf new file mode 100644 index 0000000..796d20b --- /dev/null +++ b/KnowSelf-Llama3.1-8B-ALFWorld.Q6_K.gguf @@ -0,0 +1,3 @@ 
+version https://git-lfs.github.com/spec/v1 +oid sha256:6e83cba241dbf57ac0e73d6bbe623568aa56cb2ca2355e2e91223998e2f72302 +size 6596058688 diff --git a/KnowSelf-Llama3.1-8B-ALFWorld.Q8_0.gguf b/KnowSelf-Llama3.1-8B-ALFWorld.Q8_0.gguf new file mode 100644 index 0000000..9670563 --- /dev/null +++ b/KnowSelf-Llama3.1-8B-ALFWorld.Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d213d3e07d17a4b45e6c9ffcdbdb09787c1b3ceb283851cac8f4ee1b09f015dc +size 8540836992 diff --git a/KnowSelf-Llama3.1-8B-ALFWorld.f16.gguf b/KnowSelf-Llama3.1-8B-ALFWorld.f16.gguf new file mode 100644 index 0000000..510f788 --- /dev/null +++ b/KnowSelf-Llama3.1-8B-ALFWorld.f16.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae24c79fe7b732471c4811bcb1c565dbcc7d5b75ac4fc6e29a99739bcca9d0e2 +size 16069011072 diff --git a/README.md b/README.md new file mode 100644 index 0000000..61832dc --- /dev/null +++ b/README.md @@ -0,0 +1,69 @@ +--- +base_model: zjunlp/KnowSelf-Llama3.1-8B-ALFWorld +language: +- en +library_name: transformers +license: mit +mradermacher: + readme_rev: 1 +quantized_by: mradermacher +--- +## About + + + + + + +static quants of https://huggingface.co/zjunlp/KnowSelf-Llama3.1-8B-ALFWorld + + + +***For a convenient overview and download list, visit our [model page for this model](https://hf.tst.eu/model#KnowSelf-Llama3.1-8B-ALFWorld-GGUF).*** + +weighted/imatrix quants seem not to be available (by me) at this time. If they do not show up a week or so after the static ones, I have probably not planned for them. Feel free to request them by opening a Community Discussion. +## Usage + +If you are unsure how to use GGUF files, refer to one of [TheBloke's +READMEs](https://huggingface.co/TheBloke/KafkaLM-70B-German-V0.1-GGUF) for +more details, including on how to concatenate multi-part files. + +## Provided Quants + +(sorted by size, not necessarily quality. 
IQ-quants are often preferable over similar sized non-IQ quants) + +| Link | Type | Size/GB | Notes | +|:-----|:-----|--------:|:------| +| [GGUF](https://huggingface.co/mradermacher/KnowSelf-Llama3.1-8B-ALFWorld-GGUF/resolve/main/KnowSelf-Llama3.1-8B-ALFWorld.Q2_K.gguf) | Q2_K | 3.3 | | +| [GGUF](https://huggingface.co/mradermacher/KnowSelf-Llama3.1-8B-ALFWorld-GGUF/resolve/main/KnowSelf-Llama3.1-8B-ALFWorld.Q3_K_S.gguf) | Q3_K_S | 3.8 | | +| [GGUF](https://huggingface.co/mradermacher/KnowSelf-Llama3.1-8B-ALFWorld-GGUF/resolve/main/KnowSelf-Llama3.1-8B-ALFWorld.Q3_K_M.gguf) | Q3_K_M | 4.1 | lower quality | +| [GGUF](https://huggingface.co/mradermacher/KnowSelf-Llama3.1-8B-ALFWorld-GGUF/resolve/main/KnowSelf-Llama3.1-8B-ALFWorld.Q3_K_L.gguf) | Q3_K_L | 4.4 | | +| [GGUF](https://huggingface.co/mradermacher/KnowSelf-Llama3.1-8B-ALFWorld-GGUF/resolve/main/KnowSelf-Llama3.1-8B-ALFWorld.IQ4_XS.gguf) | IQ4_XS | 4.6 | | +| [GGUF](https://huggingface.co/mradermacher/KnowSelf-Llama3.1-8B-ALFWorld-GGUF/resolve/main/KnowSelf-Llama3.1-8B-ALFWorld.Q4_K_S.gguf) | Q4_K_S | 4.8 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/KnowSelf-Llama3.1-8B-ALFWorld-GGUF/resolve/main/KnowSelf-Llama3.1-8B-ALFWorld.Q4_K_M.gguf) | Q4_K_M | 5.0 | fast, recommended | +| [GGUF](https://huggingface.co/mradermacher/KnowSelf-Llama3.1-8B-ALFWorld-GGUF/resolve/main/KnowSelf-Llama3.1-8B-ALFWorld.Q5_K_S.gguf) | Q5_K_S | 5.7 | | +| [GGUF](https://huggingface.co/mradermacher/KnowSelf-Llama3.1-8B-ALFWorld-GGUF/resolve/main/KnowSelf-Llama3.1-8B-ALFWorld.Q5_K_M.gguf) | Q5_K_M | 5.8 | | +| [GGUF](https://huggingface.co/mradermacher/KnowSelf-Llama3.1-8B-ALFWorld-GGUF/resolve/main/KnowSelf-Llama3.1-8B-ALFWorld.Q6_K.gguf) | Q6_K | 6.7 | very good quality | +| [GGUF](https://huggingface.co/mradermacher/KnowSelf-Llama3.1-8B-ALFWorld-GGUF/resolve/main/KnowSelf-Llama3.1-8B-ALFWorld.Q8_0.gguf) | Q8_0 | 8.6 | fast, best quality | +| 
[GGUF](https://huggingface.co/mradermacher/KnowSelf-Llama3.1-8B-ALFWorld-GGUF/resolve/main/KnowSelf-Llama3.1-8B-ALFWorld.f16.gguf) | f16 | 16.2 | 16 bpw, overkill | + +Here is a handy graph by ikawrakow comparing some lower-quality quant +types (lower is better): + +![image.png](https://www.nethype.de/huggingface_embed/quantpplgraph.png) + +And here are Artefact2's thoughts on the matter: +https://gist.github.com/Artefact2/b5f810600771265fc1e39442288e8ec9 + +## FAQ / Model Request + +See https://huggingface.co/mradermacher/model_requests for answers to +questions you might have, or to request that another model be quantized. + +## Thanks + +I thank my company, [nethype GmbH](https://www.nethype.de/), for letting +me use its servers and providing upgrades to my workstation to enable +this work in my free time. + +