From 02dcd49140124aebe59415b0dc86c53106db9c05 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Wed, 17 Jun 2026 16:17:16 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: duyntnet/Llama-2-7b-chat-hf-imatrix-GGUF Source: Original Platform --- .gitattributes | 62 +++++++++++++++++++++++++++++++++ Llama-2-7b-chat-hf-IQ1_M.gguf | 3 ++ Llama-2-7b-chat-hf-IQ1_S.gguf | 3 ++ Llama-2-7b-chat-hf-IQ2_M.gguf | 3 ++ Llama-2-7b-chat-hf-IQ2_S.gguf | 3 ++ Llama-2-7b-chat-hf-IQ2_XS.gguf | 3 ++ Llama-2-7b-chat-hf-IQ2_XXS.gguf | 3 ++ Llama-2-7b-chat-hf-IQ3_M.gguf | 3 ++ Llama-2-7b-chat-hf-IQ3_S.gguf | 3 ++ Llama-2-7b-chat-hf-IQ3_XS.gguf | 3 ++ Llama-2-7b-chat-hf-IQ3_XXS.gguf | 3 ++ Llama-2-7b-chat-hf-IQ4_NL.gguf | 3 ++ Llama-2-7b-chat-hf-IQ4_XS.gguf | 3 ++ Llama-2-7b-chat-hf-Q2_K.gguf | 3 ++ Llama-2-7b-chat-hf-Q2_K_S.gguf | 3 ++ Llama-2-7b-chat-hf-Q3_K_L.gguf | 3 ++ Llama-2-7b-chat-hf-Q3_K_M.gguf | 3 ++ Llama-2-7b-chat-hf-Q3_K_S.gguf | 3 ++ Llama-2-7b-chat-hf-Q4_0.gguf | 3 ++ Llama-2-7b-chat-hf-Q4_1.gguf | 3 ++ Llama-2-7b-chat-hf-Q4_K_M.gguf | 3 ++ Llama-2-7b-chat-hf-Q4_K_S.gguf | 3 ++ Llama-2-7b-chat-hf-Q5_0.gguf | 3 ++ Llama-2-7b-chat-hf-Q5_1.gguf | 3 ++ Llama-2-7b-chat-hf-Q5_K_M.gguf | 3 ++ Llama-2-7b-chat-hf-Q5_K_S.gguf | 3 ++ Llama-2-7b-chat-hf-Q6_K.gguf | 3 ++ Llama-2-7b-chat-hf-Q8_0.gguf | 3 ++ README.md | 21 +++++++++++ 29 files changed, 164 insertions(+) create mode 100644 .gitattributes create mode 100644 Llama-2-7b-chat-hf-IQ1_M.gguf create mode 100644 Llama-2-7b-chat-hf-IQ1_S.gguf create mode 100644 Llama-2-7b-chat-hf-IQ2_M.gguf create mode 100644 Llama-2-7b-chat-hf-IQ2_S.gguf create mode 100644 Llama-2-7b-chat-hf-IQ2_XS.gguf create mode 100644 Llama-2-7b-chat-hf-IQ2_XXS.gguf create mode 100644 Llama-2-7b-chat-hf-IQ3_M.gguf create mode 100644 Llama-2-7b-chat-hf-IQ3_S.gguf create mode 100644 Llama-2-7b-chat-hf-IQ3_XS.gguf create mode 100644 Llama-2-7b-chat-hf-IQ3_XXS.gguf create mode 100644 Llama-2-7b-chat-hf-IQ4_NL.gguf create mode 100644 Llama-2-7b-chat-hf-IQ4_XS.gguf create mode 100644 Llama-2-7b-chat-hf-Q2_K.gguf create mode 100644 Llama-2-7b-chat-hf-Q2_K_S.gguf create mode 100644 Llama-2-7b-chat-hf-Q3_K_L.gguf create mode 100644 Llama-2-7b-chat-hf-Q3_K_M.gguf create mode 100644 Llama-2-7b-chat-hf-Q3_K_S.gguf create mode 100644 Llama-2-7b-chat-hf-Q4_0.gguf create mode 100644 Llama-2-7b-chat-hf-Q4_1.gguf create mode 100644 Llama-2-7b-chat-hf-Q4_K_M.gguf create mode 100644 Llama-2-7b-chat-hf-Q4_K_S.gguf create mode 100644 Llama-2-7b-chat-hf-Q5_0.gguf create mode 100644 Llama-2-7b-chat-hf-Q5_1.gguf create mode 100644 Llama-2-7b-chat-hf-Q5_K_M.gguf create mode 100644 Llama-2-7b-chat-hf-Q5_K_S.gguf create mode 100644 Llama-2-7b-chat-hf-Q6_K.gguf create mode 100644 Llama-2-7b-chat-hf-Q8_0.gguf create mode 100644 README.md diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..6dfc52e --- /dev/null +++ b/.gitattributes @@ -0,0 +1,62 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +Llama-2-7b-chat-hf-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text +Llama-2-7b-chat-hf-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +Llama-2-7b-chat-hf-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +Llama-2-7b-chat-hf-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +Llama-2-7b-chat-hf-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Llama-2-7b-chat-hf-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +Llama-2-7b-chat-hf-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +Llama-2-7b-chat-hf-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text +Llama-2-7b-chat-hf-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +Llama-2-7b-chat-hf-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Llama-2-7b-chat-hf-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +Llama-2-7b-chat-hf-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +Llama-2-7b-chat-hf-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +Llama-2-7b-chat-hf-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Llama-2-7b-chat-hf-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Llama-2-7b-chat-hf-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Llama-2-7b-chat-hf-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Llama-2-7b-chat-hf-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +Llama-2-7b-chat-hf-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +Llama-2-7b-chat-hf-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Llama-2-7b-chat-hf-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Llama-2-7b-chat-hf-Q5_0.gguf filter=lfs diff=lfs merge=lfs -text +Llama-2-7b-chat-hf-Q5_1.gguf filter=lfs diff=lfs merge=lfs -text +Llama-2-7b-chat-hf-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Llama-2-7b-chat-hf-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Llama-2-7b-chat-hf-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +Llama-2-7b-chat-hf-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/Llama-2-7b-chat-hf-IQ1_M.gguf b/Llama-2-7b-chat-hf-IQ1_M.gguf new file mode 100644 index 0000000..bd01dd9 --- /dev/null +++ b/Llama-2-7b-chat-hf-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3aba0b1dcc9f657ec4b4ae37de5a58a9f8b69882166089bc5bab976cb8384e0 +size 1650972000 diff --git a/Llama-2-7b-chat-hf-IQ1_S.gguf b/Llama-2-7b-chat-hf-IQ1_S.gguf new file mode 100644 index 0000000..b5b9373 --- /dev/null +++ b/Llama-2-7b-chat-hf-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7be5b493f0a1bfeb2bf2246aba2c6d6486934a273b93dd40fd55387f2d45f121 +size 1528583520 diff --git a/Llama-2-7b-chat-hf-IQ2_M.gguf b/Llama-2-7b-chat-hf-IQ2_M.gguf new file mode 100644 index 0000000..8392b0f --- /dev/null +++ b/Llama-2-7b-chat-hf-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bf2ca8eb8707168195fbcf1d027290eced6511218b98426227cdfef6b5fccee +size 2359752032 diff --git a/Llama-2-7b-chat-hf-IQ2_S.gguf b/Llama-2-7b-chat-hf-IQ2_S.gguf new file mode 100644 index 0000000..1ccc834 --- /dev/null +++ b/Llama-2-7b-chat-hf-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f9660cf05fcd924c6e8473d013c2bda6310c46ef8916266ac0959e1e7b8fae3 +size 2196567392 diff --git a/Llama-2-7b-chat-hf-IQ2_XS.gguf b/Llama-2-7b-chat-hf-IQ2_XS.gguf new file mode 100644 index 0000000..19ccb2d --- /dev/null +++ b/Llama-2-7b-chat-hf-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:843f5b7c61b641252bd482f2de9083de3d97fbdb42ebce11a09f56f160312c05 +size 2034914656 diff --git a/Llama-2-7b-chat-hf-IQ2_XXS.gguf b/Llama-2-7b-chat-hf-IQ2_XXS.gguf new file mode 100644 index 0000000..d08d764 --- /dev/null +++ b/Llama-2-7b-chat-hf-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:270b9418b779788c4fc326009a87da4fb83cbdbfff06f54ce6cbcf9ac41f8ac1 +size 1854952800 diff --git a/Llama-2-7b-chat-hf-IQ3_M.gguf b/Llama-2-7b-chat-hf-IQ3_M.gguf new file mode 100644 index 0000000..8f4f58e --- /dev/null +++ b/Llama-2-7b-chat-hf-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cb769b67b343e7334a687736f74e1951a2e70739d4761d79326af71770fd6d0 +size 3114866016 diff --git a/Llama-2-7b-chat-hf-IQ3_S.gguf b/Llama-2-7b-chat-hf-IQ3_S.gguf new file mode 100644 index 0000000..47edfb6 --- /dev/null +++ b/Llama-2-7b-chat-hf-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dccb7e9fd77c056860204deb027b6e32be24c5f6888eb6cdd0bd63c9d274ae09 +size 2948306272 diff --git a/Llama-2-7b-chat-hf-IQ3_XS.gguf b/Llama-2-7b-chat-hf-IQ3_XS.gguf new file mode 100644 index 0000000..95f70b5 --- /dev/null +++ b/Llama-2-7b-chat-hf-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a59a1dfee37a322e5a7601362c73051bf50a362edf92737b6ccca692fc38b62a +size 2796524896 diff --git a/Llama-2-7b-chat-hf-IQ3_XXS.gguf b/Llama-2-7b-chat-hf-IQ3_XXS.gguf new file mode 100644 index 0000000..308ce4e --- /dev/null +++ b/Llama-2-7b-chat-hf-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c05de01131bb1baae15a1294f32e74a623740bd872c198f21ada05c2506df855 +size 2585392480 diff --git a/Llama-2-7b-chat-hf-IQ4_NL.gguf b/Llama-2-7b-chat-hf-IQ4_NL.gguf new file mode 100644 index 0000000..fad7c1f --- /dev/null +++ b/Llama-2-7b-chat-hf-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c739350603f47e1aef34247bc3d89ecdd48ca7801a91cec83b5c035e9d326f6c +size 3825808736 diff --git a/Llama-2-7b-chat-hf-IQ4_XS.gguf b/Llama-2-7b-chat-hf-IQ4_XS.gguf new file mode 100644 index 0000000..95f9cee --- /dev/null +++ b/Llama-2-7b-chat-hf-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28e8af7533692f5227fec40a3a9537a48136967601ce5b9a895053998c78e35b +size 3619337568 diff --git a/Llama-2-7b-chat-hf-Q2_K.gguf b/Llama-2-7b-chat-hf-Q2_K.gguf new file mode 100644 index 0000000..02a024d --- /dev/null +++ b/Llama-2-7b-chat-hf-Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8df736aee9d846a14b627394e0f39396b678d87ee8eee88c075bce314bde40ab +size 2532865376 diff --git a/Llama-2-7b-chat-hf-Q2_K_S.gguf b/Llama-2-7b-chat-hf-Q2_K_S.gguf new file mode 100644 index 0000000..dc52569 --- /dev/null +++ b/Llama-2-7b-chat-hf-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea9af1796f1e80f4d3a3f3f9c76a491bb1e17ccb0d59d5b9adbadaead77bc7c3 +size 2319545696 diff --git a/Llama-2-7b-chat-hf-Q3_K_L.gguf b/Llama-2-7b-chat-hf-Q3_K_L.gguf new file mode 100644 index 0000000..c80d595 --- /dev/null +++ b/Llama-2-7b-chat-hf-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72bb5c818b8ffde7ebac50a01dcc5bc200be87a421be0d6cabb6591e8f5cf43b +size 3597112672 diff --git a/Llama-2-7b-chat-hf-Q3_K_M.gguf b/Llama-2-7b-chat-hf-Q3_K_M.gguf new file mode 100644 index 0000000..3fb032f --- /dev/null +++ b/Llama-2-7b-chat-hf-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8392e52ef3fc674f459fd716dfc718373cf47ca730785c1f5d1e16f905d87012 +size 3298006368 diff --git a/Llama-2-7b-chat-hf-Q3_K_S.gguf b/Llama-2-7b-chat-hf-Q3_K_S.gguf new file mode 100644 index 0000000..98e1910 --- /dev/null +++ b/Llama-2-7b-chat-hf-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a76489b1b3995d1cdcadbb1a268908a368f4e9b87ff97f410474fd8f1c41c19 +size 2948306272 diff --git a/Llama-2-7b-chat-hf-Q4_0.gguf b/Llama-2-7b-chat-hf-Q4_0.gguf new file mode 100644 index 0000000..730f31b --- /dev/null +++ b/Llama-2-7b-chat-hf-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aa7402ce5b198abbe049003b5663e9b3ec2c1bd40c33caa40a27743a42b2733 +size 3837080928 diff --git a/Llama-2-7b-chat-hf-Q4_1.gguf b/Llama-2-7b-chat-hf-Q4_1.gguf new file mode 100644 index 0000000..43bf50b --- /dev/null +++ b/Llama-2-7b-chat-hf-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3abf014702f85a696549794094826da428fdf25f8f79e194d04b9817ddcdcd88 +size 4238751072 diff --git a/Llama-2-7b-chat-hf-Q4_K_M.gguf b/Llama-2-7b-chat-hf-Q4_K_M.gguf new file mode 100644 index 0000000..789c368 --- /dev/null +++ b/Llama-2-7b-chat-hf-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20e25408cc468b3aedee62f00d12472eecc6877570fc6c0092815b86968eb876 +size 4081005920 diff --git a/Llama-2-7b-chat-hf-Q4_K_S.gguf b/Llama-2-7b-chat-hf-Q4_K_S.gguf new file mode 100644 index 0000000..6c485ce --- /dev/null +++ b/Llama-2-7b-chat-hf-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d4d88390e0581b0af4c3ceef63257d4d40420b7b2d4af04748db3772aaf8afe +size 3856741728 diff --git a/Llama-2-7b-chat-hf-Q5_0.gguf b/Llama-2-7b-chat-hf-Q5_0.gguf new file mode 100644 index 0000000..58b32b3 --- /dev/null +++ b/Llama-2-7b-chat-hf-Q5_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f409fa0211983e2712d4c9129656534a4ef4711a57991a601d366a73a6604266 +size 4662965600 diff --git a/Llama-2-7b-chat-hf-Q5_1.gguf b/Llama-2-7b-chat-hf-Q5_1.gguf new file mode 100644 index 0000000..7918acc --- /dev/null +++ b/Llama-2-7b-chat-hf-Q5_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a81eed20ba124d64a53fa2868856e1bf1f4ec3ce564f2872c33b2c7bd7c60f0a +size 5064635744 diff --git a/Llama-2-7b-chat-hf-Q5_K_M.gguf b/Llama-2-7b-chat-hf-Q5_K_M.gguf new file mode 100644 index 0000000..f469cc2 --- /dev/null +++ b/Llama-2-7b-chat-hf-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26592efef71f50d739adc97198153a7da5e6a9db9600b6a760adeeff1f1d52df +size 4783158624 diff --git a/Llama-2-7b-chat-hf-Q5_K_S.gguf b/Llama-2-7b-chat-hf-Q5_K_S.gguf new file mode 100644 index 0000000..ad460af --- /dev/null +++ b/Llama-2-7b-chat-hf-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1382e694bf66984a55375d8d08e8d0fad7ee2d191cfb098d0a09ed5608f5c297 +size 4651693408 diff --git a/Llama-2-7b-chat-hf-Q6_K.gguf b/Llama-2-7b-chat-hf-Q6_K.gguf new file mode 100644 index 0000000..782e101 --- /dev/null +++ b/Llama-2-7b-chat-hf-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e468d93b6dc431d2ac8c02e4be2e88fc1c72046d74e79070e84746ae87cf8e98 +size 5529195872 diff --git a/Llama-2-7b-chat-hf-Q8_0.gguf b/Llama-2-7b-chat-hf-Q8_0.gguf new file mode 100644 index 0000000..9a9716d --- /dev/null +++ b/Llama-2-7b-chat-hf-Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32544a43e59db71b103d4bfc05e6071a8f79059072dc541ad01c548cdd5881c2 +size 7161091424 diff --git a/README.md b/README.md new file mode 100644 index 0000000..c4cf615 --- /dev/null +++ b/README.md @@ -0,0 +1,21 @@ +--- +license: other +language: +- en +pipeline_tag: text-generation +inference: false +tags: +- transformers +- gguf +- imatrix +- Llama-2-7b-chat-hf +--- +Quantizations of https://huggingface.co/meta-llama/Llama-2-7b-chat-hf + + +# From original readme + +## Intended Use +**Intended Use Cases** Llama 2 is intended for commercial and research use in English. Tuned models are intended for assistant-like chat, whereas pretrained models can be adapted for a variety of natural language generation tasks. + +To get the expected features and performance for the chat versions, a specific formatting needs to be followed, including the `INST` and `<>` tags, `BOS` and `EOS` tokens, and the whitespaces and breaklines in between (we recommend calling `strip()` on inputs to avoid double-spaces). See our reference code in github for details: [`chat_completion`](https://github.com/facebookresearch/llama/blob/main/llama/generation.py#L212). \ No newline at end of file