From 02dcd49140124aebe59415b0dc86c53106db9c05 Mon Sep 17 00:00:00 2001
From: ModelHub XC <noreply@modelhub.org.cn>
Date: Wed, 17 Jun 2026 16:17:16 +0800
Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?=
 =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?=
 =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Model: duyntnet/Llama-2-7b-chat-hf-imatrix-GGUF
Source: Original Platform
---
 .gitattributes                  | 62 +++++++++++++++++++++++++++++++++
 Llama-2-7b-chat-hf-IQ1_M.gguf   |  3 ++
 Llama-2-7b-chat-hf-IQ1_S.gguf   |  3 ++
 Llama-2-7b-chat-hf-IQ2_M.gguf   |  3 ++
 Llama-2-7b-chat-hf-IQ2_S.gguf   |  3 ++
 Llama-2-7b-chat-hf-IQ2_XS.gguf  |  3 ++
 Llama-2-7b-chat-hf-IQ2_XXS.gguf |  3 ++
 Llama-2-7b-chat-hf-IQ3_M.gguf   |  3 ++
 Llama-2-7b-chat-hf-IQ3_S.gguf   |  3 ++
 Llama-2-7b-chat-hf-IQ3_XS.gguf  |  3 ++
 Llama-2-7b-chat-hf-IQ3_XXS.gguf |  3 ++
 Llama-2-7b-chat-hf-IQ4_NL.gguf  |  3 ++
 Llama-2-7b-chat-hf-IQ4_XS.gguf  |  3 ++
 Llama-2-7b-chat-hf-Q2_K.gguf    |  3 ++
 Llama-2-7b-chat-hf-Q2_K_S.gguf  |  3 ++
 Llama-2-7b-chat-hf-Q3_K_L.gguf  |  3 ++
 Llama-2-7b-chat-hf-Q3_K_M.gguf  |  3 ++
 Llama-2-7b-chat-hf-Q3_K_S.gguf  |  3 ++
 Llama-2-7b-chat-hf-Q4_0.gguf    |  3 ++
 Llama-2-7b-chat-hf-Q4_1.gguf    |  3 ++
 Llama-2-7b-chat-hf-Q4_K_M.gguf  |  3 ++
 Llama-2-7b-chat-hf-Q4_K_S.gguf  |  3 ++
 Llama-2-7b-chat-hf-Q5_0.gguf    |  3 ++
 Llama-2-7b-chat-hf-Q5_1.gguf    |  3 ++
 Llama-2-7b-chat-hf-Q5_K_M.gguf  |  3 ++
 Llama-2-7b-chat-hf-Q5_K_S.gguf  |  3 ++
 Llama-2-7b-chat-hf-Q6_K.gguf    |  3 ++
 Llama-2-7b-chat-hf-Q8_0.gguf    |  3 ++
 README.md                       | 21 +++++++++++
 29 files changed, 164 insertions(+)
 create mode 100644 .gitattributes
 create mode 100644 Llama-2-7b-chat-hf-IQ1_M.gguf
 create mode 100644 Llama-2-7b-chat-hf-IQ1_S.gguf
 create mode 100644 Llama-2-7b-chat-hf-IQ2_M.gguf
 create mode 100644 Llama-2-7b-chat-hf-IQ2_S.gguf
 create mode 100644 Llama-2-7b-chat-hf-IQ2_XS.gguf
 create mode 100644 Llama-2-7b-chat-hf-IQ2_XXS.gguf
 create mode 100644 Llama-2-7b-chat-hf-IQ3_M.gguf
 create mode 100644 Llama-2-7b-chat-hf-IQ3_S.gguf
 create mode 100644 Llama-2-7b-chat-hf-IQ3_XS.gguf
 create mode 100644 Llama-2-7b-chat-hf-IQ3_XXS.gguf
 create mode 100644 Llama-2-7b-chat-hf-IQ4_NL.gguf
 create mode 100644 Llama-2-7b-chat-hf-IQ4_XS.gguf
 create mode 100644 Llama-2-7b-chat-hf-Q2_K.gguf
 create mode 100644 Llama-2-7b-chat-hf-Q2_K_S.gguf
 create mode 100644 Llama-2-7b-chat-hf-Q3_K_L.gguf
 create mode 100644 Llama-2-7b-chat-hf-Q3_K_M.gguf
 create mode 100644 Llama-2-7b-chat-hf-Q3_K_S.gguf
 create mode 100644 Llama-2-7b-chat-hf-Q4_0.gguf
 create mode 100644 Llama-2-7b-chat-hf-Q4_1.gguf
 create mode 100644 Llama-2-7b-chat-hf-Q4_K_M.gguf
 create mode 100644 Llama-2-7b-chat-hf-Q4_K_S.gguf
 create mode 100644 Llama-2-7b-chat-hf-Q5_0.gguf
 create mode 100644 Llama-2-7b-chat-hf-Q5_1.gguf
 create mode 100644 Llama-2-7b-chat-hf-Q5_K_M.gguf
 create mode 100644 Llama-2-7b-chat-hf-Q5_K_S.gguf
 create mode 100644 Llama-2-7b-chat-hf-Q6_K.gguf
 create mode 100644 Llama-2-7b-chat-hf-Q8_0.gguf
 create mode 100644 README.md

diff --git a/.gitattributes b/.gitattributes
new file mode 100644
index 0000000..6dfc52e
--- /dev/null
+++ b/.gitattributes
@@ -0,0 +1,62 @@
+*.7z filter=lfs diff=lfs merge=lfs -text
+*.arrow filter=lfs diff=lfs merge=lfs -text
+*.bin filter=lfs diff=lfs merge=lfs -text
+*.bz2 filter=lfs diff=lfs merge=lfs -text
+*.ckpt filter=lfs diff=lfs merge=lfs -text
+*.ftz filter=lfs diff=lfs merge=lfs -text
+*.gz filter=lfs diff=lfs merge=lfs -text
+*.h5 filter=lfs diff=lfs merge=lfs -text
+*.joblib filter=lfs diff=lfs merge=lfs -text
+*.lfs.* filter=lfs diff=lfs merge=lfs -text
+*.mlmodel filter=lfs diff=lfs merge=lfs -text
+*.model filter=lfs diff=lfs merge=lfs -text
+*.msgpack filter=lfs diff=lfs merge=lfs -text
+*.npy filter=lfs diff=lfs merge=lfs -text
+*.npz filter=lfs diff=lfs merge=lfs -text
+*.onnx filter=lfs diff=lfs merge=lfs -text
+*.ot filter=lfs diff=lfs merge=lfs -text
+*.parquet filter=lfs diff=lfs merge=lfs -text
+*.pb filter=lfs diff=lfs merge=lfs -text
+*.pickle filter=lfs diff=lfs merge=lfs -text
+*.pkl filter=lfs diff=lfs merge=lfs -text
+*.pt filter=lfs diff=lfs merge=lfs -text
+*.pth filter=lfs diff=lfs merge=lfs -text
+*.rar filter=lfs diff=lfs merge=lfs -text
+*.safetensors filter=lfs diff=lfs merge=lfs -text
+saved_model/**/* filter=lfs diff=lfs merge=lfs -text
+*.tar.* filter=lfs diff=lfs merge=lfs -text
+*.tar filter=lfs diff=lfs merge=lfs -text
+*.tflite filter=lfs diff=lfs merge=lfs -text
+*.tgz filter=lfs diff=lfs merge=lfs -text
+*.wasm filter=lfs diff=lfs merge=lfs -text
+*.xz filter=lfs diff=lfs merge=lfs -text
+*.zip filter=lfs diff=lfs merge=lfs -text
+*.zst filter=lfs diff=lfs merge=lfs -text
+*tfevents* filter=lfs diff=lfs merge=lfs -text
+Llama-2-7b-chat-hf-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-2-7b-chat-hf-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-2-7b-chat-hf-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-2-7b-chat-hf-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-2-7b-chat-hf-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-2-7b-chat-hf-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-2-7b-chat-hf-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-2-7b-chat-hf-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-2-7b-chat-hf-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-2-7b-chat-hf-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-2-7b-chat-hf-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-2-7b-chat-hf-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-2-7b-chat-hf-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-2-7b-chat-hf-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-2-7b-chat-hf-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-2-7b-chat-hf-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-2-7b-chat-hf-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-2-7b-chat-hf-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-2-7b-chat-hf-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-2-7b-chat-hf-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-2-7b-chat-hf-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-2-7b-chat-hf-Q5_0.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-2-7b-chat-hf-Q5_1.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-2-7b-chat-hf-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-2-7b-chat-hf-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-2-7b-chat-hf-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
+Llama-2-7b-chat-hf-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text
diff --git a/Llama-2-7b-chat-hf-IQ1_M.gguf b/Llama-2-7b-chat-hf-IQ1_M.gguf
new file mode 100644
index 0000000..bd01dd9
--- /dev/null
+++ b/Llama-2-7b-chat-hf-IQ1_M.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f3aba0b1dcc9f657ec4b4ae37de5a58a9f8b69882166089bc5bab976cb8384e0
+size 1650972000
diff --git a/Llama-2-7b-chat-hf-IQ1_S.gguf b/Llama-2-7b-chat-hf-IQ1_S.gguf
new file mode 100644
index 0000000..b5b9373
--- /dev/null
+++ b/Llama-2-7b-chat-hf-IQ1_S.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7be5b493f0a1bfeb2bf2246aba2c6d6486934a273b93dd40fd55387f2d45f121
+size 1528583520
diff --git a/Llama-2-7b-chat-hf-IQ2_M.gguf b/Llama-2-7b-chat-hf-IQ2_M.gguf
new file mode 100644
index 0000000..8392b0f
--- /dev/null
+++ b/Llama-2-7b-chat-hf-IQ2_M.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4bf2ca8eb8707168195fbcf1d027290eced6511218b98426227cdfef6b5fccee
+size 2359752032
diff --git a/Llama-2-7b-chat-hf-IQ2_S.gguf b/Llama-2-7b-chat-hf-IQ2_S.gguf
new file mode 100644
index 0000000..1ccc834
--- /dev/null
+++ b/Llama-2-7b-chat-hf-IQ2_S.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2f9660cf05fcd924c6e8473d013c2bda6310c46ef8916266ac0959e1e7b8fae3
+size 2196567392
diff --git a/Llama-2-7b-chat-hf-IQ2_XS.gguf b/Llama-2-7b-chat-hf-IQ2_XS.gguf
new file mode 100644
index 0000000..19ccb2d
--- /dev/null
+++ b/Llama-2-7b-chat-hf-IQ2_XS.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:843f5b7c61b641252bd482f2de9083de3d97fbdb42ebce11a09f56f160312c05
+size 2034914656
diff --git a/Llama-2-7b-chat-hf-IQ2_XXS.gguf b/Llama-2-7b-chat-hf-IQ2_XXS.gguf
new file mode 100644
index 0000000..d08d764
--- /dev/null
+++ b/Llama-2-7b-chat-hf-IQ2_XXS.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:270b9418b779788c4fc326009a87da4fb83cbdbfff06f54ce6cbcf9ac41f8ac1
+size 1854952800
diff --git a/Llama-2-7b-chat-hf-IQ3_M.gguf b/Llama-2-7b-chat-hf-IQ3_M.gguf
new file mode 100644
index 0000000..8f4f58e
--- /dev/null
+++ b/Llama-2-7b-chat-hf-IQ3_M.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5cb769b67b343e7334a687736f74e1951a2e70739d4761d79326af71770fd6d0
+size 3114866016
diff --git a/Llama-2-7b-chat-hf-IQ3_S.gguf b/Llama-2-7b-chat-hf-IQ3_S.gguf
new file mode 100644
index 0000000..47edfb6
--- /dev/null
+++ b/Llama-2-7b-chat-hf-IQ3_S.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dccb7e9fd77c056860204deb027b6e32be24c5f6888eb6cdd0bd63c9d274ae09
+size 2948306272
diff --git a/Llama-2-7b-chat-hf-IQ3_XS.gguf b/Llama-2-7b-chat-hf-IQ3_XS.gguf
new file mode 100644
index 0000000..95f70b5
--- /dev/null
+++ b/Llama-2-7b-chat-hf-IQ3_XS.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a59a1dfee37a322e5a7601362c73051bf50a362edf92737b6ccca692fc38b62a
+size 2796524896
diff --git a/Llama-2-7b-chat-hf-IQ3_XXS.gguf b/Llama-2-7b-chat-hf-IQ3_XXS.gguf
new file mode 100644
index 0000000..308ce4e
--- /dev/null
+++ b/Llama-2-7b-chat-hf-IQ3_XXS.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c05de01131bb1baae15a1294f32e74a623740bd872c198f21ada05c2506df855
+size 2585392480
diff --git a/Llama-2-7b-chat-hf-IQ4_NL.gguf b/Llama-2-7b-chat-hf-IQ4_NL.gguf
new file mode 100644
index 0000000..fad7c1f
--- /dev/null
+++ b/Llama-2-7b-chat-hf-IQ4_NL.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c739350603f47e1aef34247bc3d89ecdd48ca7801a91cec83b5c035e9d326f6c
+size 3825808736
diff --git a/Llama-2-7b-chat-hf-IQ4_XS.gguf b/Llama-2-7b-chat-hf-IQ4_XS.gguf
new file mode 100644
index 0000000..95f9cee
--- /dev/null
+++ b/Llama-2-7b-chat-hf-IQ4_XS.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:28e8af7533692f5227fec40a3a9537a48136967601ce5b9a895053998c78e35b
+size 3619337568
diff --git a/Llama-2-7b-chat-hf-Q2_K.gguf b/Llama-2-7b-chat-hf-Q2_K.gguf
new file mode 100644
index 0000000..02a024d
--- /dev/null
+++ b/Llama-2-7b-chat-hf-Q2_K.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8df736aee9d846a14b627394e0f39396b678d87ee8eee88c075bce314bde40ab
+size 2532865376
diff --git a/Llama-2-7b-chat-hf-Q2_K_S.gguf b/Llama-2-7b-chat-hf-Q2_K_S.gguf
new file mode 100644
index 0000000..dc52569
--- /dev/null
+++ b/Llama-2-7b-chat-hf-Q2_K_S.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ea9af1796f1e80f4d3a3f3f9c76a491bb1e17ccb0d59d5b9adbadaead77bc7c3
+size 2319545696
diff --git a/Llama-2-7b-chat-hf-Q3_K_L.gguf b/Llama-2-7b-chat-hf-Q3_K_L.gguf
new file mode 100644
index 0000000..c80d595
--- /dev/null
+++ b/Llama-2-7b-chat-hf-Q3_K_L.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:72bb5c818b8ffde7ebac50a01dcc5bc200be87a421be0d6cabb6591e8f5cf43b
+size 3597112672
diff --git a/Llama-2-7b-chat-hf-Q3_K_M.gguf b/Llama-2-7b-chat-hf-Q3_K_M.gguf
new file mode 100644
index 0000000..3fb032f
--- /dev/null
+++ b/Llama-2-7b-chat-hf-Q3_K_M.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8392e52ef3fc674f459fd716dfc718373cf47ca730785c1f5d1e16f905d87012
+size 3298006368
diff --git a/Llama-2-7b-chat-hf-Q3_K_S.gguf b/Llama-2-7b-chat-hf-Q3_K_S.gguf
new file mode 100644
index 0000000..98e1910
--- /dev/null
+++ b/Llama-2-7b-chat-hf-Q3_K_S.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6a76489b1b3995d1cdcadbb1a268908a368f4e9b87ff97f410474fd8f1c41c19
+size 2948306272
diff --git a/Llama-2-7b-chat-hf-Q4_0.gguf b/Llama-2-7b-chat-hf-Q4_0.gguf
new file mode 100644
index 0000000..730f31b
--- /dev/null
+++ b/Llama-2-7b-chat-hf-Q4_0.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5aa7402ce5b198abbe049003b5663e9b3ec2c1bd40c33caa40a27743a42b2733
+size 3837080928
diff --git a/Llama-2-7b-chat-hf-Q4_1.gguf b/Llama-2-7b-chat-hf-Q4_1.gguf
new file mode 100644
index 0000000..43bf50b
--- /dev/null
+++ b/Llama-2-7b-chat-hf-Q4_1.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3abf014702f85a696549794094826da428fdf25f8f79e194d04b9817ddcdcd88
+size 4238751072
diff --git a/Llama-2-7b-chat-hf-Q4_K_M.gguf b/Llama-2-7b-chat-hf-Q4_K_M.gguf
new file mode 100644
index 0000000..789c368
--- /dev/null
+++ b/Llama-2-7b-chat-hf-Q4_K_M.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:20e25408cc468b3aedee62f00d12472eecc6877570fc6c0092815b86968eb876
+size 4081005920
diff --git a/Llama-2-7b-chat-hf-Q4_K_S.gguf b/Llama-2-7b-chat-hf-Q4_K_S.gguf
new file mode 100644
index 0000000..6c485ce
--- /dev/null
+++ b/Llama-2-7b-chat-hf-Q4_K_S.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3d4d88390e0581b0af4c3ceef63257d4d40420b7b2d4af04748db3772aaf8afe
+size 3856741728
diff --git a/Llama-2-7b-chat-hf-Q5_0.gguf b/Llama-2-7b-chat-hf-Q5_0.gguf
new file mode 100644
index 0000000..58b32b3
--- /dev/null
+++ b/Llama-2-7b-chat-hf-Q5_0.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f409fa0211983e2712d4c9129656534a4ef4711a57991a601d366a73a6604266
+size 4662965600
diff --git a/Llama-2-7b-chat-hf-Q5_1.gguf b/Llama-2-7b-chat-hf-Q5_1.gguf
new file mode 100644
index 0000000..7918acc
--- /dev/null
+++ b/Llama-2-7b-chat-hf-Q5_1.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a81eed20ba124d64a53fa2868856e1bf1f4ec3ce564f2872c33b2c7bd7c60f0a
+size 5064635744
diff --git a/Llama-2-7b-chat-hf-Q5_K_M.gguf b/Llama-2-7b-chat-hf-Q5_K_M.gguf
new file mode 100644
index 0000000..f469cc2
--- /dev/null
+++ b/Llama-2-7b-chat-hf-Q5_K_M.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:26592efef71f50d739adc97198153a7da5e6a9db9600b6a760adeeff1f1d52df
+size 4783158624
diff --git a/Llama-2-7b-chat-hf-Q5_K_S.gguf b/Llama-2-7b-chat-hf-Q5_K_S.gguf
new file mode 100644
index 0000000..ad460af
--- /dev/null
+++ b/Llama-2-7b-chat-hf-Q5_K_S.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1382e694bf66984a55375d8d08e8d0fad7ee2d191cfb098d0a09ed5608f5c297
+size 4651693408
diff --git a/Llama-2-7b-chat-hf-Q6_K.gguf b/Llama-2-7b-chat-hf-Q6_K.gguf
new file mode 100644
index 0000000..782e101
--- /dev/null
+++ b/Llama-2-7b-chat-hf-Q6_K.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e468d93b6dc431d2ac8c02e4be2e88fc1c72046d74e79070e84746ae87cf8e98
+size 5529195872
diff --git a/Llama-2-7b-chat-hf-Q8_0.gguf b/Llama-2-7b-chat-hf-Q8_0.gguf
new file mode 100644
index 0000000..9a9716d
--- /dev/null
+++ b/Llama-2-7b-chat-hf-Q8_0.gguf
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:32544a43e59db71b103d4bfc05e6071a8f79059072dc541ad01c548cdd5881c2
+size 7161091424
diff --git a/README.md b/README.md
new file mode 100644
index 0000000..c4cf615
--- /dev/null
+++ b/README.md
@@ -0,0 +1,21 @@
+---
+license: other
+language:
+- en
+pipeline_tag: text-generation
+inference: false
+tags:
+- transformers
+- gguf
+- imatrix
+- Llama-2-7b-chat-hf
+---
+Quantizations of https://huggingface.co/meta-llama/Llama-2-7b-chat-hf
+
+
+# From the original README
+
+## Intended Use
+**Intended Use Cases** Llama 2 is intended for commercial and research use in English. Tuned models are intended for assistant-like chat, whereas pretrained models can be adapted for a variety of natural language generation tasks.
+
+To get the expected features and performance for the chat versions, a specific formatting needs to be followed, including the `INST` and `<<SYS>>` tags, `BOS` and `EOS` tokens, and the whitespace and line breaks in between (we recommend calling `strip()` on inputs to avoid double spaces). See our reference code on GitHub for details: [`chat_completion`](https://github.com/facebookresearch/llama/blob/main/llama/generation.py#L212).
\ No newline at end of file