初始化项目,由ModelHub XC社区提供模型
Model: duyntnet/Llama-2-7b-chat-hf-imatrix-GGUF Source: Original Platform
This commit is contained in:
62
.gitattributes
vendored
Normal file
62
.gitattributes
vendored
Normal file
@@ -0,0 +1,62 @@
|
||||
*.7z filter=lfs diff=lfs merge=lfs -text
|
||||
*.arrow filter=lfs diff=lfs merge=lfs -text
|
||||
*.bin filter=lfs diff=lfs merge=lfs -text
|
||||
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
||||
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
||||
*.ftz filter=lfs diff=lfs merge=lfs -text
|
||||
*.gz filter=lfs diff=lfs merge=lfs -text
|
||||
*.h5 filter=lfs diff=lfs merge=lfs -text
|
||||
*.joblib filter=lfs diff=lfs merge=lfs -text
|
||||
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
||||
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
||||
*.model filter=lfs diff=lfs merge=lfs -text
|
||||
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
||||
*.npy filter=lfs diff=lfs merge=lfs -text
|
||||
*.npz filter=lfs diff=lfs merge=lfs -text
|
||||
*.onnx filter=lfs diff=lfs merge=lfs -text
|
||||
*.ot filter=lfs diff=lfs merge=lfs -text
|
||||
*.parquet filter=lfs diff=lfs merge=lfs -text
|
||||
*.pb filter=lfs diff=lfs merge=lfs -text
|
||||
*.pickle filter=lfs diff=lfs merge=lfs -text
|
||||
*.pkl filter=lfs diff=lfs merge=lfs -text
|
||||
*.pt filter=lfs diff=lfs merge=lfs -text
|
||||
*.pth filter=lfs diff=lfs merge=lfs -text
|
||||
*.rar filter=lfs diff=lfs merge=lfs -text
|
||||
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
||||
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
||||
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
||||
*.tar filter=lfs diff=lfs merge=lfs -text
|
||||
*.tflite filter=lfs diff=lfs merge=lfs -text
|
||||
*.tgz filter=lfs diff=lfs merge=lfs -text
|
||||
*.wasm filter=lfs diff=lfs merge=lfs -text
|
||||
*.xz filter=lfs diff=lfs merge=lfs -text
|
||||
*.zip filter=lfs diff=lfs merge=lfs -text
|
||||
*.zst filter=lfs diff=lfs merge=lfs -text
|
||||
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-2-7b-chat-hf-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-2-7b-chat-hf-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-2-7b-chat-hf-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-2-7b-chat-hf-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-2-7b-chat-hf-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-2-7b-chat-hf-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-2-7b-chat-hf-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-2-7b-chat-hf-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-2-7b-chat-hf-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-2-7b-chat-hf-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-2-7b-chat-hf-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-2-7b-chat-hf-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-2-7b-chat-hf-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-2-7b-chat-hf-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-2-7b-chat-hf-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-2-7b-chat-hf-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-2-7b-chat-hf-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-2-7b-chat-hf-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-2-7b-chat-hf-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-2-7b-chat-hf-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-2-7b-chat-hf-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-2-7b-chat-hf-Q5_0.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-2-7b-chat-hf-Q5_1.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-2-7b-chat-hf-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-2-7b-chat-hf-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-2-7b-chat-hf-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Llama-2-7b-chat-hf-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
3
Llama-2-7b-chat-hf-IQ1_M.gguf
Normal file
3
Llama-2-7b-chat-hf-IQ1_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:f3aba0b1dcc9f657ec4b4ae37de5a58a9f8b69882166089bc5bab976cb8384e0
|
||||
size 1650972000
|
||||
3
Llama-2-7b-chat-hf-IQ1_S.gguf
Normal file
3
Llama-2-7b-chat-hf-IQ1_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:7be5b493f0a1bfeb2bf2246aba2c6d6486934a273b93dd40fd55387f2d45f121
|
||||
size 1528583520
|
||||
3
Llama-2-7b-chat-hf-IQ2_M.gguf
Normal file
3
Llama-2-7b-chat-hf-IQ2_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:4bf2ca8eb8707168195fbcf1d027290eced6511218b98426227cdfef6b5fccee
|
||||
size 2359752032
|
||||
3
Llama-2-7b-chat-hf-IQ2_S.gguf
Normal file
3
Llama-2-7b-chat-hf-IQ2_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:2f9660cf05fcd924c6e8473d013c2bda6310c46ef8916266ac0959e1e7b8fae3
|
||||
size 2196567392
|
||||
3
Llama-2-7b-chat-hf-IQ2_XS.gguf
Normal file
3
Llama-2-7b-chat-hf-IQ2_XS.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:843f5b7c61b641252bd482f2de9083de3d97fbdb42ebce11a09f56f160312c05
|
||||
size 2034914656
|
||||
3
Llama-2-7b-chat-hf-IQ2_XXS.gguf
Normal file
3
Llama-2-7b-chat-hf-IQ2_XXS.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:270b9418b779788c4fc326009a87da4fb83cbdbfff06f54ce6cbcf9ac41f8ac1
|
||||
size 1854952800
|
||||
3
Llama-2-7b-chat-hf-IQ3_M.gguf
Normal file
3
Llama-2-7b-chat-hf-IQ3_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:5cb769b67b343e7334a687736f74e1951a2e70739d4761d79326af71770fd6d0
|
||||
size 3114866016
|
||||
3
Llama-2-7b-chat-hf-IQ3_S.gguf
Normal file
3
Llama-2-7b-chat-hf-IQ3_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:dccb7e9fd77c056860204deb027b6e32be24c5f6888eb6cdd0bd63c9d274ae09
|
||||
size 2948306272
|
||||
3
Llama-2-7b-chat-hf-IQ3_XS.gguf
Normal file
3
Llama-2-7b-chat-hf-IQ3_XS.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:a59a1dfee37a322e5a7601362c73051bf50a362edf92737b6ccca692fc38b62a
|
||||
size 2796524896
|
||||
3
Llama-2-7b-chat-hf-IQ3_XXS.gguf
Normal file
3
Llama-2-7b-chat-hf-IQ3_XXS.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:c05de01131bb1baae15a1294f32e74a623740bd872c198f21ada05c2506df855
|
||||
size 2585392480
|
||||
3
Llama-2-7b-chat-hf-IQ4_NL.gguf
Normal file
3
Llama-2-7b-chat-hf-IQ4_NL.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:c739350603f47e1aef34247bc3d89ecdd48ca7801a91cec83b5c035e9d326f6c
|
||||
size 3825808736
|
||||
3
Llama-2-7b-chat-hf-IQ4_XS.gguf
Normal file
3
Llama-2-7b-chat-hf-IQ4_XS.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:28e8af7533692f5227fec40a3a9537a48136967601ce5b9a895053998c78e35b
|
||||
size 3619337568
|
||||
3
Llama-2-7b-chat-hf-Q2_K.gguf
Normal file
3
Llama-2-7b-chat-hf-Q2_K.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:8df736aee9d846a14b627394e0f39396b678d87ee8eee88c075bce314bde40ab
|
||||
size 2532865376
|
||||
3
Llama-2-7b-chat-hf-Q2_K_S.gguf
Normal file
3
Llama-2-7b-chat-hf-Q2_K_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:ea9af1796f1e80f4d3a3f3f9c76a491bb1e17ccb0d59d5b9adbadaead77bc7c3
|
||||
size 2319545696
|
||||
3
Llama-2-7b-chat-hf-Q3_K_L.gguf
Normal file
3
Llama-2-7b-chat-hf-Q3_K_L.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:72bb5c818b8ffde7ebac50a01dcc5bc200be87a421be0d6cabb6591e8f5cf43b
|
||||
size 3597112672
|
||||
3
Llama-2-7b-chat-hf-Q3_K_M.gguf
Normal file
3
Llama-2-7b-chat-hf-Q3_K_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:8392e52ef3fc674f459fd716dfc718373cf47ca730785c1f5d1e16f905d87012
|
||||
size 3298006368
|
||||
3
Llama-2-7b-chat-hf-Q3_K_S.gguf
Normal file
3
Llama-2-7b-chat-hf-Q3_K_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:6a76489b1b3995d1cdcadbb1a268908a368f4e9b87ff97f410474fd8f1c41c19
|
||||
size 2948306272
|
||||
3
Llama-2-7b-chat-hf-Q4_0.gguf
Normal file
3
Llama-2-7b-chat-hf-Q4_0.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:5aa7402ce5b198abbe049003b5663e9b3ec2c1bd40c33caa40a27743a42b2733
|
||||
size 3837080928
|
||||
3
Llama-2-7b-chat-hf-Q4_1.gguf
Normal file
3
Llama-2-7b-chat-hf-Q4_1.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:3abf014702f85a696549794094826da428fdf25f8f79e194d04b9817ddcdcd88
|
||||
size 4238751072
|
||||
3
Llama-2-7b-chat-hf-Q4_K_M.gguf
Normal file
3
Llama-2-7b-chat-hf-Q4_K_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:20e25408cc468b3aedee62f00d12472eecc6877570fc6c0092815b86968eb876
|
||||
size 4081005920
|
||||
3
Llama-2-7b-chat-hf-Q4_K_S.gguf
Normal file
3
Llama-2-7b-chat-hf-Q4_K_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:3d4d88390e0581b0af4c3ceef63257d4d40420b7b2d4af04748db3772aaf8afe
|
||||
size 3856741728
|
||||
3
Llama-2-7b-chat-hf-Q5_0.gguf
Normal file
3
Llama-2-7b-chat-hf-Q5_0.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:f409fa0211983e2712d4c9129656534a4ef4711a57991a601d366a73a6604266
|
||||
size 4662965600
|
||||
3
Llama-2-7b-chat-hf-Q5_1.gguf
Normal file
3
Llama-2-7b-chat-hf-Q5_1.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:a81eed20ba124d64a53fa2868856e1bf1f4ec3ce564f2872c33b2c7bd7c60f0a
|
||||
size 5064635744
|
||||
3
Llama-2-7b-chat-hf-Q5_K_M.gguf
Normal file
3
Llama-2-7b-chat-hf-Q5_K_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:26592efef71f50d739adc97198153a7da5e6a9db9600b6a760adeeff1f1d52df
|
||||
size 4783158624
|
||||
3
Llama-2-7b-chat-hf-Q5_K_S.gguf
Normal file
3
Llama-2-7b-chat-hf-Q5_K_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:1382e694bf66984a55375d8d08e8d0fad7ee2d191cfb098d0a09ed5608f5c297
|
||||
size 4651693408
|
||||
3
Llama-2-7b-chat-hf-Q6_K.gguf
Normal file
3
Llama-2-7b-chat-hf-Q6_K.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:e468d93b6dc431d2ac8c02e4be2e88fc1c72046d74e79070e84746ae87cf8e98
|
||||
size 5529195872
|
||||
3
Llama-2-7b-chat-hf-Q8_0.gguf
Normal file
3
Llama-2-7b-chat-hf-Q8_0.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:32544a43e59db71b103d4bfc05e6071a8f79059072dc541ad01c548cdd5881c2
|
||||
size 7161091424
|
||||
21
README.md
Normal file
21
README.md
Normal file
@@ -0,0 +1,21 @@
|
||||
---
|
||||
license: other
|
||||
language:
|
||||
- en
|
||||
pipeline_tag: text-generation
|
||||
inference: false
|
||||
tags:
|
||||
- transformers
|
||||
- gguf
|
||||
- imatrix
|
||||
- Llama-2-7b-chat-hf
|
||||
---
|
||||
GGUF quantizations (generated with an importance matrix) of [meta-llama/Llama-2-7b-chat-hf](https://huggingface.co/meta-llama/Llama-2-7b-chat-hf).
|
||||
|
||||
|
||||
# From original readme
|
||||
|
||||
## Intended Use
|
||||
**Intended Use Cases** Llama 2 is intended for commercial and research use in English. Tuned models are intended for assistant-like chat, whereas pretrained models can be adapted for a variety of natural language generation tasks.
|
||||
|
||||
To get the expected features and performance from the chat versions, a specific format must be followed, including the `INST` and `<<SYS>>` tags, the `BOS` and `EOS` tokens, and the whitespace and line breaks in between (we recommend calling `strip()` on inputs to avoid double spaces). See our reference code on GitHub for details: [`chat_completion`](https://github.com/facebookresearch/llama/blob/main/llama/generation.py#L212).
|
||||
Reference in New Issue
Block a user