初始化项目,由ModelHub XC社区提供模型
Model: shaowenchen/llama-2-7b-langchain-chat-gguf Source: Original Platform
This commit is contained in:
36
.gitattributes
vendored
Normal file
36
.gitattributes
vendored
Normal file
@@ -0,0 +1,36 @@
|
||||
*.7z filter=lfs diff=lfs merge=lfs -text
|
||||
*.arrow filter=lfs diff=lfs merge=lfs -text
|
||||
*.bin filter=lfs diff=lfs merge=lfs -text
|
||||
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
||||
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
||||
*.ftz filter=lfs diff=lfs merge=lfs -text
|
||||
*.gz filter=lfs diff=lfs merge=lfs -text
|
||||
*.h5 filter=lfs diff=lfs merge=lfs -text
|
||||
*.joblib filter=lfs diff=lfs merge=lfs -text
|
||||
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
||||
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
||||
*.model filter=lfs diff=lfs merge=lfs -text
|
||||
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
||||
*.npy filter=lfs diff=lfs merge=lfs -text
|
||||
*.npz filter=lfs diff=lfs merge=lfs -text
|
||||
*.onnx filter=lfs diff=lfs merge=lfs -text
|
||||
*.ot filter=lfs diff=lfs merge=lfs -text
|
||||
*.parquet filter=lfs diff=lfs merge=lfs -text
|
||||
*.pb filter=lfs diff=lfs merge=lfs -text
|
||||
*.pickle filter=lfs diff=lfs merge=lfs -text
|
||||
*.pkl filter=lfs diff=lfs merge=lfs -text
|
||||
*.pt filter=lfs diff=lfs merge=lfs -text
|
||||
*.pth filter=lfs diff=lfs merge=lfs -text
|
||||
*.rar filter=lfs diff=lfs merge=lfs -text
|
||||
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
||||
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
||||
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
||||
*.tar filter=lfs diff=lfs merge=lfs -text
|
||||
*.tflite filter=lfs diff=lfs merge=lfs -text
|
||||
*.tgz filter=lfs diff=lfs merge=lfs -text
|
||||
*.wasm filter=lfs diff=lfs merge=lfs -text
|
||||
*.xz filter=lfs diff=lfs merge=lfs -text
|
||||
*.zip filter=lfs diff=lfs merge=lfs -text
|
||||
*.zst filter=lfs diff=lfs merge=lfs -text
|
||||
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
||||
*.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
74
README.md
Normal file
74
README.md
Normal file
@@ -0,0 +1,74 @@
|
||||
---
|
||||
inference: false
|
||||
language:
|
||||
- zh
|
||||
- en
|
||||
license: other
|
||||
model_creator: Photolens
|
||||
model_link: https://huggingface.co/Photolens/llama-2-7b-langchain-chat
|
||||
model_name: llama-2-7b-langchain-chat
|
||||
model_type: llama
|
||||
pipeline_tag: text-generation
|
||||
quantized_by: shaowenchen
|
||||
tasks:
|
||||
- text2text-generation
|
||||
tags:
|
||||
- meta
|
||||
- gguf
|
||||
- llama
|
||||
- llama-2
|
||||
- chinese
|
||||
- 7b
|
||||
---
|
||||
|
||||
## Provided files
|
||||
|
||||
| Name | Quant method | Size |
|
||||
| ------------------------------------- | ------------ | ------ |
|
||||
| llama-2-7b-langchain-chat.Q2_K.gguf | Q2_K | 2.6 GB |
|
||||
| llama-2-7b-langchain-chat.Q3_K.gguf | Q3_K | 3.1 GB |
|
||||
| llama-2-7b-langchain-chat.Q3_K_L.gguf | Q3_K_L | 3.3 GB |
|
||||
| llama-2-7b-langchain-chat.Q3_K_S.gguf | Q3_K_S | 2.7 GB |
|
||||
| llama-2-7b-langchain-chat.Q4_0.gguf | Q4_0 | 3.6 GB |
|
||||
| llama-2-7b-langchain-chat.Q4_1.gguf | Q4_1 | 3.9 GB |
|
||||
| llama-2-7b-langchain-chat.Q4_K.gguf | Q4_K | 3.8 GB |
|
||||
| llama-2-7b-langchain-chat.Q4_K_S.gguf | Q4_K_S | 3.6 GB |
|
||||
| llama-2-7b-langchain-chat.Q5_0.gguf | Q5_0 | 4.3 GB |
|
||||
| llama-2-7b-langchain-chat.Q5_1.gguf | Q5_1 | 4.7 GB |
|
||||
| llama-2-7b-langchain-chat.Q5_K.gguf | Q5_K | 4.5 GB |
|
||||
| llama-2-7b-langchain-chat.Q5_K_S.gguf | Q5_K_S | 4.3 GB |
|
||||
| llama-2-7b-langchain-chat.Q6_K.gguf | Q6_K | 5.1 GB |
|
||||
| llama-2-7b-langchain-chat.Q8_0.gguf | Q8_0 | 6.7 GB |
|
||||
| llama-2-7b-langchain-chat.gguf | full | 13 GB |
|
||||
|
||||
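Usage (replace `/path/to/models` with the local directory that holds the downloaded file, and `gguf-model-name.gguf` with the file name from the table above):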
|
||||
|
||||
```
|
||||
docker run --rm -it -p 8000:8000 -v /path/to/models:/models -e MODEL=/models/gguf-model-name.gguf hubimage/llama-cpp-python:latest
|
||||
```
|
||||
|
||||
Then open http://localhost:8000/docs in a browser to view the Swagger UI.
|
||||
|
||||
## Provided images
|
||||
|
||||
| Name | Quant method | Size |
|
||||
| ------------------------------------------------- | ------------ | ------- |
|
||||
| shaowenchen/llama-2-7b-langchain-chat-gguf:Q2_K | Q2_K | 6.72 GB |
|
||||
| shaowenchen/llama-2-7b-langchain-chat-gguf:Q3_K | Q3_K | 7.64 GB |
|
||||
| shaowenchen/llama-2-7b-langchain-chat-gguf:Q3_K_L | Q3_K_L | 8.27 GB |
|
||||
| shaowenchen/llama-2-7b-langchain-chat-gguf:Q3_K_S | Q3_K_S | 6.97 GB |
|
||||
| shaowenchen/llama-2-7b-langchain-chat-gguf:Q4_0 | Q4_0 | 8.55 GB |
|
||||
| shaowenchen/llama-2-7b-langchain-chat-gguf:Q4_1 | Q4_1 | 9.41 GB |
|
||||
| shaowenchen/llama-2-7b-langchain-chat-gguf:Q4_K | Q4_K | 9.17 GB |
|
||||
| shaowenchen/llama-2-7b-langchain-chat-gguf:Q4_K_S | Q4_K_S | 8.72 GB |
|
||||
| shaowenchen/llama-2-7b-langchain-chat-gguf:Q5_0 | Q5_0 | 10.4 GB |
|
||||
| shaowenchen/llama-2-7b-langchain-chat-gguf:Q5_K | Q5_K | 10.6 GB |
|
||||
| shaowenchen/llama-2-7b-langchain-chat-gguf:Q5_K_S | Q5_K_S | 10.4 GB |
|
||||
|
||||
Usage:
|
||||
|
||||
```
|
||||
docker run --rm -p 8000:8000 shaowenchen/llama-2-7b-langchain-chat-gguf:Q2_K
|
||||
```
|
||||
|
||||
Then open http://localhost:8000/docs in a browser to view the Swagger UI.
|
||||
10
configuration.json
Normal file
10
configuration.json
Normal file
@@ -0,0 +1,10 @@
|
||||
{
|
||||
"framework": "pytorch",
|
||||
"task": "text-generation",
|
||||
"model": {
|
||||
"type": "llama2"
|
||||
},
|
||||
"pipeline": {
|
||||
"type": "llama-2-7b-langchain-chat-text-generation-pipe"
|
||||
}
|
||||
}
|
||||
3
llama-2-7b-langchain-chat.Q2_K.gguf
Normal file
3
llama-2-7b-langchain-chat.Q2_K.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:63c999be294da36ee52df97364ecb05fb19347bb4571c25431989708e4d90f18
|
||||
size 2825940672
|
||||
3
llama-2-7b-langchain-chat.Q3_K.gguf
Normal file
3
llama-2-7b-langchain-chat.Q3_K.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:afcbca6945929719f0fd3c4ea1c6c3dd87836976283928307d97eb899a976d7c
|
||||
size 3298004672
|
||||
3
llama-2-7b-langchain-chat.Q3_K_L.gguf
Normal file
3
llama-2-7b-langchain-chat.Q3_K_L.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:94d27df5c6dba24d51e1531ef0e021a89c1f2d861ab92de387986d1b78f9ef68
|
||||
size 3597110976
|
||||
3
llama-2-7b-langchain-chat.Q3_K_S.gguf
Normal file
3
llama-2-7b-langchain-chat.Q3_K_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:599007a41fc29ed2c5260edc1665911f59a072c0212009a1e1665884c889a70e
|
||||
size 2948304576
|
||||
3
llama-2-7b-langchain-chat.Q4_0.gguf
Normal file
3
llama-2-7b-langchain-chat.Q4_0.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:c70775c9f5d5041141d01d4a9d48038964ad25bc169c7996c340293ee3da2c72
|
||||
size 3825807040
|
||||
3
llama-2-7b-langchain-chat.Q4_1.gguf
Normal file
3
llama-2-7b-langchain-chat.Q4_1.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:84781a2e90d22da3d681d94ee38c9b54bf5d7afc655a6357797cbacff6523f1d
|
||||
size 4238749376
|
||||
3
llama-2-7b-langchain-chat.Q4_K.gguf
Normal file
3
llama-2-7b-langchain-chat.Q4_K.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:750e96efc7b6220462eabd02938ba1410c991773896acca1317e6da51b623a3e
|
||||
size 4081004224
|
||||
3
llama-2-7b-langchain-chat.Q4_K_S.gguf
Normal file
3
llama-2-7b-langchain-chat.Q4_K_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:edd52d07f82182e3748a2150abc9c17c619e650debac90b8d8649e66917736e0
|
||||
size 3856740032
|
||||
3
llama-2-7b-langchain-chat.Q5_0.gguf
Normal file
3
llama-2-7b-langchain-chat.Q5_0.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:de480a2674ca0d1656888700d2853ae39a20f0dcd21f092243393d7001c0e0f8
|
||||
size 4651691712
|
||||
3
llama-2-7b-langchain-chat.Q5_1.gguf
Normal file
3
llama-2-7b-langchain-chat.Q5_1.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:b024062fde85c7ece0efdf38d4bd8f99b0a7eb821bb1a2544d26771834963631
|
||||
size 5064634048
|
||||
3
llama-2-7b-langchain-chat.Q5_K.gguf
Normal file
3
llama-2-7b-langchain-chat.Q5_K.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:00c1c6129bccc237cdb85b065a25b8826f96464c94946a4f28a11313f10f0362
|
||||
size 4783156928
|
||||
3
llama-2-7b-langchain-chat.Q5_K_S.gguf
Normal file
3
llama-2-7b-langchain-chat.Q5_K_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:0e82d7cc1a7c64e17dd48e5eb1488b8065421c7271d47810b36da33df065b939
|
||||
size 4651691712
|
||||
3
llama-2-7b-langchain-chat.Q6_K.gguf
Normal file
3
llama-2-7b-langchain-chat.Q6_K.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:9a625393ec6f72b60c3c0c7cd7db547b875c9becb6a8d43288036c73f8c4f7b7
|
||||
size 5529194176
|
||||
3
llama-2-7b-langchain-chat.Q8_0.gguf
Normal file
3
llama-2-7b-langchain-chat.Q8_0.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:84c321bc9173ded1e14d5a4139f524c4f809eb06c9c5ebe68a8dfd4deb43dc27
|
||||
size 7161089728
|
||||
3
llama-2-7b-langchain-chat.gguf
Normal file
3
llama-2-7b-langchain-chat.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:db3dc1820636e9db9a694b4633c743216726c03067ae1c7d1d5aeaacd5ddceec
|
||||
size 13478104736
|
||||
Reference in New Issue
Block a user