初始化项目,由ModelHub XC社区提供模型
Model: duyntnet/Vistral-7B-Chat-imatrix-GGUF Source: Original Platform
This commit is contained in:
62
.gitattributes
vendored
Normal file
62
.gitattributes
vendored
Normal file
@@ -0,0 +1,62 @@
|
||||
*.7z filter=lfs diff=lfs merge=lfs -text
|
||||
*.arrow filter=lfs diff=lfs merge=lfs -text
|
||||
*.bin filter=lfs diff=lfs merge=lfs -text
|
||||
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
||||
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
||||
*.ftz filter=lfs diff=lfs merge=lfs -text
|
||||
*.gz filter=lfs diff=lfs merge=lfs -text
|
||||
*.h5 filter=lfs diff=lfs merge=lfs -text
|
||||
*.joblib filter=lfs diff=lfs merge=lfs -text
|
||||
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
||||
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
||||
*.model filter=lfs diff=lfs merge=lfs -text
|
||||
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
||||
*.npy filter=lfs diff=lfs merge=lfs -text
|
||||
*.npz filter=lfs diff=lfs merge=lfs -text
|
||||
*.onnx filter=lfs diff=lfs merge=lfs -text
|
||||
*.ot filter=lfs diff=lfs merge=lfs -text
|
||||
*.parquet filter=lfs diff=lfs merge=lfs -text
|
||||
*.pb filter=lfs diff=lfs merge=lfs -text
|
||||
*.pickle filter=lfs diff=lfs merge=lfs -text
|
||||
*.pkl filter=lfs diff=lfs merge=lfs -text
|
||||
*.pt filter=lfs diff=lfs merge=lfs -text
|
||||
*.pth filter=lfs diff=lfs merge=lfs -text
|
||||
*.rar filter=lfs diff=lfs merge=lfs -text
|
||||
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
||||
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
||||
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
||||
*.tar filter=lfs diff=lfs merge=lfs -text
|
||||
*.tflite filter=lfs diff=lfs merge=lfs -text
|
||||
*.tgz filter=lfs diff=lfs merge=lfs -text
|
||||
*.wasm filter=lfs diff=lfs merge=lfs -text
|
||||
*.xz filter=lfs diff=lfs merge=lfs -text
|
||||
*.zip filter=lfs diff=lfs merge=lfs -text
|
||||
*.zst filter=lfs diff=lfs merge=lfs -text
|
||||
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
||||
Vistral-7B-Chat-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Vistral-7B-Chat-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Vistral-7B-Chat-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Vistral-7B-Chat-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Vistral-7B-Chat-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Vistral-7B-Chat-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Vistral-7B-Chat-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Vistral-7B-Chat-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Vistral-7B-Chat-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Vistral-7B-Chat-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Vistral-7B-Chat-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Vistral-7B-Chat-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Vistral-7B-Chat-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Vistral-7B-Chat-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Vistral-7B-Chat-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Vistral-7B-Chat-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Vistral-7B-Chat-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Vistral-7B-Chat-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Vistral-7B-Chat-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Vistral-7B-Chat-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Vistral-7B-Chat-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Vistral-7B-Chat-Q5_0.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Vistral-7B-Chat-Q5_1.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Vistral-7B-Chat-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Vistral-7B-Chat-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Vistral-7B-Chat-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
Vistral-7B-Chat-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text
|
||||
60
README.md
Normal file
60
README.md
Normal file
@@ -0,0 +1,60 @@
|
||||
---
|
||||
license: other
|
||||
language:
|
||||
- en
|
||||
pipeline_tag: text-generation
|
||||
inference: false
|
||||
tags:
|
||||
- transformers
|
||||
- gguf
|
||||
- imatrix
|
||||
- Vistral-7B-Chat
|
||||
---
|
||||
GGUF (imatrix) quantizations of https://huggingface.co/Viet-Mistral/Vistral-7B-Chat
|
||||
|
||||
# From the original README
|
||||
|
||||
## Usage
|
||||
|
||||
To enable single/multi-turn conversational chat with `Vistral-7B-Chat`, you can use the default chat template format:
|
||||
|
||||
```python
|
||||
import torch
|
||||
from transformers import AutoModelForCausalLM, AutoTokenizer
|
||||
|
||||
system_prompt = "Bạn là một trợ lí Tiếng Việt nhiệt tình và trung thực. Hãy luôn trả lời một cách hữu ích nhất có thể, đồng thời giữ an toàn.\n"
|
||||
system_prompt += "Câu trả lời của bạn không nên chứa bất kỳ nội dung gây hại, phân biệt chủng tộc, phân biệt giới tính, độc hại, nguy hiểm hoặc bất hợp pháp nào. Hãy đảm bảo rằng các câu trả lời của bạn không có thiên kiến xã hội và mang tính tích cực."
|
||||
system_prompt += "Nếu một câu hỏi không có ý nghĩa hoặc không hợp lý về mặt thông tin, hãy giải thích tại sao thay vì trả lời một điều gì đó không chính xác. Nếu bạn không biết câu trả lời cho một câu hỏi, hãy trẳ lời là bạn không biết và vui lòng không chia sẻ thông tin sai lệch."
|
||||
|
||||
tokenizer = AutoTokenizer.from_pretrained('Viet-Mistral/Vistral-7B-Chat')
|
||||
model = AutoModelForCausalLM.from_pretrained(
|
||||
'Viet-Mistral/Vistral-7B-Chat',
|
||||
torch_dtype=torch.bfloat16, # change to torch.float16 if you're using V100
|
||||
device_map="auto",
|
||||
use_cache=True,
|
||||
)
|
||||
|
||||
conversation = [{"role": "system", "content": system_prompt }]
|
||||
while True:
|
||||
human = input("Human: ")
|
||||
if human.lower() == "reset":
|
||||
conversation = [{"role": "system", "content": system_prompt }]
|
||||
print("The chat history has been cleared!")
|
||||
continue
|
||||
|
||||
conversation.append({"role": "user", "content": human })
|
||||
input_ids = tokenizer.apply_chat_template(conversation, return_tensors="pt").to(model.device)
|
||||
|
||||
out_ids = model.generate(
|
||||
input_ids=input_ids,
|
||||
max_new_tokens=768,
|
||||
do_sample=True,
|
||||
top_p=0.95,
|
||||
top_k=40,
|
||||
temperature=0.1,
|
||||
repetition_penalty=1.05,
|
||||
)
|
||||
assistant = tokenizer.batch_decode(out_ids[:, input_ids.size(1): ], skip_special_tokens=True)[0].strip()
|
||||
print("Assistant: ", assistant)
|
||||
conversation.append({"role": "assistant", "content": assistant })
|
||||
```
|
||||
3
Vistral-7B-Chat-IQ1_M.gguf
Normal file
3
Vistral-7B-Chat-IQ1_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:436a6746c4612e4f3e73cb834b3b9bd6ee508d242c97d43d9503b0a6618a4afa
|
||||
size 1781090016
|
||||
3
Vistral-7B-Chat-IQ1_S.gguf
Normal file
3
Vistral-7B-Chat-IQ1_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:b9547c09465e6d0848114097b5cd0a42f6cbb70b67b2aa6a83c8fb09b1d9ae0e
|
||||
size 1638745824
|
||||
3
Vistral-7B-Chat-IQ2_M.gguf
Normal file
3
Vistral-7B-Chat-IQ2_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:56b824fd83d1e1f663096ab7b810fd7198739bbdcbd839d7958c4ef3fbb2fc0d
|
||||
size 2530006144
|
||||
3
Vistral-7B-Chat-IQ2_S.gguf
Normal file
3
Vistral-7B-Chat-IQ2_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:66ac127eb065b7b2e6eee2510195ea225298a64f09fc8c925a5c438960e57614
|
||||
size 2340213888
|
||||
3
Vistral-7B-Chat-IQ2_XS.gguf
Normal file
3
Vistral-7B-Chat-IQ2_XS.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:09c7e651bdbaad9057155cf156cbbbb9319a5a28614d7791d05c8ca3d746fa97
|
||||
size 2224899808
|
||||
3
Vistral-7B-Chat-IQ2_XXS.gguf
Normal file
3
Vistral-7B-Chat-IQ2_XXS.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:5fd3cb112a004bc6608c30b64bcd68540e3f52fb9ebd800af24655a4d189063e
|
||||
size 2018330336
|
||||
3
Vistral-7B-Chat-IQ3_M.gguf
Normal file
3
Vistral-7B-Chat-IQ3_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:6ca4e03ca6cdd013701e5a38fac72212868037e56b998703f57cd993a14b99cb
|
||||
size 3317650080
|
||||
3
Vistral-7B-Chat-IQ3_S.gguf
Normal file
3
Vistral-7B-Chat-IQ3_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:32bcc62744d91e8f12f68b6537541e8a35cc2fbe8e3c60b77fe5f5285255080b
|
||||
size 3215151776
|
||||
3
Vistral-7B-Chat-IQ3_XS.gguf
Normal file
3
Vistral-7B-Chat-IQ3_XS.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:79dca1a6be014551b0d82731e35d5985e88e41788224cb6982616c4f057b024e
|
||||
size 3051573920
|
||||
3
Vistral-7B-Chat-IQ3_XXS.gguf
Normal file
3
Vistral-7B-Chat-IQ3_XXS.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:8e8855990539047e5fe03c8962592a816b65c809e64ed6a8d9be4a70eb780aa9
|
||||
size 2856637568
|
||||
3
Vistral-7B-Chat-IQ4_NL.gguf
Normal file
3
Vistral-7B-Chat-IQ4_NL.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:b602fedb65d849d92c621c342d354c88b65ad93c791b258ea685e6a0c03e500d
|
||||
size 4161917120
|
||||
3
Vistral-7B-Chat-IQ4_XS.gguf
Normal file
3
Vistral-7B-Chat-IQ4_XS.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:fde2fb02d5b8896af3dd60098987e97369fb4e4cd02c6346e308ee3f4a128e0d
|
||||
size 3943096384
|
||||
3
Vistral-7B-Chat-Q2_K.gguf
Normal file
3
Vistral-7B-Chat-Q2_K.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:dffa0435fd646c0bc1253521bdba3ad14eaf9759e3a4dd0d9c165212f530e3f6
|
||||
size 2749351168
|
||||
3
Vistral-7B-Chat-Q2_K_S.gguf
Normal file
3
Vistral-7B-Chat-Q2_K_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:e31c42dcafb01fd4024da4653e6281c583c5c1f6842a81e6fbb95a4f24b0a2b0
|
||||
size 2559034624
|
||||
3
Vistral-7B-Chat-Q3_K_L.gguf
Normal file
3
Vistral-7B-Chat-Q3_K_L.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:336d5aed85616561396f4a0ba5a7808ec3e8e765649bc52b8d7327ed24a00c76
|
||||
size 3854783136
|
||||
3
Vistral-7B-Chat-Q3_K_M.gguf
Normal file
3
Vistral-7B-Chat-Q3_K_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:544b04dfa91e258cc13f584b07fd3509560bdc560ed6facdc36592f11ee9b078
|
||||
size 3551744672
|
||||
3
Vistral-7B-Chat-Q3_K_S.gguf
Normal file
3
Vistral-7B-Chat-Q3_K_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:40d0ccc42a0fd5e9fb4519291aab3c1e15992d31cdde29a440b03a9409ff4dfe
|
||||
size 3197325984
|
||||
3
Vistral-7B-Chat-Q4_0.gguf
Normal file
3
Vistral-7B-Chat-Q4_0.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:8232ef8de32a4ef4378fb4b7d52072e6915d78a0fe0fca5938146ede1dc8286a
|
||||
size 4159819968
|
||||
3
Vistral-7B-Chat-Q4_1.gguf
Normal file
3
Vistral-7B-Chat-Q4_1.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:d7764635ad2024caaeeeef7d0334de7f28db0e8b8317cf4eb4504cddd35e4b7e
|
||||
size 4591169984
|
||||
3
Vistral-7B-Chat-Q4_K_M.gguf
Normal file
3
Vistral-7B-Chat-Q4_K_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:9f90eb1d9bf52bbd157e3c8233f06a0e4e9b984e591961d8583792bcb0b55442
|
||||
size 4404662464
|
||||
3
Vistral-7B-Chat-Q4_K_S.gguf
Normal file
3
Vistral-7B-Chat-Q4_K_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:98aa797ddeaa6ab2824c48e3ce80ff739caba44ea334b6861f8bc70b70ce81e8
|
||||
size 4176597184
|
||||
3
Vistral-7B-Chat-Q5_0.gguf
Normal file
3
Vistral-7B-Chat-Q5_0.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:d7a0d703b2550b1b92a034f2d834909f81fd7e15fb9dc6518bf2d212a6a46a7c
|
||||
size 5051880128
|
||||
3
Vistral-7B-Chat-Q5_1.gguf
Normal file
3
Vistral-7B-Chat-Q5_1.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:507850b6c32c536c69d2fd0e6a67146c499041f3b267e28b768f10dfb70f835a
|
||||
size 5483230144
|
||||
3
Vistral-7B-Chat-Q5_K_M.gguf
Normal file
3
Vistral-7B-Chat-Q5_K_M.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:8a0132536c56065c0f9daad04ab59456a8ffef5d4909d809c5bacba9865d0d0b
|
||||
size 5170893504
|
||||
3
Vistral-7B-Chat-Q5_K_S.gguf
Normal file
3
Vistral-7B-Chat-Q5_K_S.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:e58b42ec6852d9986c9e380e3e8d08d3f29b0304ed1990e6fc1e7e710c79f2de
|
||||
size 5037200064
|
||||
3
Vistral-7B-Chat-Q6_K.gguf
Normal file
3
Vistral-7B-Chat-Q6_K.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:4baae47e0038874afd24458265b05a4b04331f22585f1ad6707d3bbfd9d8624c
|
||||
size 5985013984
|
||||
3
Vistral-7B-Chat-Q8_0.gguf
Normal file
3
Vistral-7B-Chat-Q8_0.gguf
Normal file
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:c2ea5e26ca270b6205922509ce52264c7755e6b39ccdcbbf25285cc6f51f0cef
|
||||
size 7751442592
|
||||
Reference in New Issue
Block a user