初始化项目,由ModelHub XC社区提供模型

Model: duyntnet/Vistral-7B-Chat-imatrix-GGUF
Source: Original Platform
This commit is contained in:
ModelHub XC
2026-06-17 16:08:15 +08:00
commit d39a7a42bf
29 changed files with 203 additions and 0 deletions

62
.gitattributes vendored Normal file
View File

@@ -0,0 +1,62 @@
*.7z filter=lfs diff=lfs merge=lfs -text
*.arrow filter=lfs diff=lfs merge=lfs -text
*.bin filter=lfs diff=lfs merge=lfs -text
*.bz2 filter=lfs diff=lfs merge=lfs -text
*.ckpt filter=lfs diff=lfs merge=lfs -text
*.ftz filter=lfs diff=lfs merge=lfs -text
*.gz filter=lfs diff=lfs merge=lfs -text
*.h5 filter=lfs diff=lfs merge=lfs -text
*.joblib filter=lfs diff=lfs merge=lfs -text
*.lfs.* filter=lfs diff=lfs merge=lfs -text
*.mlmodel filter=lfs diff=lfs merge=lfs -text
*.model filter=lfs diff=lfs merge=lfs -text
*.msgpack filter=lfs diff=lfs merge=lfs -text
*.npy filter=lfs diff=lfs merge=lfs -text
*.npz filter=lfs diff=lfs merge=lfs -text
*.onnx filter=lfs diff=lfs merge=lfs -text
*.ot filter=lfs diff=lfs merge=lfs -text
*.parquet filter=lfs diff=lfs merge=lfs -text
*.pb filter=lfs diff=lfs merge=lfs -text
*.pickle filter=lfs diff=lfs merge=lfs -text
*.pkl filter=lfs diff=lfs merge=lfs -text
*.pt filter=lfs diff=lfs merge=lfs -text
*.pth filter=lfs diff=lfs merge=lfs -text
*.rar filter=lfs diff=lfs merge=lfs -text
*.safetensors filter=lfs diff=lfs merge=lfs -text
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
*.tar.* filter=lfs diff=lfs merge=lfs -text
*.tar filter=lfs diff=lfs merge=lfs -text
*.tflite filter=lfs diff=lfs merge=lfs -text
*.tgz filter=lfs diff=lfs merge=lfs -text
*.wasm filter=lfs diff=lfs merge=lfs -text
*.xz filter=lfs diff=lfs merge=lfs -text
*.zip filter=lfs diff=lfs merge=lfs -text
*.zst filter=lfs diff=lfs merge=lfs -text
*tfevents* filter=lfs diff=lfs merge=lfs -text
Vistral-7B-Chat-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text
Vistral-7B-Chat-IQ1_S.gguf filter=lfs diff=lfs merge=lfs -text
Vistral-7B-Chat-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text
Vistral-7B-Chat-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text
Vistral-7B-Chat-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text
Vistral-7B-Chat-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text
Vistral-7B-Chat-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text
Vistral-7B-Chat-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text
Vistral-7B-Chat-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text
Vistral-7B-Chat-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text
Vistral-7B-Chat-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text
Vistral-7B-Chat-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text
Vistral-7B-Chat-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text
Vistral-7B-Chat-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
Vistral-7B-Chat-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
Vistral-7B-Chat-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
Vistral-7B-Chat-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
Vistral-7B-Chat-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text
Vistral-7B-Chat-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text
Vistral-7B-Chat-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
Vistral-7B-Chat-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
Vistral-7B-Chat-Q5_0.gguf filter=lfs diff=lfs merge=lfs -text
Vistral-7B-Chat-Q5_1.gguf filter=lfs diff=lfs merge=lfs -text
Vistral-7B-Chat-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
Vistral-7B-Chat-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
Vistral-7B-Chat-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
Vistral-7B-Chat-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text

60
README.md Normal file
View File

@@ -0,0 +1,60 @@
---
license: other
language:
- en
pipeline_tag: text-generation
inference: false
tags:
- transformers
- gguf
- imatrix
- Vistral-7B-Chat
---
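GGUF quantizations (made with an importance matrix, "imatrix") of https://huggingface.co/Viet-Mistral/Vistral-7B-Chat

Note: the usage example below is copied from the original model's README. It loads the original `Viet-Mistral/Vistral-7B-Chat` weights with `transformers`; it does not load the GGUF files in this repository.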
# From the original README
## Usage
To enable single/multi-turn conversational chat with `Vistral-7B-Chat`, you can use the default chat template format:
```python
import torch
from transformers import AutoModelForCausalLM, AutoTokenizer

# System prompt (in Vietnamese) used as the first message of every conversation.
# The three pieces are concatenated exactly as written; only the first ends with "\n".
system_prompt = "Bạn là một trợ lí Tiếng Việt nhiệt tình và trung thực. Hãy luôn trả lời một cách hữu ích nhất có thể, đồng thời giữ an toàn.\n"
system_prompt += "Câu trả lời của bạn không nên chứa bất kỳ nội dung gây hại, phân biệt chủng tộc, phân biệt giới tính, độc hại, nguy hiểm hoặc bất hợp pháp nào. Hãy đảm bảo rằng các câu trả lời của bạn không có thiên kiến xã hội và mang tính tích cực."
system_prompt += "Nếu một câu hỏi không có ý nghĩa hoặc không hợp lý về mặt thông tin, hãy giải thích tại sao thay vì trả lời một điều gì đó không chính xác. Nếu bạn không biết câu trả lời cho một câu hỏi, hãy trẳ lời là bạn không biết và vui lòng không chia sẻ thông tin sai lệch."

# Load the tokenizer and the model from the original (non-GGUF) repository.
tokenizer = AutoTokenizer.from_pretrained('Viet-Mistral/Vistral-7B-Chat')
model = AutoModelForCausalLM.from_pretrained(
    'Viet-Mistral/Vistral-7B-Chat',
    torch_dtype=torch.bfloat16, # change to torch.float16 if you're using V100
    device_map="auto",
    use_cache=True,
)

# Running chat history; it always starts with the system message.
conversation = [{"role": "system", "content": system_prompt }]
while True:
    human = input("Human: ")
    # Typing "reset" (any letter case) drops the history and starts a new chat.
    if human.lower() == "reset":
        conversation = [{"role": "system", "content": system_prompt }]
        print("The chat history has been cleared!")
        continue

    conversation.append({"role": "user", "content": human })
    # Render the whole history with the tokenizer's chat template and move
    # the resulting token ids to the device the model lives on.
    input_ids = tokenizer.apply_chat_template(conversation, return_tensors="pt").to(model.device)

    out_ids = model.generate(
        input_ids=input_ids,
        max_new_tokens=768,
        do_sample=True,
        top_p=0.95,
        top_k=40,
        temperature=0.1,
        repetition_penalty=1.05,
    )
    # The output starts with the prompt tokens, so slice them off and decode
    # only what was generated after the prompt.
    assistant = tokenizer.batch_decode(out_ids[:, input_ids.size(1): ], skip_special_tokens=True)[0].strip()
    print("Assistant: ", assistant)
    # Store the reply so the next turn sees the full multi-turn history.
    conversation.append({"role": "assistant", "content": assistant })
```

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:436a6746c4612e4f3e73cb834b3b9bd6ee508d242c97d43d9503b0a6618a4afa
size 1781090016

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:b9547c09465e6d0848114097b5cd0a42f6cbb70b67b2aa6a83c8fb09b1d9ae0e
size 1638745824

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:56b824fd83d1e1f663096ab7b810fd7198739bbdcbd839d7958c4ef3fbb2fc0d
size 2530006144

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:66ac127eb065b7b2e6eee2510195ea225298a64f09fc8c925a5c438960e57614
size 2340213888

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:09c7e651bdbaad9057155cf156cbbbb9319a5a28614d7791d05c8ca3d746fa97
size 2224899808

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:5fd3cb112a004bc6608c30b64bcd68540e3f52fb9ebd800af24655a4d189063e
size 2018330336

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:6ca4e03ca6cdd013701e5a38fac72212868037e56b998703f57cd993a14b99cb
size 3317650080

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:32bcc62744d91e8f12f68b6537541e8a35cc2fbe8e3c60b77fe5f5285255080b
size 3215151776

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:79dca1a6be014551b0d82731e35d5985e88e41788224cb6982616c4f057b024e
size 3051573920

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:8e8855990539047e5fe03c8962592a816b65c809e64ed6a8d9be4a70eb780aa9
size 2856637568

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:b602fedb65d849d92c621c342d354c88b65ad93c791b258ea685e6a0c03e500d
size 4161917120

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:fde2fb02d5b8896af3dd60098987e97369fb4e4cd02c6346e308ee3f4a128e0d
size 3943096384

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:dffa0435fd646c0bc1253521bdba3ad14eaf9759e3a4dd0d9c165212f530e3f6
size 2749351168

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:e31c42dcafb01fd4024da4653e6281c583c5c1f6842a81e6fbb95a4f24b0a2b0
size 2559034624

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:336d5aed85616561396f4a0ba5a7808ec3e8e765649bc52b8d7327ed24a00c76
size 3854783136

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:544b04dfa91e258cc13f584b07fd3509560bdc560ed6facdc36592f11ee9b078
size 3551744672

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:40d0ccc42a0fd5e9fb4519291aab3c1e15992d31cdde29a440b03a9409ff4dfe
size 3197325984

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:8232ef8de32a4ef4378fb4b7d52072e6915d78a0fe0fca5938146ede1dc8286a
size 4159819968

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:d7764635ad2024caaeeeef7d0334de7f28db0e8b8317cf4eb4504cddd35e4b7e
size 4591169984

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:9f90eb1d9bf52bbd157e3c8233f06a0e4e9b984e591961d8583792bcb0b55442
size 4404662464

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:98aa797ddeaa6ab2824c48e3ce80ff739caba44ea334b6861f8bc70b70ce81e8
size 4176597184

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:d7a0d703b2550b1b92a034f2d834909f81fd7e15fb9dc6518bf2d212a6a46a7c
size 5051880128

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:507850b6c32c536c69d2fd0e6a67146c499041f3b267e28b768f10dfb70f835a
size 5483230144

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:8a0132536c56065c0f9daad04ab59456a8ffef5d4909d809c5bacba9865d0d0b
size 5170893504

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:e58b42ec6852d9986c9e380e3e8d08d3f29b0304ed1990e6fc1e7e710c79f2de
size 5037200064

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:4baae47e0038874afd24458265b05a4b04331f22585f1ad6707d3bbfd9d8624c
size 5985013984

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:c2ea5e26ca270b6205922509ce52264c7755e6b39ccdcbbf25285cc6f51f0cef
size 7751442592