commit d39a7a42bfd33948b01722a25905bdca93fa3ff8 Author: ModelHub XC Date: Wed Jun 17 16:08:15 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: duyntnet/Vistral-7B-Chat-imatrix-GGUF Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..f561261 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,62 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +Vistral-7B-Chat-IQ1_M.gguf filter=lfs diff=lfs merge=lfs -text +Vistral-7B-Chat-IQ1_S.gguf filter=lfs 
diff=lfs merge=lfs -text +Vistral-7B-Chat-IQ2_M.gguf filter=lfs diff=lfs merge=lfs -text +Vistral-7B-Chat-IQ2_S.gguf filter=lfs diff=lfs merge=lfs -text +Vistral-7B-Chat-IQ2_XS.gguf filter=lfs diff=lfs merge=lfs -text +Vistral-7B-Chat-IQ2_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Vistral-7B-Chat-IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +Vistral-7B-Chat-IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text +Vistral-7B-Chat-IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +Vistral-7B-Chat-IQ3_XXS.gguf filter=lfs diff=lfs merge=lfs -text +Vistral-7B-Chat-IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +Vistral-7B-Chat-IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +Vistral-7B-Chat-Q2_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Vistral-7B-Chat-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +Vistral-7B-Chat-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Vistral-7B-Chat-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Vistral-7B-Chat-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Vistral-7B-Chat-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +Vistral-7B-Chat-Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +Vistral-7B-Chat-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Vistral-7B-Chat-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Vistral-7B-Chat-Q5_0.gguf filter=lfs diff=lfs merge=lfs -text +Vistral-7B-Chat-Q5_1.gguf filter=lfs diff=lfs merge=lfs -text +Vistral-7B-Chat-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Vistral-7B-Chat-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Vistral-7B-Chat-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +Vistral-7B-Chat-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..2948f6b --- /dev/null +++ b/README.md @@ -0,0 +1,60 @@ +--- +license: other +language: +- en +pipeline_tag: text-generation +inference: false +tags: +- transformers +- gguf +- imatrix +- Vistral-7B-Chat +--- +Quantizations of https://huggingface.co/Viet-Mistral/Vistral-7B-Chat + +# From 
original readme + + ## Usage + +To enable single/multi-turn conversational chat with `Vistral-7B-Chat`, you can use the default chat template format: + +```python +import torch +from transformers import AutoModelForCausalLM, AutoTokenizer + +system_prompt = "Bạn là một trợ lí Tiếng Việt nhiệt tình và trung thực. Hãy luôn trả lời một cách hữu ích nhất có thể, đồng thời giữ an toàn.\n" +system_prompt += "Câu trả lời của bạn không nên chứa bất kỳ nội dung gây hại, phân biệt chủng tộc, phân biệt giới tính, độc hại, nguy hiểm hoặc bất hợp pháp nào. Hãy đảm bảo rằng các câu trả lời của bạn không có thiên kiến xã hội và mang tính tích cực." +system_prompt += "Nếu một câu hỏi không có ý nghĩa hoặc không hợp lý về mặt thông tin, hãy giải thích tại sao thay vì trả lời một điều gì đó không chính xác. Nếu bạn không biết câu trả lời cho một câu hỏi, hãy trẳ lời là bạn không biết và vui lòng không chia sẻ thông tin sai lệch." # NOTE(review): this fragment is appended with no space/newline after the previous one, and "trẳ lời" looks like a typo for "trả lời"; left untouched because the exact prompt text may matter to the model - confirm against upstream + +tokenizer = AutoTokenizer.from_pretrained('Viet-Mistral/Vistral-7B-Chat') +model = AutoModelForCausalLM.from_pretrained( + 'Viet-Mistral/Vistral-7B-Chat', + torch_dtype=torch.bfloat16, # change to torch.float16 if you're using V100 + device_map="auto", + use_cache=True, +) + +conversation = [{"role": "system", "content": system_prompt }] # history starts with only the system message +while True: # interactive multi-turn loop; there is no exit command, so it runs until the process is interrupted + human = input("Human: ") + if human.lower() == "reset": # case-insensitive "reset" discards all turns and restores the system-only history + conversation = [{"role": "system", "content": system_prompt }] + print("The chat history has been cleared!") + continue + + conversation.append({"role": "user", "content": human }) + input_ids = tokenizer.apply_chat_template(conversation, return_tensors="pt").to(model.device) # the whole history is re-rendered every turn and moved to the model's device + + out_ids = model.generate( + input_ids=input_ids, + max_new_tokens=768, + do_sample=True, + top_p=0.95, + top_k=40, + temperature=0.1, + repetition_penalty=1.05, + ) + assistant = tokenizer.batch_decode(out_ids[:, input_ids.size(1): ], skip_special_tokens=True)[0].strip() # skip the first input_ids.size(1) positions (the prompt) so only the new reply is decoded + print("Assistant: ", assistant) + conversation.append({"role": "assistant", "content": assistant }) # keep the reply in the history so the next turn sees it 
+``` \ No newline at end of file diff --git a/Vistral-7B-Chat-IQ1_M.gguf b/Vistral-7B-Chat-IQ1_M.gguf new file mode 100644 index 0000000..d20a4a7 --- /dev/null +++ b/Vistral-7B-Chat-IQ1_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:436a6746c4612e4f3e73cb834b3b9bd6ee508d242c97d43d9503b0a6618a4afa +size 1781090016 diff --git a/Vistral-7B-Chat-IQ1_S.gguf b/Vistral-7B-Chat-IQ1_S.gguf new file mode 100644 index 0000000..02d8f0b --- /dev/null +++ b/Vistral-7B-Chat-IQ1_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9547c09465e6d0848114097b5cd0a42f6cbb70b67b2aa6a83c8fb09b1d9ae0e +size 1638745824 diff --git a/Vistral-7B-Chat-IQ2_M.gguf b/Vistral-7B-Chat-IQ2_M.gguf new file mode 100644 index 0000000..6b197ed --- /dev/null +++ b/Vistral-7B-Chat-IQ2_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56b824fd83d1e1f663096ab7b810fd7198739bbdcbd839d7958c4ef3fbb2fc0d +size 2530006144 diff --git a/Vistral-7B-Chat-IQ2_S.gguf b/Vistral-7B-Chat-IQ2_S.gguf new file mode 100644 index 0000000..6a13631 --- /dev/null +++ b/Vistral-7B-Chat-IQ2_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66ac127eb065b7b2e6eee2510195ea225298a64f09fc8c925a5c438960e57614 +size 2340213888 diff --git a/Vistral-7B-Chat-IQ2_XS.gguf b/Vistral-7B-Chat-IQ2_XS.gguf new file mode 100644 index 0000000..611f22a --- /dev/null +++ b/Vistral-7B-Chat-IQ2_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09c7e651bdbaad9057155cf156cbbbb9319a5a28614d7791d05c8ca3d746fa97 +size 2224899808 diff --git a/Vistral-7B-Chat-IQ2_XXS.gguf b/Vistral-7B-Chat-IQ2_XXS.gguf new file mode 100644 index 0000000..c7a839e --- /dev/null +++ b/Vistral-7B-Chat-IQ2_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fd3cb112a004bc6608c30b64bcd68540e3f52fb9ebd800af24655a4d189063e +size 2018330336 diff --git a/Vistral-7B-Chat-IQ3_M.gguf b/Vistral-7B-Chat-IQ3_M.gguf new 
file mode 100644 index 0000000..e0137f8 --- /dev/null +++ b/Vistral-7B-Chat-IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ca4e03ca6cdd013701e5a38fac72212868037e56b998703f57cd993a14b99cb +size 3317650080 diff --git a/Vistral-7B-Chat-IQ3_S.gguf b/Vistral-7B-Chat-IQ3_S.gguf new file mode 100644 index 0000000..f15d727 --- /dev/null +++ b/Vistral-7B-Chat-IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32bcc62744d91e8f12f68b6537541e8a35cc2fbe8e3c60b77fe5f5285255080b +size 3215151776 diff --git a/Vistral-7B-Chat-IQ3_XS.gguf b/Vistral-7B-Chat-IQ3_XS.gguf new file mode 100644 index 0000000..0fad05d --- /dev/null +++ b/Vistral-7B-Chat-IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79dca1a6be014551b0d82731e35d5985e88e41788224cb6982616c4f057b024e +size 3051573920 diff --git a/Vistral-7B-Chat-IQ3_XXS.gguf b/Vistral-7B-Chat-IQ3_XXS.gguf new file mode 100644 index 0000000..0c7aec0 --- /dev/null +++ b/Vistral-7B-Chat-IQ3_XXS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e8855990539047e5fe03c8962592a816b65c809e64ed6a8d9be4a70eb780aa9 +size 2856637568 diff --git a/Vistral-7B-Chat-IQ4_NL.gguf b/Vistral-7B-Chat-IQ4_NL.gguf new file mode 100644 index 0000000..74e997d --- /dev/null +++ b/Vistral-7B-Chat-IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b602fedb65d849d92c621c342d354c88b65ad93c791b258ea685e6a0c03e500d +size 4161917120 diff --git a/Vistral-7B-Chat-IQ4_XS.gguf b/Vistral-7B-Chat-IQ4_XS.gguf new file mode 100644 index 0000000..11033e8 --- /dev/null +++ b/Vistral-7B-Chat-IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fde2fb02d5b8896af3dd60098987e97369fb4e4cd02c6346e308ee3f4a128e0d +size 3943096384 diff --git a/Vistral-7B-Chat-Q2_K.gguf b/Vistral-7B-Chat-Q2_K.gguf new file mode 100644 index 0000000..3c401cf --- /dev/null +++ b/Vistral-7B-Chat-Q2_K.gguf @@ -0,0 +1,3 @@ 
+version https://git-lfs.github.com/spec/v1 +oid sha256:dffa0435fd646c0bc1253521bdba3ad14eaf9759e3a4dd0d9c165212f530e3f6 +size 2749351168 diff --git a/Vistral-7B-Chat-Q2_K_S.gguf b/Vistral-7B-Chat-Q2_K_S.gguf new file mode 100644 index 0000000..59173ac --- /dev/null +++ b/Vistral-7B-Chat-Q2_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e31c42dcafb01fd4024da4653e6281c583c5c1f6842a81e6fbb95a4f24b0a2b0 +size 2559034624 diff --git a/Vistral-7B-Chat-Q3_K_L.gguf b/Vistral-7B-Chat-Q3_K_L.gguf new file mode 100644 index 0000000..468bb85 --- /dev/null +++ b/Vistral-7B-Chat-Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:336d5aed85616561396f4a0ba5a7808ec3e8e765649bc52b8d7327ed24a00c76 +size 3854783136 diff --git a/Vistral-7B-Chat-Q3_K_M.gguf b/Vistral-7B-Chat-Q3_K_M.gguf new file mode 100644 index 0000000..a16f3f0 --- /dev/null +++ b/Vistral-7B-Chat-Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:544b04dfa91e258cc13f584b07fd3509560bdc560ed6facdc36592f11ee9b078 +size 3551744672 diff --git a/Vistral-7B-Chat-Q3_K_S.gguf b/Vistral-7B-Chat-Q3_K_S.gguf new file mode 100644 index 0000000..1c2eec7 --- /dev/null +++ b/Vistral-7B-Chat-Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40d0ccc42a0fd5e9fb4519291aab3c1e15992d31cdde29a440b03a9409ff4dfe +size 3197325984 diff --git a/Vistral-7B-Chat-Q4_0.gguf b/Vistral-7B-Chat-Q4_0.gguf new file mode 100644 index 0000000..0241ad0 --- /dev/null +++ b/Vistral-7B-Chat-Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8232ef8de32a4ef4378fb4b7d52072e6915d78a0fe0fca5938146ede1dc8286a +size 4159819968 diff --git a/Vistral-7B-Chat-Q4_1.gguf b/Vistral-7B-Chat-Q4_1.gguf new file mode 100644 index 0000000..e6b97ac --- /dev/null +++ b/Vistral-7B-Chat-Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:d7764635ad2024caaeeeef7d0334de7f28db0e8b8317cf4eb4504cddd35e4b7e +size 4591169984 diff --git a/Vistral-7B-Chat-Q4_K_M.gguf b/Vistral-7B-Chat-Q4_K_M.gguf new file mode 100644 index 0000000..e15236a --- /dev/null +++ b/Vistral-7B-Chat-Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f90eb1d9bf52bbd157e3c8233f06a0e4e9b984e591961d8583792bcb0b55442 +size 4404662464 diff --git a/Vistral-7B-Chat-Q4_K_S.gguf b/Vistral-7B-Chat-Q4_K_S.gguf new file mode 100644 index 0000000..cb9c963 --- /dev/null +++ b/Vistral-7B-Chat-Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98aa797ddeaa6ab2824c48e3ce80ff739caba44ea334b6861f8bc70b70ce81e8 +size 4176597184 diff --git a/Vistral-7B-Chat-Q5_0.gguf b/Vistral-7B-Chat-Q5_0.gguf new file mode 100644 index 0000000..dc9b8e2 --- /dev/null +++ b/Vistral-7B-Chat-Q5_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7a0d703b2550b1b92a034f2d834909f81fd7e15fb9dc6518bf2d212a6a46a7c +size 5051880128 diff --git a/Vistral-7B-Chat-Q5_1.gguf b/Vistral-7B-Chat-Q5_1.gguf new file mode 100644 index 0000000..7b41c9a --- /dev/null +++ b/Vistral-7B-Chat-Q5_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:507850b6c32c536c69d2fd0e6a67146c499041f3b267e28b768f10dfb70f835a +size 5483230144 diff --git a/Vistral-7B-Chat-Q5_K_M.gguf b/Vistral-7B-Chat-Q5_K_M.gguf new file mode 100644 index 0000000..c9e744d --- /dev/null +++ b/Vistral-7B-Chat-Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a0132536c56065c0f9daad04ab59456a8ffef5d4909d809c5bacba9865d0d0b +size 5170893504 diff --git a/Vistral-7B-Chat-Q5_K_S.gguf b/Vistral-7B-Chat-Q5_K_S.gguf new file mode 100644 index 0000000..e5d1d50 --- /dev/null +++ b/Vistral-7B-Chat-Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e58b42ec6852d9986c9e380e3e8d08d3f29b0304ed1990e6fc1e7e710c79f2de +size 5037200064 diff --git 
a/Vistral-7B-Chat-Q6_K.gguf b/Vistral-7B-Chat-Q6_K.gguf new file mode 100644 index 0000000..62c3f35 --- /dev/null +++ b/Vistral-7B-Chat-Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4baae47e0038874afd24458265b05a4b04331f22585f1ad6707d3bbfd9d8624c +size 5985013984 diff --git a/Vistral-7B-Chat-Q8_0.gguf b/Vistral-7B-Chat-Q8_0.gguf new file mode 100644 index 0000000..88873fa --- /dev/null +++ b/Vistral-7B-Chat-Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2ea5e26ca270b6205922509ce52264c7755e6b39ccdcbbf25285cc6f51f0cef +size 7751442592