From 3f6724d967d5b53e832bd4b350f2315f5523e41a Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Thu, 4 Jun 2026 05:44:19 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: RichardErkhov/sail_-_Sailor-7B-Chat-gguf Source: Original Platform --- .gitattributes | 57 +++++++++++ README.md | 188 +++++++++++++++++++++++++++++++++++++ Sailor-7B-Chat.IQ3_M.gguf | 3 + Sailor-7B-Chat.IQ3_S.gguf | 3 + Sailor-7B-Chat.IQ3_XS.gguf | 3 + Sailor-7B-Chat.IQ4_NL.gguf | 3 + Sailor-7B-Chat.IQ4_XS.gguf | 3 + Sailor-7B-Chat.Q2_K.gguf | 3 + Sailor-7B-Chat.Q3_K.gguf | 3 + Sailor-7B-Chat.Q3_K_L.gguf | 3 + Sailor-7B-Chat.Q3_K_M.gguf | 3 + Sailor-7B-Chat.Q3_K_S.gguf | 3 + Sailor-7B-Chat.Q4_0.gguf | 3 + Sailor-7B-Chat.Q4_1.gguf | 3 + Sailor-7B-Chat.Q4_K.gguf | 3 + Sailor-7B-Chat.Q4_K_M.gguf | 3 + Sailor-7B-Chat.Q4_K_S.gguf | 3 + Sailor-7B-Chat.Q5_0.gguf | 3 + Sailor-7B-Chat.Q5_1.gguf | 3 + Sailor-7B-Chat.Q5_K.gguf | 3 + Sailor-7B-Chat.Q5_K_M.gguf | 3 + Sailor-7B-Chat.Q5_K_S.gguf | 3 + Sailor-7B-Chat.Q6_K.gguf | 3 + Sailor-7B-Chat.Q8_0.gguf | 3 + 24 files changed, 311 insertions(+) create mode 100644 .gitattributes create mode 100644 README.md create mode 100644 Sailor-7B-Chat.IQ3_M.gguf create mode 100644 Sailor-7B-Chat.IQ3_S.gguf create mode 100644 Sailor-7B-Chat.IQ3_XS.gguf create mode 100644 Sailor-7B-Chat.IQ4_NL.gguf create mode 100644 Sailor-7B-Chat.IQ4_XS.gguf create mode 100644 Sailor-7B-Chat.Q2_K.gguf create mode 100644 Sailor-7B-Chat.Q3_K.gguf create mode 100644 Sailor-7B-Chat.Q3_K_L.gguf create mode 100644 Sailor-7B-Chat.Q3_K_M.gguf create mode 100644 Sailor-7B-Chat.Q3_K_S.gguf create mode 100644 Sailor-7B-Chat.Q4_0.gguf create mode 100644 Sailor-7B-Chat.Q4_1.gguf create mode 100644 Sailor-7B-Chat.Q4_K.gguf create mode 100644 
Sailor-7B-Chat.Q4_K_M.gguf create mode 100644 Sailor-7B-Chat.Q4_K_S.gguf create mode 100644 Sailor-7B-Chat.Q5_0.gguf create mode 100644 Sailor-7B-Chat.Q5_1.gguf create mode 100644 Sailor-7B-Chat.Q5_K.gguf create mode 100644 Sailor-7B-Chat.Q5_K_M.gguf create mode 100644 Sailor-7B-Chat.Q5_K_S.gguf create mode 100644 Sailor-7B-Chat.Q6_K.gguf create mode 100644 Sailor-7B-Chat.Q8_0.gguf diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..4570bae --- /dev/null +++ b/.gitattributes @@ -0,0 +1,57 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst 
filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +Sailor-7B-Chat.Q2_K.gguf filter=lfs diff=lfs merge=lfs -text +Sailor-7B-Chat.IQ3_XS.gguf filter=lfs diff=lfs merge=lfs -text +Sailor-7B-Chat.IQ3_S.gguf filter=lfs diff=lfs merge=lfs -text +Sailor-7B-Chat.Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Sailor-7B-Chat.IQ3_M.gguf filter=lfs diff=lfs merge=lfs -text +Sailor-7B-Chat.Q3_K.gguf filter=lfs diff=lfs merge=lfs -text +Sailor-7B-Chat.Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Sailor-7B-Chat.Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text +Sailor-7B-Chat.IQ4_XS.gguf filter=lfs diff=lfs merge=lfs -text +Sailor-7B-Chat.Q4_0.gguf filter=lfs diff=lfs merge=lfs -text +Sailor-7B-Chat.IQ4_NL.gguf filter=lfs diff=lfs merge=lfs -text +Sailor-7B-Chat.Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Sailor-7B-Chat.Q4_K.gguf filter=lfs diff=lfs merge=lfs -text +Sailor-7B-Chat.Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Sailor-7B-Chat.Q4_1.gguf filter=lfs diff=lfs merge=lfs -text +Sailor-7B-Chat.Q5_0.gguf filter=lfs diff=lfs merge=lfs -text +Sailor-7B-Chat.Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text +Sailor-7B-Chat.Q5_K.gguf filter=lfs diff=lfs merge=lfs -text +Sailor-7B-Chat.Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text +Sailor-7B-Chat.Q5_1.gguf filter=lfs diff=lfs merge=lfs -text +Sailor-7B-Chat.Q6_K.gguf filter=lfs diff=lfs merge=lfs -text +Sailor-7B-Chat.Q8_0.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..e96b620 --- /dev/null +++ b/README.md @@ -0,0 +1,188 @@ +Quantization made by Richard Erkhov. 
+ +[Github](https://github.com/RichardErkhov) + +[Discord](https://discord.gg/pvy7H8DZMG) + +[Request more models](https://github.com/RichardErkhov/quant_request) + + +Sailor-7B-Chat - GGUF +- Model creator: https://huggingface.co/sail/ +- Original model: https://huggingface.co/sail/Sailor-7B-Chat/ + + +| Name | Quant method | Size | +| ---- | ---- | ---- | +| [Sailor-7B-Chat.Q2_K.gguf](https://huggingface.co/RichardErkhov/sail_-_Sailor-7B-Chat-gguf/blob/main/Sailor-7B-Chat.Q2_K.gguf) | Q2_K | 2.89GB | +| [Sailor-7B-Chat.IQ3_XS.gguf](https://huggingface.co/RichardErkhov/sail_-_Sailor-7B-Chat-gguf/blob/main/Sailor-7B-Chat.IQ3_XS.gguf) | IQ3_XS | 3.18GB | +| [Sailor-7B-Chat.IQ3_S.gguf](https://huggingface.co/RichardErkhov/sail_-_Sailor-7B-Chat-gguf/blob/main/Sailor-7B-Chat.IQ3_S.gguf) | IQ3_S | 3.32GB | +| [Sailor-7B-Chat.Q3_K_S.gguf](https://huggingface.co/RichardErkhov/sail_-_Sailor-7B-Chat-gguf/blob/main/Sailor-7B-Chat.Q3_K_S.gguf) | Q3_K_S | 3.32GB | +| [Sailor-7B-Chat.IQ3_M.gguf](https://huggingface.co/RichardErkhov/sail_-_Sailor-7B-Chat-gguf/blob/main/Sailor-7B-Chat.IQ3_M.gguf) | IQ3_M | 3.48GB | +| [Sailor-7B-Chat.Q3_K.gguf](https://huggingface.co/RichardErkhov/sail_-_Sailor-7B-Chat-gguf/blob/main/Sailor-7B-Chat.Q3_K.gguf) | Q3_K | 3.65GB | +| [Sailor-7B-Chat.Q3_K_M.gguf](https://huggingface.co/RichardErkhov/sail_-_Sailor-7B-Chat-gguf/blob/main/Sailor-7B-Chat.Q3_K_M.gguf) | Q3_K_M | 3.65GB | +| [Sailor-7B-Chat.Q3_K_L.gguf](https://huggingface.co/RichardErkhov/sail_-_Sailor-7B-Chat-gguf/blob/main/Sailor-7B-Chat.Q3_K_L.gguf) | Q3_K_L | 3.93GB | +| [Sailor-7B-Chat.IQ4_XS.gguf](https://huggingface.co/RichardErkhov/sail_-_Sailor-7B-Chat-gguf/blob/main/Sailor-7B-Chat.IQ4_XS.gguf) | IQ4_XS | 4.02GB | +| [Sailor-7B-Chat.Q4_0.gguf](https://huggingface.co/RichardErkhov/sail_-_Sailor-7B-Chat-gguf/blob/main/Sailor-7B-Chat.Q4_0.gguf) | Q4_0 | 4.2GB | +| 
[Sailor-7B-Chat.IQ4_NL.gguf](https://huggingface.co/RichardErkhov/sail_-_Sailor-7B-Chat-gguf/blob/main/Sailor-7B-Chat.IQ4_NL.gguf) | IQ4_NL | 4.22GB | +| [Sailor-7B-Chat.Q4_K_S.gguf](https://huggingface.co/RichardErkhov/sail_-_Sailor-7B-Chat-gguf/blob/main/Sailor-7B-Chat.Q4_K_S.gguf) | Q4_K_S | 4.23GB | +| [Sailor-7B-Chat.Q4_K.gguf](https://huggingface.co/RichardErkhov/sail_-_Sailor-7B-Chat-gguf/blob/main/Sailor-7B-Chat.Q4_K.gguf) | Q4_K | 4.44GB | +| [Sailor-7B-Chat.Q4_K_M.gguf](https://huggingface.co/RichardErkhov/sail_-_Sailor-7B-Chat-gguf/blob/main/Sailor-7B-Chat.Q4_K_M.gguf) | Q4_K_M | 4.44GB | +| [Sailor-7B-Chat.Q4_1.gguf](https://huggingface.co/RichardErkhov/sail_-_Sailor-7B-Chat-gguf/blob/main/Sailor-7B-Chat.Q4_1.gguf) | Q4_1 | 4.62GB | +| [Sailor-7B-Chat.Q5_0.gguf](https://huggingface.co/RichardErkhov/sail_-_Sailor-7B-Chat-gguf/blob/main/Sailor-7B-Chat.Q5_0.gguf) | Q5_0 | 5.03GB | +| [Sailor-7B-Chat.Q5_K_S.gguf](https://huggingface.co/RichardErkhov/sail_-_Sailor-7B-Chat-gguf/blob/main/Sailor-7B-Chat.Q5_K_S.gguf) | Q5_K_S | 5.03GB | +| [Sailor-7B-Chat.Q5_K.gguf](https://huggingface.co/RichardErkhov/sail_-_Sailor-7B-Chat-gguf/blob/main/Sailor-7B-Chat.Q5_K.gguf) | Q5_K | 5.15GB | +| [Sailor-7B-Chat.Q5_K_M.gguf](https://huggingface.co/RichardErkhov/sail_-_Sailor-7B-Chat-gguf/blob/main/Sailor-7B-Chat.Q5_K_M.gguf) | Q5_K_M | 5.15GB | +| [Sailor-7B-Chat.Q5_1.gguf](https://huggingface.co/RichardErkhov/sail_-_Sailor-7B-Chat-gguf/blob/main/Sailor-7B-Chat.Q5_1.gguf) | Q5_1 | 5.44GB | +| [Sailor-7B-Chat.Q6_K.gguf](https://huggingface.co/RichardErkhov/sail_-_Sailor-7B-Chat-gguf/blob/main/Sailor-7B-Chat.Q6_K.gguf) | Q6_K | 5.91GB | +| [Sailor-7B-Chat.Q8_0.gguf](https://huggingface.co/RichardErkhov/sail_-_Sailor-7B-Chat-gguf/blob/main/Sailor-7B-Chat.Q8_0.gguf) | Q8_0 | 7.65GB | + + + + +Original model description: +--- +language: +- en +- zh +- id +- th +- vi +- ms +- lo +datasets: +- CohereForAI/aya_dataset +- CohereForAI/aya_collection +- Open-Orca/OpenOrca +tags: +- 
multilingual +- sea +- sailor +- sft +- chat +- instruction +widget: +- text: "如何制作烤鱼?" + example_title: "Chinese" +- text: "How to bake fish?" + example_title: "English" +- text: "Bagaimana cara memanggang ikan?" + example_title: "Malay" +- text: "วิธีย่างปลา?" + example_title: "Thai" +- text: "Bagaimana membuat bakaran ikan?" + example_title: "Indonesian" +- text: "Làm thế nào để nướng cá?" + example_title: "Vietnamese" +license: apache-2.0 +base_model: sail/Sailor-7B +--- + +
+ +
+ +Sailor is a suite of Open Language Models tailored for South-East Asia (SEA), focusing on languages such as 🇮🇩Indonesian, 🇹🇭Thai, 🇻🇳Vietnamese, 🇲🇾Malay, and 🇱🇦Lao. +Developed with careful data curation, Sailor models are designed to understand and generate text across diverse linguistic landscapes of the SEA region. +Built from [Qwen 1.5](https://huggingface.co/collections/Qwen/qwen15-65c0a2f577b1ecb76d786524), Sailor encompasses models of varying sizes, spanning from 0.5B to 7B versions for different requirements. +We further fine-tune the base model with open-source datasets to get instruction-tuned models, namely Sailor-Chat. +Benchmarking results demonstrate Sailor's proficiency in tasks such as question answering, commonsense reasoning, and other tasks in SEA languages. + +> The logo was generated by MidJourney + +## Model Summary +- **Model Collections:** [Base Model & Chat Model](https://huggingface.co/collections/sail/sailor-65e19a749f978976f1959825) +- **Project Website:** [sailorllm.github.io](https://sailorllm.github.io/) +- **Codebase:** [github.com/sail-sg/sailor-llm](https://github.com/sail-sg/sailor-llm) +- **Technical Report:** [arxiv.org/pdf/2404.03608.pdf](https://arxiv.org/pdf/2404.03608.pdf) + + +## Training details +Sailor is crafted by continually pre-training from language models like the remarkable Qwen 1.5 models, which already have great performance on SEA languages. +The pre-training corpus heavily leverages publicly available corpora, including +[SlimPajama](https://huggingface.co/datasets/cerebras/SlimPajama-627B), +[SkyPile](https://huggingface.co/datasets/Skywork/SkyPile-150B), +[CC100](https://huggingface.co/datasets/cc100) and [MADLAD-400](https://huggingface.co/datasets/allenai/MADLAD-400). 
+The instruction tuning corpora are all publicly available, including +[aya_collection](https://huggingface.co/datasets/CohereForAI/aya_collection), +[aya_dataset](https://huggingface.co/datasets/CohereForAI/aya_dataset), +[OpenOrca](https://huggingface.co/datasets/Open-Orca/OpenOrca). + +By employing aggressive data deduplication and careful data cleaning on the collected corpus, we have attained a high-quality dataset spanning various languages. +Through systematic experiments to determine the weights of different languages, Sailor models undergo training from 200B to 400B tokens, tailored to different model sizes. +The approach boosts their performance on SEA languages while maintaining proficiency in English and Chinese without significant compromise. +Finally, we continually pre-train the Qwen1.5-0.5B model with 400 Billion tokens, and other models with 200 Billion tokens to obtain the Sailor models. + +## Requirements +Sailor is supported by recent releases of Hugging Face `transformers`; we advise you to install `transformers>=4.37.0`. + +## Quickstart + +Here is a code snippet showing how to load the tokenizer and model and how to generate content. + +```python +from transformers import AutoModelForCausalLM, AutoTokenizer +device = "cuda" + +model = AutoModelForCausalLM.from_pretrained( + 'sail/Sailor-7B-Chat', + torch_dtype="auto", + device_map="auto" +) + +tokenizer = AutoTokenizer.from_pretrained('sail/Sailor-7B-Chat') +system_prompt= 'You are a helpful assistant' + +prompt = "Beri saya pengenalan singkat tentang model bahasa besar." +# prompt = "Hãy cho tôi một giới thiệu ngắn gọn về mô hình ngôn ngữ lớn." 
+# prompt = "ให้ฉันแนะนำสั้น ๆ เกี่ยวกับโมเดลภาษาขนาดใหญ่" + +messages = [ + {"role": "system", "content": system_prompt}, + {"role": "question", "content": prompt} +] +text = tokenizer.apply_chat_template( + messages, + tokenize=False, + add_generation_prompt=True +) + +model_inputs = tokenizer([text], return_tensors="pt").to(device) +input_ids = model_inputs.input_ids.to(device) + +generated_ids = model.generate( + input_ids, + max_new_tokens=512, +) + +generated_ids = [ + output_ids[len(input_ids):] for input_ids, output_ids in zip(model_inputs.input_ids, generated_ids) +] +response = tokenizer.batch_decode(generated_ids, skip_special_tokens=True)[0] +print(response) +``` + +# License + +Sailor is distributed under the terms of the Apache License 2.0. +There are no restrictions on research or commercial use, but usage must comply with the [Qwen License](https://huggingface.co/Qwen/Qwen1.5-1.8B/blob/main/LICENSE). + +## Citation + +If you find Sailor useful, please cite our work as follows: + +``` +@misc{dou2024sailor, + title={Sailor: Open Language Models for South-East Asia}, + author={Longxu Dou and Qian Liu and Guangtao Zeng and Jia Guo and Jiahui Zhou and Wei Lu and Min Lin}, + year={2024}, + eprint={2404.03608}, + archivePrefix={arXiv}, + primaryClass={cs.CL} +} +``` + +# Contact Us + +If you have any questions, please raise an issue or contact us at [doulx@sea.com](mailto:doulx@sea.com) or [liuqian@sea.com](mailto:liuqian@sea.com). 
+ diff --git a/Sailor-7B-Chat.IQ3_M.gguf b/Sailor-7B-Chat.IQ3_M.gguf new file mode 100644 index 0000000..56ca50e --- /dev/null +++ b/Sailor-7B-Chat.IQ3_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57ff7817b5f1d13d0c80715a6507868d42063881a2a93b362a8dfba766273b95 +size 3735719488 diff --git a/Sailor-7B-Chat.IQ3_S.gguf b/Sailor-7B-Chat.IQ3_S.gguf new file mode 100644 index 0000000..dd8a0f7 --- /dev/null +++ b/Sailor-7B-Chat.IQ3_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd5b963d2499b918b66e9d52fcd2d92ec6c19413be8f2196d4eecaefc2df695c +size 3569159744 diff --git a/Sailor-7B-Chat.IQ3_XS.gguf b/Sailor-7B-Chat.IQ3_XS.gguf new file mode 100644 index 0000000..d18a562 --- /dev/null +++ b/Sailor-7B-Chat.IQ3_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04bd765ee89db91a18d0c16f4a118b1b04f3d62b2c4bc0c2fc2a81a0278c93fa +size 3417378368 diff --git a/Sailor-7B-Chat.IQ4_NL.gguf b/Sailor-7B-Chat.IQ4_NL.gguf new file mode 100644 index 0000000..4663716 --- /dev/null +++ b/Sailor-7B-Chat.IQ4_NL.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8c62002ad3436f589acd090b95648abdc824e9bbf11bb432739471e7ee431b9 +size 4534451776 diff --git a/Sailor-7B-Chat.IQ4_XS.gguf b/Sailor-7B-Chat.IQ4_XS.gguf new file mode 100644 index 0000000..e9c5259 --- /dev/null +++ b/Sailor-7B-Chat.IQ4_XS.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f9d013a2365df6d0208c84300c7b6ee5bce15ea7c08d319c49214a20e960216 +size 4318264896 diff --git a/Sailor-7B-Chat.Q2_K.gguf b/Sailor-7B-Chat.Q2_K.gguf new file mode 100644 index 0000000..1d8a5cb --- /dev/null +++ b/Sailor-7B-Chat.Q2_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:addaa505830c75341f97eff9ce7eba1149f8483e1cd293aac830eeb1e1bce258 +size 3103825472 diff --git a/Sailor-7B-Chat.Q3_K.gguf b/Sailor-7B-Chat.Q3_K.gguf new file mode 100644 index 0000000..b2c8c82 --- /dev/null 
+++ b/Sailor-7B-Chat.Q3_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb8b46b06f6b1a9bb24b2d76197d2245b7b5547e441f2f24f8e2e6ff3a818597 +size 3918859840 diff --git a/Sailor-7B-Chat.Q3_K_L.gguf b/Sailor-7B-Chat.Q3_K_L.gguf new file mode 100644 index 0000000..5de06bf --- /dev/null +++ b/Sailor-7B-Chat.Q3_K_L.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ed9d869c6a4a05c30bc0aa486bcbbf7e243fd4c31b60f63645dfbbc2aabad33 +size 4217966144 diff --git a/Sailor-7B-Chat.Q3_K_M.gguf b/Sailor-7B-Chat.Q3_K_M.gguf new file mode 100644 index 0000000..b2c8c82 --- /dev/null +++ b/Sailor-7B-Chat.Q3_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb8b46b06f6b1a9bb24b2d76197d2245b7b5547e441f2f24f8e2e6ff3a818597 +size 3918859840 diff --git a/Sailor-7B-Chat.Q3_K_S.gguf b/Sailor-7B-Chat.Q3_K_S.gguf new file mode 100644 index 0000000..89e0f28 --- /dev/null +++ b/Sailor-7B-Chat.Q3_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34d410e2da08c43e62facfca1f7390d84cf0cbc1d7c301e1245c97a14e9fd286 +size 3569159744 diff --git a/Sailor-7B-Chat.Q4_0.gguf b/Sailor-7B-Chat.Q4_0.gguf new file mode 100644 index 0000000..981167f --- /dev/null +++ b/Sailor-7B-Chat.Q4_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3011de7dce255b69041591915346831cd72122b3ee3ef71b3dea21c0961ea13 +size 4511907392 diff --git a/Sailor-7B-Chat.Q4_1.gguf b/Sailor-7B-Chat.Q4_1.gguf new file mode 100644 index 0000000..5dec1a1 --- /dev/null +++ b/Sailor-7B-Chat.Q4_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bafd723dfc81301a122d347e73fe88040ea80ab8dc347a9cd591422f6846564 +size 4955553344 diff --git a/Sailor-7B-Chat.Q4_K.gguf b/Sailor-7B-Chat.Q4_K.gguf new file mode 100644 index 0000000..741bd0c --- /dev/null +++ b/Sailor-7B-Chat.Q4_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:d98ca1d6e2c9e12501d773f9e74d4126274589480772b0fb0d54690ed05825c7 +size 4767104576 diff --git a/Sailor-7B-Chat.Q4_K_M.gguf b/Sailor-7B-Chat.Q4_K_M.gguf new file mode 100644 index 0000000..741bd0c --- /dev/null +++ b/Sailor-7B-Chat.Q4_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d98ca1d6e2c9e12501d773f9e74d4126274589480772b0fb0d54690ed05825c7 +size 4767104576 diff --git a/Sailor-7B-Chat.Q4_K_S.gguf b/Sailor-7B-Chat.Q4_K_S.gguf new file mode 100644 index 0000000..339a25f --- /dev/null +++ b/Sailor-7B-Chat.Q4_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c4ac5ec06ba211cef29c174ab17fa117222e2d92f90c1d5469876709849daf3 +size 4542840384 diff --git a/Sailor-7B-Chat.Q5_0.gguf b/Sailor-7B-Chat.Q5_0.gguf new file mode 100644 index 0000000..202ee67 --- /dev/null +++ b/Sailor-7B-Chat.Q5_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9a5b25960ca61fcb9e7e2bdd91adfe4989f4d178de628bf44c62a7e196b33b8 +size 5399199296 diff --git a/Sailor-7B-Chat.Q5_1.gguf b/Sailor-7B-Chat.Q5_1.gguf new file mode 100644 index 0000000..a6241f8 --- /dev/null +++ b/Sailor-7B-Chat.Q5_1.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8ada141d82222d32e63cb98aca5da8e7202cca40302ce0ff3eda8006b5ff6d0 +size 5842845248 diff --git a/Sailor-7B-Chat.Q5_K.gguf b/Sailor-7B-Chat.Q5_K.gguf new file mode 100644 index 0000000..7482a49 --- /dev/null +++ b/Sailor-7B-Chat.Q5_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc7ac428ec7328eed7ca25c193ad755c8919153afbff3eef2c038093b1346df2 +size 5530664512 diff --git a/Sailor-7B-Chat.Q5_K_M.gguf b/Sailor-7B-Chat.Q5_K_M.gguf new file mode 100644 index 0000000..7482a49 --- /dev/null +++ b/Sailor-7B-Chat.Q5_K_M.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc7ac428ec7328eed7ca25c193ad755c8919153afbff3eef2c038093b1346df2 +size 5530664512 diff --git a/Sailor-7B-Chat.Q5_K_S.gguf 
b/Sailor-7B-Chat.Q5_K_S.gguf new file mode 100644 index 0000000..276c743 --- /dev/null +++ b/Sailor-7B-Chat.Q5_K_S.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d15add0b8ed745f5e79aad16a07b32485b7e210b01a8009ac318206a050e02f8 +size 5399199296 diff --git a/Sailor-7B-Chat.Q6_K.gguf b/Sailor-7B-Chat.Q6_K.gguf new file mode 100644 index 0000000..a4e0c78 --- /dev/null +++ b/Sailor-7B-Chat.Q6_K.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbb5b66e88d67940fd1b6bf576d474efe5db821bfe46d2b05e079fcf8d5950b4 +size 6341946944 diff --git a/Sailor-7B-Chat.Q8_0.gguf b/Sailor-7B-Chat.Q8_0.gguf new file mode 100644 index 0000000..336abdf --- /dev/null +++ b/Sailor-7B-Chat.Q8_0.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85256f7be31bff480247d1c17a9ec6d35eeb7852eb4730705ff0eadb6884250b +size 8211795520