Upload llama-3.1-Asian-Bllossom-8B-Translator.Q4_0_8_8.gguf with huggingface_hub

This commit is contained in:
ai-modelscope
2024-11-26 15:14:52 +08:00
parent a9e4052cbd
commit 040d94035b
20 changed files with 223 additions and 62 deletions

49
.gitattributes vendored
View File

@@ -1,47 +1,52 @@
*.7z filter=lfs diff=lfs merge=lfs -text
*.arrow filter=lfs diff=lfs merge=lfs -text
*.bin filter=lfs diff=lfs merge=lfs -text
*.bin.* filter=lfs diff=lfs merge=lfs -text
*.bz2 filter=lfs diff=lfs merge=lfs -text
*.ckpt filter=lfs diff=lfs merge=lfs -text
*.ftz filter=lfs diff=lfs merge=lfs -text
*.gz filter=lfs diff=lfs merge=lfs -text
*.h5 filter=lfs diff=lfs merge=lfs -text
*.joblib filter=lfs diff=lfs merge=lfs -text
*.lfs.* filter=lfs diff=lfs merge=lfs -text
*.mlmodel filter=lfs diff=lfs merge=lfs -text
*.model filter=lfs diff=lfs merge=lfs -text
*.msgpack filter=lfs diff=lfs merge=lfs -text
*.npy filter=lfs diff=lfs merge=lfs -text
*.npz filter=lfs diff=lfs merge=lfs -text
*.onnx filter=lfs diff=lfs merge=lfs -text
*.ot filter=lfs diff=lfs merge=lfs -text
*.parquet filter=lfs diff=lfs merge=lfs -text
*.pb filter=lfs diff=lfs merge=lfs -text
*.pickle filter=lfs diff=lfs merge=lfs -text
*.pkl filter=lfs diff=lfs merge=lfs -text
*.pt filter=lfs diff=lfs merge=lfs -text
*.pth filter=lfs diff=lfs merge=lfs -text
*.rar filter=lfs diff=lfs merge=lfs -text
*.safetensors filter=lfs diff=lfs merge=lfs -text
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
*.tar.* filter=lfs diff=lfs merge=lfs -text
*.tar filter=lfs diff=lfs merge=lfs -text
*.tflite filter=lfs diff=lfs merge=lfs -text
*.tgz filter=lfs diff=lfs merge=lfs -text
*.wasm filter=lfs diff=lfs merge=lfs -text
*.xz filter=lfs diff=lfs merge=lfs -text
*.zip filter=lfs diff=lfs merge=lfs -text
*.zstandard filter=lfs diff=lfs merge=lfs -text
*.tfevents* filter=lfs diff=lfs merge=lfs -text
*.db* filter=lfs diff=lfs merge=lfs -text
*.ark* filter=lfs diff=lfs merge=lfs -text
**/*ckpt*data* filter=lfs diff=lfs merge=lfs -text
**/*ckpt*.meta filter=lfs diff=lfs merge=lfs -text
**/*ckpt*.index filter=lfs diff=lfs merge=lfs -text
*.safetensors filter=lfs diff=lfs merge=lfs -text
*.ckpt filter=lfs diff=lfs merge=lfs -text
*.gguf* filter=lfs diff=lfs merge=lfs -text
*.ggml filter=lfs diff=lfs merge=lfs -text
*.llamafile* filter=lfs diff=lfs merge=lfs -text
*.pt2 filter=lfs diff=lfs merge=lfs -text
*.mlmodel filter=lfs diff=lfs merge=lfs -text
*.npy filter=lfs diff=lfs merge=lfs -text
*.npz filter=lfs diff=lfs merge=lfs -text
*.pickle filter=lfs diff=lfs merge=lfs -text
*.pkl filter=lfs diff=lfs merge=lfs -text
*.tar filter=lfs diff=lfs merge=lfs -text
*.wasm filter=lfs diff=lfs merge=lfs -text
*.zst filter=lfs diff=lfs merge=lfs -text
*tfevents* filter=lfs diff=lfs merge=lfs -text
*tfevents* filter=lfs diff=lfs merge=lfs -text
llama-3.1-Asian-Bllossom-8B-Translator.Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
llama-3.1-Asian-Bllossom-8B-Translator.Q4_1.gguf filter=lfs diff=lfs merge=lfs -text
llama-3.1-Asian-Bllossom-8B-Translator.Q4_0.gguf filter=lfs diff=lfs merge=lfs -text
llama-3.1-Asian-Bllossom-8B-Translator.Q8_0.gguf filter=lfs diff=lfs merge=lfs -text
llama-3.1-Asian-Bllossom-8B-Translator.Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
llama-3.1-Asian-Bllossom-8B-Translator.Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
llama-3.1-Asian-Bllossom-8B-Translator.Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
llama-3.1-Asian-Bllossom-8B-Translator.Q5_0.gguf filter=lfs diff=lfs merge=lfs -text
llama-3.1-Asian-Bllossom-8B-Translator.Q5_1.gguf filter=lfs diff=lfs merge=lfs -text
llama-3.1-Asian-Bllossom-8B-Translator.Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
llama-3.1-Asian-Bllossom-8B-Translator.Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
llama-3.1-Asian-Bllossom-8B-Translator.Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
llama-3.1-Asian-Bllossom-8B-Translator.Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
llama-3.1-Asian-Bllossom-8B-Translator.Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
llama-3.1-Asian-Bllossom-8B-Translator.Q4_0_4_4.gguf filter=lfs diff=lfs merge=lfs -text
llama-3.1-Asian-Bllossom-8B-Translator.Q4_0_4_8.gguf filter=lfs diff=lfs merge=lfs -text
llama-3.1-Asian-Bllossom-8B-Translator.Q4_0_8_8.gguf filter=lfs diff=lfs merge=lfs -text

184
README.md
View File

@@ -1,47 +1,151 @@
---
license: Apache License 2.0
#model-type:
##如 gpt、phi、llama、chatglm、baichuan 等
#- gpt
library_name: transformers
license: llama3.1
language:
- ko
- vi
- id
- km
- th
metrics:
- bleu
- rouge
base_model:
- meta-llama/Llama-3.1-8B-Instruct
#domain:
##如 nlp、cv、audio、multi-modal
#- nlp
#language:
##语言代码列表 https://help.aliyun.com/document_detail/215387.html?spm=a2c4g.11186623.0.0.9f8d7467kni6Aa
#- cn
#metrics:
##如 CIDEr、Blue、ROUGE 等
#- CIDEr
#tags:
##各种自定义,包括 pretrained、fine-tuned、instruction-tuned、RL-tuned 等训练方法和其他
#- pretrained
#tools:
##如 vllm、fastchat、llamacpp、AdaSeq 等
#- vllm
---
### 当前模型的贡献者未提供更加详细的模型介绍。模型文件和权重,可浏览“模型文件”页面获取。
#### 您可以通过如下git clone命令或者ModelScope SDK来下载模型
SDK下载
```bash
#安装ModelScope
pip install modelscope
```
```python
#SDK模型下载
from modelscope import snapshot_download
model_dir = snapshot_download('QuantFactory/llama-3.1-Asian-Bllossom-8B-Translator-GGUF')
```
Git下载
```
#Git模型下载
git clone https://www.modelscope.cn/QuantFactory/llama-3.1-Asian-Bllossom-8B-Translator-GGUF.git
[![QuantFactory Banner](https://lh7-rt.googleusercontent.com/docsz/AD_4nXeiuCm7c8lEwEJuRey9kiVZsRn2W-b4pWlu3-X534V3YmVuVc2ZL-NXg2RkzSOOS2JXGHutDuyyNAUtdJI65jGTo8jT9Y99tMi4H4MqL44Uc5QKG77B0d6-JfIkZHFaUA71-RtjyYZWVIhqsNZcx8-OMaA?key=xt3VSDoCbmTY7o-cwwOFwQ)](https://hf.co/QuantFactory)
# QuantFactory/llama-3.1-Asian-Bllossom-8B-Translator-GGUF
This is a quantized version of [MLP-KTLim/llama-3.1-Asian-Bllossom-8B-Translator](https://huggingface.co/MLP-KTLim/llama-3.1-Asian-Bllossom-8B-Translator) created using llama.cpp.
# Original Model Card
# Model Card for llama-3.1-Asian-Bllossom-8B-Translator
This model is a multilingual translation model fine-tuned from the Llama 3.1 8B Instruct base model. It translates in both directions between any two of the following Asian languages:
- Korean
- Vietnamese
- Indonesian
- Cambodian (Khmer)
- Thai
## Acknowledgements
AICA <img src="https://aica-gj.kr/images/logo.png" width="20%" height="20%">
## Model Details
The model is designed for translating short text segments between any pair of the supported languages.
Supported language pairs:
- Korean ↔ Vietnamese
- Korean ↔ Indonesian
- Korean ↔ Cambodian
- Korean ↔ Thai
- Vietnamese ↔ Indonesian
- Vietnamese ↔ Cambodian
- Vietnamese ↔ Thai
- Indonesian ↔ Cambodian
- Indonesian ↔ Thai
- Cambodian ↔ Thai
### Model Description
This model is specifically optimized for Southeast Asian language translation needs, focusing on enabling communication between these specific language communities.
The extensive training data of 20M examples (1M for each of the 20 translation directions, i.e. both directions of the 10 language pairs above) provides a robust foundation for handling common expressions and basic conversations across these languages.
### Model Architecture
Base Model: meta-llama/Llama-3.1-8B-Instruct
## Bias, Risks, and Limitations
- Performance is limited to short sentences and phrases
- May not handle complex or lengthy text effectively
- Translation quality may vary depending on language pair and content complexity
## Evaluation results
| Source Language | Target Language | BLEU Score | ROUGE-1 | ROUGE-L |
|----------------|-----------------|------------|---------|---------|
| Korean | Vietnamese | 56.70 | 81.64 | 76.66 |
| Korean | Cambodian | 71.69 | 89.26 | 88.20 |
| Korean | Indonesian | 58.32 | 80.39 | 76.63 |
| Korean | Thai | 63.26 | 78.88 | 72.29 |
| Vietnamese | Korean | 49.01 | 75.57 | 72.74 |
| Vietnamese | Cambodian | 78.26 | 90.74 | 90.32 |
| Vietnamese | Indonesian | 65.96 | 83.08 | 81.46 |
| Vietnamese | Thai | 65.93 | 81.09 | 76.57 |
| Cambodian | Korean | 49.10 | 72.67 | 69.75 |
| Cambodian | Vietnamese | 63.42 | 81.56 | 79.09 |
| Cambodian | Indonesian | 61.41 | 79.67 | 77.75 |
| Cambodian | Thai | 70.91 | 81.85 | 77.66 |
| Indonesian | Korean | 53.61 | 77.14 | 74.29 |
| Indonesian | Vietnamese | 68.21 | 85.41 | 83.10 |
| Indonesian | Cambodian | 78.84 | 90.81 | 90.35 |
| Indonesian | Thai | 67.12 | 81.54 | 77.19 |
| Thai | Korean | 45.59 | 72.48 | 69.46 |
| Thai | Vietnamese | 61.55 | 81.01 | 78.24 |
| Thai | Cambodian | 78.52 | 91.47 | 91.16 |
| Thai | Indonesian | 58.99 | 78.56 | 76.40 |
## Example
```py
# Example: translate one sentence with the original (non-GGUF) checkpoint
# through the Hugging Face transformers API.
from transformers import AutoModelForCausalLM, AutoTokenizer

# Hub ID of the original model this repository was quantized from.
MODEL_ID = "MLP-KTLim/llama-3.1-Asian-Bllossom-8B-Translator"

# Language names accepted by get_input_ids; they are interpolated verbatim
# into the system prompt.
SUPPORTED_LANGUAGES = ["Korean", "Vietnamese", "Indonesian", "Thai", "Cambodian"]

model = AutoModelForCausalLM.from_pretrained(
    MODEL_ID,
    torch_dtype="auto",
    device_map="auto",
)
tokenizer = AutoTokenizer.from_pretrained(
    MODEL_ID,
)

input_text = "안녕하세요? 아시아 언어 번역 모델 입니다."


def get_input_ids(source_lang, target_lang, message):
    """Build the tokenized chat prompt for one translation request.

    Args:
        source_lang: Language of ``message``; must be in SUPPORTED_LANGUAGES.
        target_lang: Language to translate into; must be in SUPPORTED_LANGUAGES.
        message: The text to translate.

    Returns:
        The prompt token ids as returned by ``tokenizer.apply_chat_template``
        with ``return_tensors="pt"``.

    Raises:
        AssertionError: If either language name is not supported.
    """
    assert source_lang in SUPPORTED_LANGUAGES
    assert target_lang in SUPPORTED_LANGUAGES

    input_ids = tokenizer.apply_chat_template(
        conversation=[
            {"role": "system", "content": f"You are a useful translation AI. Please translate the sentence given in {source_lang} into {target_lang}."},
            {"role": "user", "content": message},
        ],
        tokenize=True,
        return_tensors="pt",
        add_generation_prompt=True,
    )
    return input_ids


input_ids = get_input_ids(
    source_lang="Korean",
    target_lang="Vietnamese",
    message=input_text,
)

output = model.generate(
    input_ids.to(model.device),
    max_new_tokens=128,
)

# Skip the first len(input_ids[0]) positions (the prompt) so that only the
# newly generated tokens are decoded and printed.
print(tokenizer.decode(output[0][len(input_ids[0]):], skip_special_tokens=True))
```
<p style="color: lightgrey;">如果您是本模型的贡献者,我们邀请您根据<a href="https://modelscope.cn/docs/ModelScope%E6%A8%A1%E5%9E%8B%E6%8E%A5%E5%85%A5%E6%B5%81%E7%A8%8B%E6%A6%82%E8%A7%88" style="color: lightgrey; text-decoration: underline;">模型贡献文档</a>,及时完善模型卡片内容。</p>
## Contributors
- 원인호 (wih1226@seoultech.ac.kr)
- 김민준 (mjkmain@seoultech.ac.kr)

1
configuration.json Normal file
View File

@@ -0,0 +1 @@
{"framework": "pytorch", "task": "others", "allow_remote": true}

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:8ce6cc376fe14246c75dfc2950f3e2ef7dab02d223120227b8d8c6b261f6435a
size 3179136352

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:a2d63db545c414e0abc5de575204f0167d6724d78a2342350fe809f98feeaa55
size 4321961312

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:45e235d6b8bf298862a031bc1ba238b3436e5ba5de0fe26a91810d54368ea2e5
size 4018922848

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:ebe9c4f006becd324c1559435ebb1fe7c5566d01410f38313c09c7fdc16c350d
size 3664504160

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:889b19180b29ca4bb0567426a44d4a0d717e1e09e4593463d03a1b8a24c5570f
size 4661216608

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:73be4caaaee2a624fa0155f926513408c59e1d9955d1e98e7285531372e1f011
size 4661216608

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:c8cd82427285627c7ede558a36f2c6f90fb4707116091e2df096d823849e449f
size 4661216608

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:f4544c4505bda00cd930184fcf2bf56fb0d9b343ddac941cd68b0504b0a57d7e
size 4661216608

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:5210ebd599dd5968e858b49ccfa2538d6685c5de07d6e32b27cd5157e426ee94
size 5130257760

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:e996e6c9da143aa13770925f840b5f150b85bd057fd5c563a7e10ee621c0fe01
size 4920739168

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:8c111ab784eb742c1eb27158637ab92441c27ab7ebf4ed1d9948d38a08ef6635
size 4692673888

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:5700fa0c48db5e996759ad38c0d0a5ac10d0059e252933f252ad1585d002d565
size 5599298912

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:71de48c86a8233b90e705cef65de2d4affa3d9e8c44ada2111169d36687aee81
size 6068340064

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:5710fea256f67ce48cb2213b3444224c9521dd33d456b1341a8b53a286ee8828
size 5732992352

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:5de5422d74760becd20d924ca4f42ecc8699ae0946c45484ff0930cd41215a71
size 5599298912

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:2ac05cc8867ae60b8206a2c942d09172d8079bbf658799cd57de6c67c02c80fa
size 6596011360

View File

@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:619ae723e4e3c56c25f04202982e612cf0846e0c2b59295bb91e258241b7fa37
size 8540775776