初始化项目,由ModelHub XC社区提供模型

Model: thanhhoangnvbg/empathAI-llama3.1-8b
Source: Original Platform
This commit is contained in:
ModelHub XC
2026-05-31 20:45:21 +08:00
commit 332f1c539e
9 changed files with 545 additions and 0 deletions

24
tokenizer_config.json Normal file
View File

@@ -0,0 +1,24 @@
{
  "bos_token": "<|begin_of_text|>",
  "eos_token": "<|eot_id|>",
  "pad_token": "<|eot_id|>",
  "unk_token": "<|unk|>",
  "padding_side": "right",
  "model_max_length": 8192,
  "model_input_names": [
    "input_ids",
    "attention_mask"
  ],
  "clean_up_tokenization_spaces": true,
  "tokenizer_class": "PreTrainedTokenizerFast",
  "add_bos_token": true,
  "add_eos_token": false,
  "chat_template": "{% if messages and messages[0]['role'] == 'system' %}\n {% set system_message = messages[0]['content'] | trim %}\n {% set messages = messages[1:] %}\n{% else %}\n {% set system_message = 'Bạn là EmpathAI, trợ lý CSKH tiếng Việt giàu sự thấu cảm, chuyên xử lý khiếu nại và hỗ trợ khách hàng.' %}\n{% endif %}\n\n<|start_header_id|>system<|end_header_id|>\n\n{{ system_message }}<|eot_id|>\n\n{% for message in messages %}\n\n {% if message['role'] == 'user' %}\n<|start_header_id|>user<|end_header_id|>\n\n{{ message['content'] | trim }}<|eot_id|>\n\n {% elif message['role'] == 'assistant' %}\n<|start_header_id|>assistant<|end_header_id|>\n\n{{ message['content'] | trim }}<|eot_id|>\n\n {% endif %}\n\n{% endfor %}\n\n{% if add_generation_prompt %}\n<|start_header_id|>assistant<|end_header_id|>\n\n{% endif %}"
}