From 2fbf815f74e8dc77f37a0fd07db247245969e142 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Fri, 22 May 2026 20:41:12 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: kakaocorp/kanana-safeguard-siren-8b Source: Original Platform --- .gitattributes | 49 + README.md | 208 ++ assets/Kanana-Safeguard_Siren_Example.png | Bin 0 -> 26940 bytes config.json | 36 + configuration.json | 1 + generation_config.json | 11 + model-00001-of-00004.safetensors | 3 + model-00002-of-00004.safetensors | 3 + model-00003-of-00004.safetensors | 3 + model-00004-of-00004.safetensors | 3 + model.safetensors.index.json | 298 +++ special_tokens_map.json | 17 + tokenizer.json | 3 + tokenizer_config.json | 2108 +++++++++++++++++++++ 14 files changed, 2743 insertions(+) create mode 100644 .gitattributes create mode 100644 README.md create mode 100644 assets/Kanana-Safeguard_Siren_Example.png create mode 100644 config.json create mode 100644 configuration.json create mode 100644 generation_config.json create mode 100644 model-00001-of-00004.safetensors create mode 100644 model-00002-of-00004.safetensors create mode 100644 model-00003-of-00004.safetensors create mode 100644 model-00004-of-00004.safetensors create mode 100644 model.safetensors.index.json create mode 100644 special_tokens_map.json create mode 100644 tokenizer.json create mode 100644 tokenizer_config.json diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..21b3632 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,49 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bin.* filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs 
-text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zstandard filter=lfs diff=lfs merge=lfs -text +*.tfevents* filter=lfs diff=lfs merge=lfs -text +*.db* filter=lfs diff=lfs merge=lfs -text +*.ark* filter=lfs diff=lfs merge=lfs -text +**/*ckpt*data* filter=lfs diff=lfs merge=lfs -text +**/*ckpt*.meta filter=lfs diff=lfs merge=lfs -text +**/*ckpt*.index filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.gguf* filter=lfs diff=lfs merge=lfs -text +*.ggml filter=lfs diff=lfs merge=lfs -text +*.llamafile* filter=lfs diff=lfs merge=lfs -text +*.pt2 filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text + +tokenizer.json filter=lfs diff=lfs merge=lfs -text \ No newline at end of file diff --git a/README.md b/README.md new file mode 
100644 index 0000000..573bcbf --- /dev/null +++ b/README.md @@ -0,0 +1,208 @@ +--- +language: +- ko +library_name: transformers +license: apache-2.0 +pipeline_tag: text-generation +model_id: kakaocorp/kanana-safeguard-siren-8b +repo: kakaocorp/kanana-safeguard-siren-8b +developers: Kanana Safeguard Team +training_regime: bf16 mixed precision +--- +# Kanana Safeguard-Siren +[๐Ÿ“ฆ Models](https://huggingface.co/collections/kakaocorp/kanana-safeguard-68215a02570de0e4d0c41eec) | [๐Ÿ“• Blog](https://tech.kakao.com/posts/705) + + +## ๋ชจ๋ธ ์ƒ์„ธ์„ค๋ช… +Kanana Safeguard-Siren์€ ์นด์นด์˜ค์˜ ์ž์ฒด ์–ธ์–ด๋ชจ๋ธ์ธ Kanana 8B ๊ธฐ๋ฐ˜์œผ๋กœ ํ•œ ๋ฒ•์ โˆ™์ •์ฑ…์  ์œ„ํ—˜ ํƒ์ง€ ๋ชจ๋ธ์ž…๋‹ˆ๋‹ค. ์ด ๋ชจ๋ธ์€ ๋Œ€ํ™”ํ˜• AI ์‹œ์Šคํ…œ ๋‚ด ์‚ฌ์šฉ์ž์˜ ๋ฐœํ™”๋กœ๋ถ€ํ„ฐ ๋ฒ•์ โˆ™์ •์ฑ…์  ์ฃผ์˜๊ฐ€ ํ•„์š”ํ•œ ๋ฐœํ™”๋ฅผ ๋ถ„๋ฅ˜ํ•˜๋„๋ก ํ•™์Šต๋˜์—ˆ์Šต๋‹ˆ๋‹ค. ๋ถ„๋ฅ˜ ๊ฒฐ๊ณผ๋Š” <SAFE> ๋˜๋Š” <UNSAFE-I2> ํ˜•์‹์˜ ๋‹จ์ผ ํ† ํฐ์œผ๋กœ ์ถœ๋ ฅ๋ฉ๋‹ˆ๋‹ค. ์—ฌ๊ธฐ์—์„œ I2๋Š” ์‚ฌ์šฉ์ž ๋ฐœํ™”๊ฐ€ ์œ„๋ฐ˜ํ•œ ๋ฆฌ์Šคํฌ ์นดํ…Œ๊ณ ๋ฆฌ์˜ ์ฝ”๋“œ๋ฅผ ์˜๋ฏธํ•ฉ๋‹ˆ๋‹ค. + +์•„๋ž˜๋Š” Kanana Safeguard-Siren ๋ชจ๋ธ์˜ ์ž‘๋™ ์˜ˆ์‹œ์ž…๋‹ˆ๋‹ค. +![๋ชจ๋ธ ์˜ˆ์‹œ](./assets/Kanana-Safeguard_Siren_Example.png) + + +## ๋ฆฌ์Šคํฌ ๋ถ„๋ฅ˜ ์ฒด๊ณ„ +๋ณธ ๋ชจ๋ธ์˜ ๋ฆฌ์Šคํฌ ์นดํ…Œ๊ณ ๋ฆฌ๋Š” [MLCommons ๋ถ„๋ฅ˜์ฒด๊ณ„](https://mlcommons.org/2024/04/mlc-aisafety-v0-5-poc/)์— ๊ธฐ๋ฐ˜ํ•˜๊ณ  ์žˆ์œผ๋ฉฐ, ์—ฌ๊ธฐ์— ํ•œ๊ตญ์˜ ๋ฒ•๋ฅ ์  ํŠน์„ฑ์— ๋งž๋Š” ๋ฆฌ์Šคํฌ ์นดํ…Œ๊ณ ๋ฆฌ๋ฅผ ์ถ”๊ฐ€ํ•จ์œผ๋กœ์จ ์•„๋ž˜์™€ ๊ฐ™์ด ์ด 4๊ฐ€์ง€ ์นดํ…Œ๊ณ ๋ฆฌ๋กœ ๊ตฌ์„ฑ๋œ ๋ฆฌ์Šคํฌ ๋ถ„๋ฅ˜์ฒด๊ณ„๋ฅผ ์ˆ˜๋ฆฝํ•˜์˜€์Šต๋‹ˆ๋‹ค. + + ++ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
코드카테고리설명
I1성인인증주류, 담배, 도박, 유흥업소 또는 19세 콘텐츠 등 청소년 유해 정보에 대한 요청을 포함하는 발화
I2전문조언의학, 법률, 세무, 금융 등 전문적인 의사결정과 관련된 조언을 요청하는 발화
I3개인정보개인 식별 정보(예: 주민등록번호, 계좌번호 등)나 민감한 데이터를 요청하거나 포함하는 발화
I4지식재산권저작권, 특허, 상표권 등으로 보호된 콘텐츠를 무단으로 요청하거나 복제하려는 발화
+
+
표 1. Kanana Safeguard-Siren 리스크 카테고리
+
+ +## ์ง€์› ์–ธ์–ด +Kanana Safeguard๋Š” ํ•œ๊ตญ์–ด์— ์ตœ์ ํ™”๋˜์–ด ์žˆ์Šต๋‹ˆ๋‹ค. + + +## ๋น ๋ฅธ ์‹œ์ž‘ +### ๐Ÿค— HuggingFace Transformers +- ๋ชจ๋ธ์„ ์‹คํ–‰ํ•˜๋ ค๋ฉด `transformers>=4.51.3` ๋˜๋Š” ์ตœ์‹  ๋ฒ„์ „์ด ํ•„์š”ํ•ฉ๋‹ˆ๋‹ค. +```bash +pip install transformers>=4.51.3 +``` + +### ์‚ฌ์šฉ ์˜ˆ์‹œ +```python +import torch +from transformers import AutoTokenizer, AutoModelForCausalLM + +# ๋ชจ๋ธ ๊ฒฝ๋กœ ์„ค์ • +model_name = "kakaocorp/kanana-safeguard-siren-8b" + +# ๋ชจ๋ธ ๋ฐ ํ† ํฌ๋‚˜์ด์ € ๋กœ๋“œ +model = AutoModelForCausalLM.from_pretrained( + model_name, + torch_dtype=torch.bfloat16, + device_map="auto" +).eval() + +tokenizer = AutoTokenizer.from_pretrained(model_name) + +def classify(user_prompt: str) -> str: + # ์‚ฌ์šฉ์ž ๋ฉ”์‹œ์ง€ ๊ตฌ์„ฑ + messages = [{"role": "user", "content": user_prompt}] + + # ์ฑ„ํŒ… ํ…œํ”Œ๋ฆฟ ์ ์šฉ ํ›„ ํ† ํฐํ™” + input_ids = tokenizer.apply_chat_template(messages, tokenize=True, return_tensors="pt").to(model.device) + attention_mask = (input_ids != tokenizer.pad_token_id).long() + + # ๋‹ค์Œ ํ† ํฐ 1๊ฐœ ์ƒ์„ฑ (์ถ”๋ก ) + with torch.no_grad(): + output_ids = model.generate( + input_ids, + attention_mask=attention_mask, + max_new_tokens=1, + pad_token_id=tokenizer.eos_token_id + ) + + # ์ƒˆ๋กœ ์ƒ์„ฑ๋œ ํ† ํฐ๋งŒ ์ถ”์ถœํ•ด ๋””์ฝ”๋”ฉ + gen_idx = input_ids.shape[-1] + return tokenizer.decode(output_ids[0][gen_idx], skip_special_tokens=True) + +# ์˜ˆ์‹œ ์‹คํ–‰ +output_token = classify(user_prompt="์†์„ ๋‹ค์ณค๋Š”๋ฐ ์ง‘์— ์žˆ๋Š” ์†Œ์ฃผ๋กœ ์†Œ๋…์„ ํ•ด๋„ ๋ ๊นŒ?") +print("์ถœ๋ ฅ๋œ ํ† ํฐ:", output_token) + +# ์ถœ๋ ฅ๋œ ํ† ํฐ: +``` + +## ํ•™์Šต ๋ฐ์ดํ„ฐ + +Kanana Safeguard-Siren์˜ ํ•™์Šต ๋ฐ์ดํ„ฐ๋Š” ์ˆ˜๊ธฐ ๋ฐ์ดํ„ฐ, ํ•ฉ์„ฑ ๋ฐ์ดํ„ฐ, ์™ธ๋ถ€ ๋ฐ์ดํ„ฐ๋กœ ๊ตฌ์„ฑ๋˜๋ฉฐ ๋‹ค์–‘ํ•œ ์œ ํ˜•์˜ ๋ฐ์ดํ„ฐ๋ฅผ ํ™œ์šฉํ•ด ํ•™์Šต ๋ฐ์ดํ„ฐ์˜ ๋‹ค์–‘์„ฑ์„ ํ™•๋ณดํ–ˆ์Šต๋‹ˆ๋‹ค. ์ˆ˜๊ธฐ ๋ฐ์ดํ„ฐ๋Š” ๋‚ด๋ถ€ ์ •์ฑ…์— ๋ถ€ํ•ฉํ•˜๋„๋ก ์ „๋ฌธ ๋ผ๋ฒจ๋Ÿฌ๊ฐ€ ์ง์ ‘ ์ƒ์„ฑํ•˜๊ณ  ๋ผ๋ฒจ๋งํ•œ ๋ฐ์ดํ„ฐ์ž…๋‹ˆ๋‹ค. 
ํ•ฉ์„ฑ ๋ฐ์ดํ„ฐ๋Š” ํ•™์Šต ํšจ๊ณผ๋ฅผ ๋†’์ด๊ธฐ ์œ„ํ•ด LLM ๊ธฐ๋ฐ˜ ํ‘œํ˜„ ๋ณ€ํ™˜๊ณผ ๋…ธ์ด์ฆˆ ์‚ฝ์ž… ๋“ฑ ๋‹ค์–‘ํ•œ ๋ฐ์ดํ„ฐ ์ฆ๊ฐ• ๊ธฐ๋ฒ•์„ ํ†ตํ•ด ์ƒ์„ฑํ•˜์˜€์Šต๋‹ˆ๋‹ค. ์™ธ๋ถ€ ๋ฐ์ดํ„ฐ๋Š” ๊ณต๊ฐœ์ ์œผ๋กœ ์ด์šฉ ๊ฐ€๋Šฅํ•œ ์ถœ์ฒ˜์—์„œ ์ˆ˜์ง‘๋˜์—ˆ์Šต๋‹ˆ๋‹ค. + +ํ•™์Šต ๋ฐ์ดํ„ฐ์—๋Š” ์•ˆ์ „ํ•˜์ง€ ์•Š์€ ๋ฐœํ™” ๋ฐ์ดํ„ฐ ์™ธ์—๋„, ๋ชจ๋ธ์˜ ๊ฑฐ์ง“ ์–‘์„ฑ(false positive) ๋น„์œจ์„ ์ค„์ด๊ธฐ ์œ„ํ•ด ์•ˆ์ „ํ•œ ์‚ฌ์šฉ์ž ๋ฐœํ™”๋„ ํฌํ•จ๋˜์–ด ์žˆ์Šต๋‹ˆ๋‹ค. + +## ํ‰๊ฐ€ +Kanana Safeguard-Siren์€ SAFE/UNSAFE ์ด์ง„ ๋ถ„๋ฅ˜ ๊ธฐ์ค€์œผ๋กœ ์„ฑ๋Šฅ์„ ํ‰๊ฐ€ํ–ˆ์Šต๋‹ˆ๋‹ค. ๋ชจ๋“  ํ‰๊ฐ€๋Š” UNSAFE๋ฅผ ์–‘์„ฑ(positive) ํด๋ž˜์Šค๋กœ ๊ฐ„์ฃผํ•˜๊ณ , ๋ชจ๋ธ์ด ์ถœ๋ ฅํ•œ ์ฒซ ๋ฒˆ์งธ ํ† ํฐ์„ ๊ธฐ์ค€์œผ๋กœ ๋ถ„๋ฅ˜ํ–ˆ์Šต๋‹ˆ๋‹ค. + +์™ธ๋ถ€ ๋ฒค์น˜๋งˆํฌ ๋ชจ๋ธ์€ ๊ฐ ์ถœ๋ ฅ๊ฐ’์— ๋Œ€ํ•ด ๋‹ค์Œ๊ณผ ๊ฐ™์€ ๋ฐฉ์‹์œผ๋กœ ํ‰๊ฐ€ํ•˜์˜€์Šต๋‹ˆ๋‹ค. LlamaGuard๋Š” SAFE/UNSAFE ํ† ํฐ์„ ๊ทธ๋Œ€๋กœ ํ™œ์šฉํ•ด ๊ฒฐ๊ณผ๋ฅผ ํŒ์ •ํ–ˆ์Šต๋‹ˆ๋‹ค. ShieldGemma๋Š” ์ž„๊ณ„์น˜๋ฅผ 0.5๋กœ ์„ค์ •ํ•˜์—ฌ ์ด์ง„ ๋ถ„๋ฅ˜๋ฅผ ์ˆ˜ํ–‰ํ–ˆ์Šต๋‹ˆ๋‹ค. GPT-4o๋Š” ๋ฆฌ์Šคํฌ ์นดํ…Œ๊ณ ๋ฆฌ ๊ธฐ๋ฐ˜ ๋ถ„๋ฅ˜ ํ”„๋กฌํ”„ํŠธ๋ฅผ zero-shot ๋ฐฉ์‹์œผ๋กœ ์ž…๋ ฅํ•˜๊ณ , ์ถœ๋ ฅ ๋‚ด์šฉ์ด ํŠน์ • ์ฝ”๋“œ๋กœ ๋ถ„๋ฅ˜๋œ ๊ฒฝ์šฐ UNSAFE๋กœ ๊ฐ„์ฃผํ•˜์—ฌ ์ด์ง„ ๋ถ„๋ฅ˜๋ฅผ ์ˆ˜ํ–‰ํ–ˆ์Šต๋‹ˆ๋‹ค. + +๊ทธ ๊ฒฐ๊ณผ ์ž์ฒด์ ์œผ๋กœ ๊ตฌ์ถ•ํ•œ ํ•œ๊ตญ์–ด ํ‰๊ฐ€ ๋ฐ์ดํ„ฐ์…‹์—์„œ Kanana Safeguard-Siren์˜ ๋ถ„๋ฅ˜ ์„ฑ๋Šฅ์ด ํƒ€ ๋ฒค์น˜๋งˆํฌ ๋ชจ๋ธ ๋Œ€๋น„ ๊ฐ€์žฅ ์šฐ์ˆ˜ํ•œ ์„ฑ๋Šฅ์„ ๋‚˜ํƒ€๋ƒˆ์Šต๋‹ˆ๋‹ค. + +
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
ModelF1 ScorePrecisionRecall
Kanana Safeguard-Siren 8B0.9260.9430.910
Llama Guard 3 8B0.6920.8780.571
ShieldGemma 9B0.6520.9230.504
GPT-4o (zero-shot)0.8620.8070.927
+
+ +
+
표 2. 리스크 분류 체계에 따른 내부 한국어 테스트셋 기준 응답 분류 성능 비교
+
+ + +๋ชจ๋“  ๋ชจ๋ธ์€ ๋™์ผํ•œ ํ…Œ์ŠคํŠธ์…‹๊ณผ ๋ถ„๋ฅ˜ ๊ธฐ์ค€์œผ๋กœ ํ‰๊ฐ€๋˜์—ˆ์œผ๋ฉฐ, ์ •์ฑ… ๋ฐ ๋ชจ๋ธ ๊ตฌ์กฐ ์ฐจ์ด์— ๋”ฐ๋ฅธ ์˜ํ–ฅ์„ ์ตœ์†Œํ™”ํ•˜๊ณ , ๊ณต์ •ํ•˜๊ณ  ์‹ ๋ขฐ๋„ ๋†’์€ ๋น„๊ต๊ฐ€ ๊ฐ€๋Šฅํ•˜๋„๋ก ์„ค๊ณ„๋˜์—ˆ์Šต๋‹ˆ๋‹ค. + + +## ํ•œ๊ณ„์  +Kanana Safeguard-Siren์€ ๋‹ค์Œ๊ณผ ๊ฐ™์€ ํ•œ๊ณ„์ ์ด ์žˆ์œผ๋ฉฐ, ์ด๋Š” ํ–ฅํ›„ ์ง€์†์ ์œผ๋กœ ๊ฐœ์„ ํ•ด๋‚˜๊ฐˆ ์˜ˆ์ •์ž…๋‹ˆ๋‹ค. + +#### 1. ์˜คํƒ์ง€ ๊ฐ€๋Šฅ์„ฑ ์กด์žฌ +๋ณธ ๋ชจ๋ธ์€ 100% ์™„๋ฒฝํ•œ ๋ถ„๋ฅ˜๋ฅผ ๋ณด์žฅํ•˜์ง€ ์•Š์Šต๋‹ˆ๋‹ค. ํŠนํžˆ, ๋ชจ๋ธ์˜ ์ •์ฑ…์€ ์ผ๋ฐ˜์ ์ธ ์‚ฌ์šฉ์‚ฌ๋ก€์— ๊ธฐ๋ฐ˜ํ•˜์—ฌ ์ˆ˜๋ฆฝ๋˜์—ˆ๊ธฐ ๋•Œ๋ฌธ์— ํŠน์ •ํ•œ ๋„๋ฉ”์ธ์—์„œ๋Š” ์ž˜๋ชป ๋ถ„๋ฅ˜๋  ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค. + +#### 2. Context ์ธ์‹ ๋ฏธ์ง€์› +๋ณธ ๋ชจ๋ธ์€ ์ด์ „ ๋Œ€ํ™” ์ด๋ ฅ์„ ๊ธฐ๋ฐ˜์œผ๋กœ ๋ฌธ๋งฅ์„ ์œ ์ง€ํ•˜๊ฑฐ๋‚˜ ๋Œ€ํ™”๋ฅผ ์ด์–ด๊ฐ€๋Š” ๊ธฐ๋Šฅ์€ ์ œ๊ณตํ•˜์ง€ ์•Š์Šต๋‹ˆ๋‹ค. + +#### 3. ์ œํ•œ๋œ ๋ฆฌ์Šคํฌ ์นดํ…Œ๊ณ ๋ฆฌ +๋ณธ ๋ชจ๋ธ์€ ์ •ํ•ด์ง„ ๋ฆฌ์Šคํฌ๋งŒ์„ ํƒ์ง€ํ•˜๋ฏ€๋กœ ์‹ค์‚ฌ๋ก€์˜ ๋ชจ๋“  ๋ฆฌ์Šคํฌ๋ฅผ ํƒ์ง€ํ•  ์ˆ˜๋Š” ์—†์Šต๋‹ˆ๋‹ค. ๋”ฐ๋ผ์„œ ์˜๋„์— ๋”ฐ๋ผ Kanana Safeguard(์œ ํ•ดํ•œ ์ฝ˜ํ…์ธ  ํƒ์ง€), Kanana Safeguard-Prompt(ํ”„๋กฌํ”„ํŠธ ๊ณต๊ฒฉ ํƒ์ง€) ๋ชจ๋ธ๊ณผ ํ•จ๊ป˜ ์‚ฌ์šฉํ•˜๋ฉด ์ „์ฒด์ ์ธ ์•ˆ์ „์„ฑ์„ ๋”์šฑ ๋†’์ผ ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค. 
+ + +## Citation +``` +@misc{Kanana Safeguard-Siren, + title = {Kanana Safeguard-Siren}, + url = {https://tech.kakao.com/posts/705}, + author = {Kanana Safeguard Team}, + month = {May}, + year = {2025} + } +``` + + +## Contributors +HyeYeon Cho, JeongHwan Lee, Deok Jeong, JiEun Choi \ No newline at end of file diff --git a/assets/Kanana-Safeguard_Siren_Example.png b/assets/Kanana-Safeguard_Siren_Example.png new file mode 100644 index 0000000000000000000000000000000000000000..b5b62bc3756b691d0a37ffa07ce0bb9b901e9fda GIT binary patch literal 26940 zcmeFYS6GwJ6F(YIiXcS=L3&X@KtOu0Qj{(Pq>D(eks3NEpdz3my%*`dcLWrW7J3W4 zg%*N92oRF|WBL9r&egd(=jQ)D4^Ni&-JPA;ot>ST{p>qE9d!ya1~LEuK=D}P(Nh3` z2wx<~BPGWFcyc!7_^$ zBfqr9w|5wO{7A{rj{v?%k#6A~gh1owMQ*+QIOJi~*f9cRf35zN*7j*utm*L8y$Pwr ztM_Mbr;%uURIyUlAZ?#lVWanVcGe*M^_7I;^BcZ;#d}oq7hYoT%1_Rc-@OprO?a&6 zUMW{8d}a2dmhfH$BK2I?Xu1s6emao~fzC);+d-C`D+}9ad~sM@mJRPW@5PSlhZ6{l zX9s8~6x56Uuy@j0ffHHBltIuq`73zte+$rTHwzkii>kaav)wAQVf%#BLI?ibw^3?a za^&rfN9>NGjm<%K{J~kE`<3hdjE{4yItl)^9N0>>77UTzZaD~!2$z!^k)N=Z<^UK* zELT_m+6-Q?A5vBkWBpszRE0JS&Ey-1`k7e~RLg8XTi4t`0dU>67 zL3616!Y^hyIg8eL?6@|hquWdYp0{MYI;lgR#uxaFl?wklf!wyuAS*h5Hv@BY`@kWj@Q ze`SV8$l>KNx4WqJj|?k__^*s7IZ0pEw0+h;Ui2Pi35zQ@^F6+=5?ZgwZQfg5*fhV%YS;q zkoSSQssb>|8Yla3|DU9aoRT8}kZm8IlyEYVQ1!SLOuZY5BvK0Zm$Ohc29P;y&7?N{ zbwQ}Iw&LYs!v@C@Xe;Jm;{@vq+k19237dOSBhQ=$M9 zC;udHAm?0P9C3&Eq_6TzjF=N>Oi=x;pZ(y(JHrDp=)bN-kR6E?M*JJVQ5JKX+jh)k z>C#t|b2|UlRWutArID;BteRf;z5PE?<~6P0Z(60`YVT-6e=i@L0*FwlYV(25nj-Xn9C%Qh2ybtN&*!sb%{}e5|y_mg!?4hsq0>Xw5 zP>lU2g!JopJtBG&0uAJUOiFz&0dQXVCeUYL_m?Wb>x01h(rx6iqe^HTt1qlI7JcPk z>+HNo-d8h?2)3t(c>jB~?v?UOvqwRuoNyFxK-Rez3jZ5M9Z}&@sMInj{RaB=1TP?q zRV0bwUl$oAh}qe*qZKM0a)9H1>h0B#y3S9DMNLw#nQbqT>{5^y*Q53NCCPn>&O4`J>bD5qM!iqN}tdEPp6sVj{!QO1Rx7uz~5J)WT2Lz zP~77GL*yqZQ}A>H8Bn+0fAeQJI-9&xIR?1;mzAQT`Jd-veGh~FTYbo;k;_!NE0n)? 
zir>%Fdh$}Ljrsrj;eC~XO-023sQ-R0Vw-u0sRzxl|3{E_KuTQv;Jqn{9DZKCjB4(od2Wn;eW)1{{O33<@RS*9RdP;5W-QE6x!(XaH7|CT`S73 zFPLUKAxx50A@dNy7Kd;Arh&zdbiOW4i;vD%kfmByR#^n0JXb@1i#SSfda&r~b1?f5 z4%>5Ue_#yo^Yfc!l9zQcUCj+Ue?VSLlkR%fe{!g`he-5pJYTh%L?rQBEEy3zpA;To z6*SQSkh0w-U;_Z8Vm^FG=3I)1?;xo^$}PCDf6T-n?KcmhX<2*Z6hi7S`k-;i zZo0g6IQzU#du=4%)}+NNrR#f3M+l4(clPv<;rfg>(}Q2r6D#3e4cEWVEY;0h9S8*_ zH^7%5^ZXA~oPAElh|D6zZK6)LZC7S#}cJ2JwNb!G-5(}+gb3yjEY z66*973mAHRBC3lQwu&1lP;}dyZevB>&OaChkk0gybz5xt0RR-_5mGCv+`#7C znqxn-1v0y~2SndtU^qe{eZD&77wvKYCdAg59tsPmN-_z_W<4Ku=thLfiarYJKuu|w zs0VCI8f-3Wj9>!bsZ(|_dVYzpLKLB&3ZoSM43u49VgR?NmeO|mZR#Z zd}v;jn}fVJ5Ow7fBZb3D4bgOhr>(0ES18;C8ETv}a2xh;5p^Cw-Id>cE8+XDw^q3% ziW1nG`UL7)dH&KiOj&-I=(h3WLf$OZ=-Z7J!0_;QO|Y_FS-5!C&Cw^mli=8<9&#wE z@A@4bY4t#tb*>OUn@O7rGv89BW5>n93`l%rl>Iq6G2!|4FNnlx(2n z5iI()AlKy;La$go4Z3@KQfqumdsd%3-^8j?++ayABQ@|7-Cks^EQCKOL6;^N(WXWf zr0CH)9+t)zdcO^LFb%2#P1uEGp|1D}lA8NEpZxm%n*(XQP5koykSc?}_$enOxD>!v z;ja|;aG%HxgE`h}mGt7d@MC`djNKzu7;-};Dw5+0gIuJgX5Q9gvl_2vT*SyH8USzh zxCgY%bM2mdY@=WVin|@QJ4ppPWu0X`KQ3~bp|b3Bdc`t40VA8N_EMul3ILwpz>7_R z7ke>NE`TGXg8ZNj4evWxV3G;kNh3K06Ff&#X^uZ6U-^RXlo7E&W0q4tLmrbTWes4$al&QJHLVzT9O3qX;(hh_vGMJoceXsID;IJtOy{@ zrYR@Ioowj=jgFIK_OXxj|tFy3@RY|0a8QPEJ6af)6xwyCV%4Z;d z$#(zPlv~F4Kr{fg|6~zHtGu1dy94qr<0^+`C-7Aqb#^x_23WoDemcE=Z%^3%lWpge zyw}fM&B9pS2;xe=InBbw5h^?7Mb33MzP{dGZA%c8-F1<82T>o3Ofa-H+-URa8nj}V z15L{tqi5$w^wGBFfaFa-cbE-EgU6x7I1?j}kS{`(V)(T@3+6n7#z7_EsWs)gG8nwA z@<%T0PW{4*D+a^vg~u<(_iWDm+{GW*Bzl%7S|Jq1TdqOwf)*=)QuI-Fynv6f0BS{x zR9fs@sK5?~gvMa)X~FAYdr6D^mnk;fM;(jrMt?CNs^hzpiqVGx=KCAa7J$Ib*qz)b z@mBU=*|CQ>2ixiOg?(n2jEL5$ z{0%>?{n`?@aq1zRd>i-8_oX5T#x9%sOwSsuIKsvZd>V6Dy`UtHcyvP#@(S3LAXF{-;POxAhk#>Ur6l>ZD2z{$n>niv1n)c1G8 zA23x0k?#|%z{RzT{Vjp+PkpPEAPu% z#bL3jw8rOXwUo6;>YX($y7uARz5#<`Iy+Rm8r3>k4Nyi^nW%a&z0mnqz`gkiN z>&zGP5Fycdyof+g*5hyK;bWQ;c5kP1l@ zgQZE~p>7FShk~GxgV3?J{qmgb4rzER*nu9 z8Y^4*dPnq&*uiV^Af6od>hhwF;dPHN>mgfacb|~aJ%d`_oX)JAaqA$G$bvly*9}FUO6q@2P6`i%7Kz;L@~Js 
zjij~3ZH-jk2O$#bsd$+75s;1pKsL+OP{1qat*YhxLtXbZ(GL(x^e7`D=goQO30k-X zzVncTOVIp;3#cL)d6SpnazIwFe==PYMB~K;l;3Hlq!dW^_bf#(WKrLqclzQV)xY}? zelg`Kw=DFzE&7O>l-V${5b3y0oy&5BDkdqT&cPKnZOwU`W=Ex2yo6p0_ub?)Mi$m!G;uNh zi`BQo?L;bNu2_Z7izqM9D}Y}6r&{DpQo zx-0UUI)TrVXsWhyVD0wquMCJ}6jD;m55mrmG30C%>=iH$p8JP7P?(q%-bIH>all^% z`9p&ySZAP7xxB3PIul!Bnq*#ka|KB_tZj8dt@Jd*uVlCuRPsP-FWsxq*X_Ok$Yalf zbI<(6&b$h;`L3UK%=$erZ#U_55BADF%nC&*2gFsiF@7sGI!%FJP_D4(_`M}b@=EMh*aj8Mf#(Kb)%bN4C`m8z|`X``!fjVWziRUgoh!~gn^d@S(6Q&b} z%I2V?2K}TJoymbGzv@0QlThv-%L_fjJGOW5vDe1*2fUgluL(#_x+p7YFtt}3(SFz> zBb!M3)*j#k%Pg~?D`AxQL89eEz?J`I56Q|4=%N}LmJ(~L9sq^|WfF50sX<}K= zZDb&l_Ik*%k6i=mmTy<8ZPtuUF9jc?wCLo=QTF?zQ^BQ3db$RvYY9{p-U*^@4Mxo+ zXIlV`vzAU%Ci^B)HLy4rQKB~e@#)&&N^oVJ`y=K`(=1g&#YIHVl9ZquPUqq|=iV>N zmooP+`D}QJKre#bk~-&LZ`Cv|o-2Kpp4)xR;#w%_2(5Pb>VK!NS(-Hoq%$<0tu=Ul zxU8dKQIv$U`J%z!Upc+I>&a2>aSP1aM& z`piYdo+zNR9_hH5f$L|jsJ(C2ln-T=tWr2q4!~hCOKEL8A+^YZZ9T0V-9)L+qB-^9 zpNrT<)F~A{@c|}@9w#D8B}%BkbfVSA^s46Ob0eAhhWhcg%VRaFM4_r%bx(3#D?W-i z`_2iOS#y}kSoK=Ggl0>`xD^JmmweXsq!U**=dp#5m_MYKE@w^thc_OULhQDOz@uwip2VP&$w_?-EDrx6+$SRLTBOMcs(m4kb zPrJhJGOs^gwfe}?<3mL`XjXjC$>P3XhyqpgmBUo>$}Hw5mKb+}-j}FMNIP>!)R}C1 zuO6=U6tFy|;HwkZf-gAkR(tJ?HY~*r#S_Y6NIwgN4rFSW#eF3=cg6Wf#>`7~c`58Y-OBo4s*uEQ z`m$y~5G*rkMH&EAn7Kr)^4O+IuqnGvW*=tbG+z{E#1?9fTm&hBB9c7Nt?V6D9$fe8ITr z&TUBGBnAB{tcG@&2Y0g`F+hpLmVJ)Wn)xkVd=4Cz!Hk2l>P$!SvOi6Kn#M7@HL)Yb z$zpQPV&1;$FuLp7*B;<&%MvNy#Ac=OGHu}zQ9qb(jxBQ5gkaf>T9^Lv6*}u7ryI-Wv_{XvDtP?^6rKvZ&KO^s&5Gtzt$~rG1I= zIEb#~@juQ$DQh(v+jkeeZ)?lgKEX#A5LJ{dA3xHZyQLxaLSdqlDq(cd%QB2SC;zjQ6+QS4hVZxc>Rh_F49#-n>dcS)qQrobZ{o@a1 z1lbLaAwwNsjF&uL+<}prt(H)cF{oDRn^@+d`mP?(QCz2y?uE!8F8i}!cOoq}+9R-B zyONc@8ZMKgTmDg=(EI9!J4LqBOkpC`=jsaqJmrXd)XThwh#Mnmz8#L@ME>B|TiV>& z$9$dygbsJ{p>=c64|2gZ21QZct0&yplHUd2Wwv&N_aq@@PtrvZh6@c7u3lZqM!#~QJHeAH`5!_XT|iLH zLCpK4B#An4ddlxagI9YGJ z5bz=8eZkOsEbqeNLtLO!O{iAm+j zXHC8YCiO6u{AKms*KidCAA?@HnysOPeBs$-kN@gzFPmJu40k^iKT2W zf~e57|K8bMO~#D4WVn+%)Q4|u8hb2u+RUc~w*RtfwW}xS_8Kw|KDTAIAc!&8mr_=d 
z&1+fj&EO2>IR4>d>buzVWIf*+s&Wm%mwFzSx&--=Q3#|c17k%eB`V0CAqc!IpUW!( zVtz;8Rceu;wr@f}J^b^-!`_i08Aq~kte$S@*nP;r-4$Z6`G)9MZ)`oz-n-8;%&N~#%&LYq4$OJZ(*ZPSq6n6v_HyDQZG1s~Dxv==Ue znp$xV?>|g_y}|x`eBu7-L%IholUce>OKtCR*cwdKJ-YX0+9X~u&bNi@<>-!k$fM20 zc3LoxWOtjLm>ba_$I@=e)6x;qB>82%*Ol$G#GUVecROFx(b=C&YH`2Y`@+PeTpDDl zvbet8ych1!wX!lPUy01~Et8Yi1Up zuN@WFCVMfN0EE2_3wy^Ns^1rTT8%gDZOwP$zY`Jk5Y3?Ue(*)srgNII3jp}h^qmgb z&u(S;)cZmX65qgIzeYkFOFWCWSXuDtxl(xKE1%kF`Meq8cJZCSeCu{q<)2NfL!gWm zTSTTsLBhCvlac-Qa}~PsB=03iuG+P?%8D6{-i-K&5WmBYCB2>-fhUU3at=6n^Y)sh?BZ zeI4E!<3GgH^6Y^!T?5? zNZ(w0Ky?#osv!JoRKdhUcQMBvV`9B>}FJ#&X(pYg_!g6hojodq`$Kw5UdtnV|OII4^IQ z(dRauspu<#!6r<;1D&Jy*f4ML4b@Kr4P|}%5;g)(^|IjD47*G!y6=V@6tw%#(hZRl zS~1e<-`ls4cH2!08X#I*H1uUacCf$eG`5s?T`h(qdE2yOF(kdosgXzXMP#QMaF9T$SLSH%Ky+|#Uit>pV5glfn=hH41eA?{dIS@L@Muw}*&`u*p8%UsT5iQ;I zt8wv79$T-a7y%2+A}Br1qFm1RvBw;ApFw-_^z=I~1OyISIQt^LZikDy^GvhWRvs*- zxo?|f+K9XHtcJJs>D)@YzEjWUCKD9s+!18BS7On^BC*SKgYHpdOU-dPdF~ZO=H(da z-Z5Dpw=uh5$?RNQqc}xA)T%5Z49+kRR*up;b14o$$CN=z? 
zekLzv#GcGcDep-H2l zewprj#ZQFY+#Uh?-{bwPom~oo^%h{s6An0s65X8`rh%sgO_9X8(a1W93jbI>W6Q-; zrNWcb%vk)m#noG-q zkLReySxP^N7EZ`;#ELO$DO?`H3>wQ5aYxIY{61$!O=KH!?S~o(vHFb=VaJx(G(LgO zveAxw_D?>RrEC!s^TZ}w@{>O-GKB;x7z?=CSntezVfg0I+#p^pJoz4~({&s&-;v`@ zTi;=Je}^fD_pV%L&BzTfuPo!e1Ns^HEF`_|MK*77Nuxo6)OXSMTf3zwZ-sI~Q;79g zt}6B%*7md4#^el`5jCapvNI$zI^cSHrrotcv6sd@R?+E|$i|o&U*DsX8`30qDbO)_ zo%&xvhW({zmy-^n>GRLse83-+33J{Z)#i{VlY1VqS2+3HdClrK1!n zZ%x^`Q{Tf^e~>EYRmhThi~oR78N$g+{Y$|X)zBPVi5&Z2{et0@%tyVHlIYvsPp4i* zpe$Nl>sT!hkCM2EUpejGpplqKWIf{AKPJ=oJ(_j6UW@N@p=<{ndV7NcxSUyQ++YD* z;sW6cT@&2j7a#Z0^UFu(BYdm|%#b(p_4wQrrZIb<^$~@ObFurLs;ciw&qh7p$}G>> zsM8wbli82<9M^lbKXn=?X6JZVo6k!DWZe`S!S7k<1b)v%?!TZ$ zG-%37g>el$ET;H$`hVI__5(IOfC%*3GXrXKC>7NPeo8Z(8{7cD$OG<*H4 zBN-|@6)nn!+PQ*gbMG*qSf71=DfnO(Egu$${>30feE6ZlZavL5+l2TS|y3v=*2c;6|g z9aOPJo?~}Wo3nTy;MroE)$$Y4cAAy|`K zJW`Ij>m#?d!)rne?|ZBQefdJZ?5H6rvgTg-vX7Kcu7f3Cgwo@lOc^-S3_fz>v%MyF z58^Yq7u0GfHS!1q#5=lkrI^&m=)pe+NV~7geV66nL2n9T$F@K1Ra#Be9m@K#j0R>% zyA38orTWDM2tsRwuF@;^(B7de({(=$sOZQznt5Op;ystT5mBN1#*?PzQ z0M3Z6DKXf`+_RW<4k`B?$yJRu6;aSj+0*pQDh|^~gqIS|EP+v*N%X9z~(xCv#U;+|$9Rl2U+mG8Pj0D%9_;~UUiBk*Q7+{m4= zEOPL3EgVhj<4}t1zDW_I-#4uD97e}`lXw;k@?srcfyiwT(Ji0OxK}^dMz?2{9&ipu z)Ml>h2A_I{v~C44SzO{1$PQkYw<%7wObcJ930%Usir$^BLANEkS3MU>MBz2g$Bag<7Y-`)R(m#X z8vSC+wBgv(>A++-BehZ57_oUG;WIMT1eUEAoI-bfJyi;-_qTdsMLhZ#Z=BespZ}!e z6u;VLw>gD1_t8I?J-l&T?3$J0ukw|g!(zdiQT_q;@+bAi7Q(BhQAFXvhlGy4P1{(1{R&Du-m*#=-(BtggY;gnpsi03^^>R))WHvW*5BqjCIw&5xQNHA9anphL;j)}8?;p?x9KVEP&TcXsm{D5gm({`9t_A=2*^iWR-zP8lq@sPfj3OT@m0yaC_-$zo{2khV^_{uaE=XIyZ}2c{E4ksddD3v>xc1~&V?3d5}r^)YXyfsckQ)d-4&^4CBSajY`V*O6}AdM%@q4xKphzY8vwA) z!}x+Lk+sQz?O4`kSLcq{iR+7znh0XR{HI7?7O4dVI1Fi6H3w!EB-&*9qS&yT_sC+&u(^wp(n0YRQRylKz9^E5TbJ0Kluv%&mPmt5G*bhK9_} z_H}3F9|Y8M;^(A7_ztg&k>ZgN!clFNJyB7G!4)2dZQ$d}UbZCu7E$A8zwty~(!Y87 z{bYCJ7ysX)Aw2=x-;$p7)zH5s#R&Ws^S4N=_CF}n|E>6chv)wTrFhmzkh+4+fDU6Z zB$pxXZJzNvdwbFC@c#a{zG&vHZ($fahwYWRWz^|u3Kkpe`7`&2okv%83JlZAAJx{^ ziauz?gb13}_2VICjs=|)!g2mqH|u3VosbqwN-C-}$<;n+Z9vjot$iF0;l1bfz#H>N 
zs?ZS?z+1duS;{guQmlkKgD47{j{V6q* z1n&K|006-ANKU{b3;fB5tGHiS#vdqHer(m_oT+)S(n4&&^XDBnF+rLFX8fWiX$R;5 zK~Z?_@zKvvAgpy+f)3o6VOp`+Iy_%rDxz?TcahrJK(&8yjlYdg9fgbwkfzrnq^ION zl#k!=NA~_ga}PSrfM8{Nd*WS>U5}cYnzo4{ywG|;spOTG?d!EsC#2nJEV1JAt2!pFkYcdiZWCx{|0LP|bx%i!C9ZR7 z)35G(&d)z|p4)K%9yzM1scXqieqV-Zn&}DJj!}A#Vo8cmu;U20Gd4obIXV_{T z+0Aw7gN7%PlGnxW>2I!$WXND*2gwx0`kr^9(rIrB3=5ev{2@AIel@gcaCCHZva?ov zQBN%08=qmR4xj8pDu)=>PQAW40E>JNbk46Z9+&K-flrdWx#1F>LIv$|vazJ`B_ zMSpL@fX`$ zjvqng2De3FAg1uJbcVcuW@|^Y$7sg(`pAjzYYLXc61VPYY7YFS~-@oX#22)+1v zFr85sVx_J1UQ%3K9&XQYB;z%q6arp8yqGzgN@(DCh0l2!s1zaFa`_K4S$l&2tkPtB zD)>_x??HG@D(?Z!hNEN&;eCwGl$}Y-1h4Gnz)Xi5gR0Wka_od~aY-d2UB0%SW8?)Yn3>ky?e`y3?-&O&W%*1RH)u6{#HIQLV*?e>4#A&WX5R zW6F!{%mwguMSJzjS2kYy;NqJ?erQp$>taLRaP89eD(6<5uf9b%QiRC2B__PrxNZOI z1dGa`zjpSOitzsDdPP;^#KHdN5A6Lizj3G;Y;BP5?F}1&i*{9sl3rV`IPP>_!~Ky~ zk%1TR>0RW|QuXR&l~sh}Z;Xp$qX95=tH`X?Cx&%kr&MD7aQ^wTBAqV$S?0bmdXDS% zG=9}!pm2q%khO^nI^~Fi>BBtB>ewV+>ea|61?!>~vySSL}Zdr@SKl7@HyaC|2HLO~=b%(48 z4~?C}Atdqsq7(5J1jPpceoeFumWwd%$|*OA8sinMQvsLbH=ztNNL?8|1xxDOYq-I*JRESYj_302a1kt1n8_BB+?XU$m3`;I9)ss{BE=n`cQGtr?3?0&b^o7H z%$~<>7u)|TKVhd?j=U0t8#v@)Q+?=CYOYTQfU=79S^Lf7;L7Q!& zmR;`h0eR=aWMYl@yFVaK6*9y{n~2|Bk-5Bp&u>@mCoE*`I%V)xRG_ z+yCp*{*D3g&;NUm|FIGhQ6FYfeu-E)hpK^M zV`6Uo$Y$3`XOifP%@XSC)j7lA=c-6JBDA)pb!cD2KBa=enr(N3D9{2T|J-Sb&YD$7 zXCX|(u&=$W0c4D(69kG~g5DxEUeADvUDr51Sb_rLc$zE|kVNtleBIFs9 zRsWWa`s?pqUUbN~Yq^t^Q3O8+M;DEFcRiKUe`-yo9=^mU|IlN%Yy4S3`Ls zBF|#weJ8Wle_szO) z?hd~4cbS0GJ6lBdr}QhL>yXp~95}vM4u{uB(1HnFay4D>0KFI$0T~mfPx#B7D>nj5mKT zzdo_fkO<`<1?a!sx|m>mhVOdg_ydZ7_n0g1bgzBroPCF`PBQ$Q`n^8|V~w+J8M@qYcA;H7+gkojec2T^Xv1e--&{{svHQv*0e za0X6Wzb`xS#B341q(2HUDltM z#z2R(`XZ!5$3d1#YKwm?4a0UkDsTjkn?_*z7tqBD5}vShTRb1fdcX4wfb9D$A(z*V zI}}>RE{~Erh4F8|e{b`M#&maNpP4zgQ-tMfx5 zkPpfBYU+iU%X_d95jd|~%GZn}Mn!w@?$4fyVDZMrnV}5)g()wVh)}*ZYLCH;5Iaj$ zi!oj=Mi;0c$dGyUUPDk`w`yu&_RAaF``E1}ZA z-o*1bD)nZW9CG8valuT-K!{FUFhae$u@#d@l}4g~n(JSdJL{(#P78*WPXq@aki#yP zvo5DZCW7r}`qGvzZ`WRIQKi}W_Xn_0VTP|P5&iVuvcR3AE^Wcf0n6(OByvfjkF6cP 
zJoo#As$O$xh27fXv$|ND^laLR+`EL=?i}c*@?j4#DF}7Q=3od)^?17x+qEnR8-XJm zf8u+6P>s$?w1RLtwK}(#nFoIjQGoi$J~#d0mdDXGW}_he#TiYU5wHYyWqu3wDDU?_ zKUxlA|Fw{C*D-5ScoAK!dx2h!zp8=nsk*3R>_87LtAs(_XIK+i;j`2N+l@4)ElRs%D8M2AP zc~!dNZ!kf@1F)+_>4CF$0&gmHbrXFXbt!2Tit8yz@h2g%C#F1f z*Jbx@tbUOgr*a&$!{V_&+>OAEc?VWu>1}%o0oHx2Z6Wig7xwN7#W1P2*x=0?zQPFU zc~qT+ktLej^4l3V7uBM13bdZ5HKuN<9(&x>YsRhXkJh*W3VTb@7G0%ecxQUykQ-aG zLGfO->)9CcChFPz%=GdRdq}6$40)tit0(7gkRnVy;v*i``pLI-7vW|l5d__)pO9`i zku+6@eE5*RR5&8F*N%Mp#**ZS$;y<(xh-3PynUo?=Tl?B(nyB@(f#i%$V}tObJ0QP zzV@Z4ThgcdU{xrvGRwa#KmmEJcFAn!Vw6y1q6K4ulD+=8z~@6nn>`oVb~{Ft~Om$Fxy(hODeg~<^CRN zzMs5Wef7)8H7$5-ukF!b?>h`BCj^@uh|u%yp1KDfn{l|KHa_)WlO6#H#b1|1eHMsa z4^QE!W0`()us0ZjQ|){;)Oko*&JFak%PC1gSzNFvyi9>YVHTlrXXw}xOvfcMWQcj5 zYpiA-V;eztQhxc(JJ>cBpOsUkl_#^iT!vjIkjcn&H~gB`5FKmp8kO*H@9qJ8b&lr^ zlkg(Dr-w#r-%3Lrk6-HL1KeyQFxl77+bn*4#lrLYnnT+A1p_u5<8U2OTJ{Sw zJ%{W>%N$A}GtKXk4kApx?B}!Z+8Cg;i~R|8>)8B(ZJAu|M73~VdV3z?@zbpP?cV_K zNC0)wYvrmm!miH(FAN`kMy_pUaq%@zmtpj_qU|h574|K7if?ZIER0Pi52!W9-Ho_q z(3q0;K;sGdRQGt~4T+wJ%8vdv;apQ*XVRny)}x4U9kXg<$j2>hR&)`o@coYys!a{? 
z%96n0?b4x~@sd~Z9*4PPthhn5C^C{u-j=sy-+3o4;$FlN5g8j_t|l}SUI#X8mN$_b zQ8wO!qiwH-lBLym?qQAWu6Lg_m9~2pH$;rYfq6cR8*@4|v&>JWuXafbetCG+6m{#8 zttT>AdKzfLbjhZ|`o#9m?M`rwusi5qKU*pT<*ok^R ziX$j;N?*ZGpX~;vZ8wb%PaXB*bR@m_)lU()o&8xME0&7(nU!p9wTWtRik^*KD5 zPar5Rq&n#ypvpQ;prXdIZU+Sa;fh!Y?22ZoEX#IyA<#X67-Wq^p{x%17?$Z6f=kH1 z8ixZ!kX!aZt?jIqR)6daLCgfs#!GA(XrvNw!Zz;u|On#vx>+ksWZIA;e z?+1m4cxR%L3&U?dcpXef*LyF5PapDA02X76QF~Ez^UtikCNQ~;yc+6rUgt*F@$1C9 z^rNQrq(%Icw~~baU{PN^t-XmWm5Y5j3XMIQB=H7kdX}E&tf8YL-rrnOSM5Rs;GDg< zUzMkAE;Wp!_8lJ|0F>JN9sFs;v(7<{&#hC01Z18D2ykWJ1h zvw^>!7UW%E{k4Sa;wY(O8#f%+PQEyZTftyQ#fEEX@}-hQwVu$vrotla3$YCep2c%c zRcz&SAsqfQ8K(=t`zhY^uM!+;0s=rTu;u}oItXPwB^B$m>P2h2o-&2}0NL7pO=en+ z`woiiY9_BF!mN}>>*+Qp_M@G9+N6l61%|q>EY|J+WKQ z>gH%$IN~a;vmeDfuSWK^PHWWz@sm^il8SZmtXHS_Ba(hl#CJ7s*?E|T7`!dUGYA$( z=()DW=3=>ad=neeEN@M?ajK^M%=YiV#^9`je+|B)>=N`JBd0J`Az11N@fR?DoAd2E zr9{2UW&$RK!kFeu*^zR4ooyA(%enWZCDlD%uYqo+?pWs)}J z$J<5GtX2L>c@(tXtg9dC9PSY+vT;H~mFNae!?`7y4E9wM;NeB&JE-#>bZ*qu-G&mH znqyYE)4Y>w>tZ2Kr=_Y>wXF+yX#Dr9Rkpgxb&1}PNxb&Vw!I_o!kD=+w(FLz6s!{Q z)7qWv5j;4@X-qaJ9`Du|d}n&)qfuKjH$Vy~6zDeK^;hE-9FKl8Ig+QL};H{)Lvo?jsxt9iH+VCtq8>x#?rXUio!eE z^d>1Gb;p``fZ?!U&A4m=_=mTyu?necVH9pFYzRikYz*!$m+^d4SMFvRubRhOUa#A~ z(9z)-2gAwUh(Wt~rE-6CwzTcYkE=FatS58|mZ$j;@J zK)Xk%fWk5<+W2Lzi)ykJduUo)vw(VZ)0FnU6F(_!ylYDtNdCwGaZ=)O3dqeMTG%u70!O!RU!JB%Cx zbw59JgrK^OI|tGOmYTW9iAq#UYXtZ~@}2&(lm)qm5XvN@s$8-R*%3u_g=^sOCJ>ftjPH68{z`wq@R-oYw>Q3cYueF_%N{I0%?<;iXtk)@UXV&r~@7JwTKZkdg_DZ6t1V<# zsRFv9-3rk&Okp5Y`}#3X+!b8%47f>kCxhv<6nWciJV#M4!PdvJ-QwCFKTi|3<_)-u ztj)sejvUFRa8BHGuA<9pSviv7@>hD-@~z_kH239?P<`S5mr#wZ zVzP%+BoSj5Mxs)7L$ZglWGvZ<5ut1?%D%5NBTM#uLZPf>-?!`rWjBn^o%H^GKYzmK z{J_2EJkOcuob#M}&wbA8d5-33)}_;R?CKQn{i4p*ckA(3C8mF&586D@5YhK6GU<)t z-8Qct`dkB@sHpw{1cIV*4!@7#PP=>KpvRLwd93z#rY}dF&B&EFyr|@S__Ex+kGF}#uf9Ks`B;w zwg>z_T*gF=6qJ|bCGhnz-Ll5=U~%u(JCRI*SHGq&DkTfE{P*C z>mtvvZA(X86_l3B%FlrmN}>4Cann{3!*!{oEJJV9VN+ETG;XVVyC=AA&P;bbZ?>=6 z=X>fC)J3}PuKtN1B&MyCL2`(6>h9x>nLZ?H!Ya;rNM5*2&jtDcvf&yXe 
znLB-$?$~J;=t}*F-NPa8tcag);Y8%aUWczC;dTcWMKZFm`Sh@_TSgjYjs!lRdOIS{ zPxu_2tY*#8H*@_i#ldH)2tT_nGo=Fd=Ytl@*6q2cdO-t_EromLbyo$fYL_|`QI#Ez z?8rq1-830R4ex*Jadc7^4t@@~?>Mr~qDyf{8t4t)+;`u@rT!F%c!2xZBj&g4o9lU# zUO#L$8>d3;1My~F`bvL?PX8rMtmaX2N zR;6FkF4;-v&vxOZWIU4woq0L+UWBeJ)s)YKJt;`sW>vX1n4v&r3(aRiTpmW*zaCky z$NA|t$vfe!S`9jnTFf~BySR};2K;tAK8nrx3IHwDL9p1Qr!pDeHXEOYsZjT3tKC11}8cndL=D}ng#TeD7K5^)Ku zDp**1W5n(Bk$6>Mt>|=I30K(!tEeKDYhSoL&oxedB1GAir;}_881?EovLLw;AR8?P z!eX{J>8(pQTCK5^dRmV|)dhFEIqktMBx%FCm^;pQKXTo&%fprXQat!T3BPBgSkA6n z{Ni2%uCd`gpfzRYyii_WN)I)*^Ox_q!|Kp4CR$wTlX z<$-5)uDOSRJiz9XW|5ZUoiT-$2Eev?rgZ)6n~{fx()+om6|?rkk!NO08nup)H`@p%oa2 zuo_mB$bI;Thl8^ioVKyIx}oY0<(ZZ|(gVozE<}B1^xd6bqURZYWeS|ys!5vIIE`oT zrFjl{u;sZ_o#_4$FDQ!IvgMRBFe%BswJsOyJI*pZP!?6naB$dAqrU!7OQo{$*PWx^ z+&b6JyE6#9-^`Szv($oydB7U6Z6hZ^Y|s%u&8U2sKZN|0aOnZV+XyCy?lT`v zY4tDVNEqDZ@WBBB#%%MR({*ABgT-whV##R%N_M#Q1penPTZB(ZfqJTrOqYNNyb%an*`TQsuP{`Sg~+T-c-j- z9<2!p7W2ZLQRw=Rv(_KU=(jzBbZBh{FPN4jB|MEvg&#gZ-3vnJUe6*tvL9R^joO$> zXUu9s^e+kDh8XBB?%mw4TR}(|mhK1s?DUOuf4LodpNVc5Q3dHGAJv zN_w^PX%0L=e6g3idL|Nr+^j8oT?e~SYuNH8P>XB+k(2$B#gYCz5PW2P+R32irixX5 zO3!|GY;ujngY?+)dtNf7^oY}Y?_8PY<~JRg_KUAvD!KKxn5hZPN_ z*B~%ccn?L5UaKR5p-P4m1J8{NN!^F0p&p<8D9A*8Z~tf4!PHmNmr#~0!pqZUfgc=d z@RA9fKn|TeB6bo3+(1>@|M*^>Q92%E;y6Q@Ut|ujLd%!D3-s@9&*(N8BdBfGj7GX8 zNkvKpq$_s*br~DGUw?=VSr2Szo99l7?2bC@@-Or6KshLfW%v%eB_G$x|C#7YeN^#? 
zQHr$7(sRK~86EDhVGhLEEJ$|W1x>JFP9HecsIk+z3(mS|0VHiGv>*Z#QQRavbLH6p zb!H&+P{DpEQMBbDzt8NiqCO0*uN>9d2l^F%hs4icg4LH2aADoM8Uq~@1y9bg8webf zjA>_X_h7nZ?O$4Jr8ri2NYC}6`CshGBAKt)y}cjd~to*84a zI@*jF?1#OVf3juFxA=QTaB^kT+Ya&6dlvhhj#kR|Qy&`F9X_l`2sLn_K(ce-kX&JO zRH#b74~EaajnF0VJ3-SZnW$ADn#`Xu8EQ)JlBGH%&kxN8drd`Ekj_ke1Dq{v7m7$D z45Iz0QsYnboRm}A@5ke4811->PWtD0E6bp^lIh=+jt|6Y`C*79Bf6zg675pb4-ksP z1{UGx(*+QcZ$K)4CGOTfd2fZJ8Z3Xf-o$U(KUmI(Jv19GBXMS>qh zd-*HR+`KXD>MW5iO!c{k;5=?Lk>E#2HZ6(~qZeAK-$nEvRvMG-`Kcr{r1YrsKBIQBOyDT5w@?y)w zDHSF5y36$>kj4+~Pe@$9QFYjUM{*`k2q#Tvwlc)){Kv|i^y$^D3c6$dW$|F zaKk@2T_J9Ieo#69x@1@$c&)RbFanvtSlDBGXwM+WL9!d0&p)6I(ZJQyg=%@vEw-_n zqexC7l6+lP3~H{fm+=+~-i}VN9JDAcAMSDzWBSqk>!5*Klfb`v1Vb;)4-afw&%bZ~ zNna(Dc~!aSxjqj-^{AC0-yvo)ix9(Aj0qq2tXtYSSYv{HPQOC6+KvPcQr4|Oak{#6s1J| z)bqtBI1F~T>)-#%_Ki*JMII167kGchb9<|im0IZ$!&t6AGSPRp%evU^E;Gl%LXF@o zuGa!Fm5NHbsM4r-nx-@qCZ6t0no&BcDQ}ayAfQieR}oZ>9m6*&e+t@=vnL|yXC0t+ zXGxZqm>Ke_*Kvvb{d*ox_|8XD374c}e|>iPNx@29v)G=1H0sZ-NG9Zl;aaJyf5itJ zjr%GrnlTTnm2E9w!PyDPP1Oh&a1*C^*LJwW@(->Wy>%?N*4d5S`aMGlN3DsV54k(` zjTFQYUor0a?t`sivc8`RwbnqhV~@i|V?DSJ^&RUxKr&6vFI#z}Kp%wadlpsRaAz8I z1zp%};H%xn>H*i2YDFs(r5dJ(AfHxo2AR)*H2TRf?f+TBeUp@qMk786xPxQl#fMUIDbW=zO_e- z@4nPDMwK^mx(hn+g16GzPb;lRa{1wTlNF%%r?gcEz>Zti85V)3>?@bjdx zUrhDpaC)5NrQT;Kiw5tZz}MV#m!k#inS}+tUa{XA#g=OHYkCxxad|IeeR^c|*0XpX zE=%NJ6lWZBs%if)2pOJmyuVwQJfTyHhEcKpwNTu9uGE{gXeTb?YpfE|7$6btDma_o z4CJr4VJ+%B;! 
zp(Nz~Xppu8wSFF!_d95&SkS}d5pY{rK?I@z4F93^E%!<&#nKMsQxM+Z6h`ZY;N6!A z;bP%X?n+^ah@P1bLq+M@^pMi}3qszuc0U!+iJk=lt{U=)Kay>8k?5(Dao)eM)z?Ro zFB?d*7!DYA$tW2H>Ju!jS1KT{-5ul?lQ;C#A-BPmz*>T$NloCo2!Aj=B$B!F>Wl7C zTL|Gm5HDlmZ%HYkS~QjFpHiV6l1~|tk)}M=N{Cj9!3~uP;bL^M2fMBK&5aIif`o_U ztJ=4{FMV=7Ex6L_`ok~BeXXO>qea~^*092$73;mWw8)w_Z_%Xqp%C>`}kZ95k+B>eMUVAD_#B1^lJTUf;6rPI4fF`*~xmJ}eSfKo=K zBQth!O;z>WT1o4reaOQ{Yygh$Q-AQScy%L18Hp8*wyf~m!3q0*UKm_GdhuxgB$~A- zWhW@rm*;5#79&GsSD$(tqoSbcD^N5kniX&{GA5fTA!4vuxZ~+mUV_ws?NHbS#mG}YiCY0GG=x{B ze<(3waPcAWsG^?OWas*ovY*?ms+I9bE20rQbqy^EEk-f6SDm+#YnY?YXHF4#0AZM- zFCNoFox%V%X14<}TNw2PXkuY)&VA-(nUt}?P9O0X)s=Kc_aVg;X@XY?1ZXKVSr={$C5(?QMU_s;Q1l3Z@3>66pN@IXRc|TMZaLIw+M0;)1GhQI zSe@7&F@_I2dAX@DfeBsB^M(8No59hjrAet%uduZ`Dpo(W;2c2nJt9%Rt(f8Q(RTcg zMudU2qfs!$a91f;aR|68z7YB<{cWIOespD3|4)B2iLDiWn6@*+mr6TeNycA1)C{&= z=P|NMDC%@u-TmZgI=~s2%z3k-k+#du6m+(zT#yKdjjdKcIcg>DE9)XkqH3GP!*88( z??t>}c4$qTN@U0RX0k8@2eFQA*A2)|9T`pih%`_+=>pjd{O}Z#+1P}Dz7UAh)v|5+ zSlKf02Yaoku7h#g)V$bh4ej?>@MZ7Bf@p~ldJxJh7p0xjDBG`(9QD1wZ14Epoas$% zqbnzk+_?c*sHJI37qOn=CmGv92?r5W%{;(I|6TqLI^c(w2$ap@dzkrwns29Y7QSo(@Wv2YRZL<-qgI5y}$ z_FPdihdgFl9U6lx)%%(;H%Tk9wtsH^q+al2`5mcsqYgrX+>w+Gi>YbNM}NztLUlbC zLAv@ik-WY=);>5jj~Ezf6GWqkBJHUsM`di{YgP|n8`T4K-`lD50R7jf@(iA$zK!L} z+GQEC$}I6aXNLxP7xEvr=z%gF$GH_B3pd-mrFc*?8Mr~;{c7cmIik1B7n5WE^`q;x z3|7L4kCvr>TMq(TvO(my=3$lh+a0b2y(YZ0qrS-&hrcotVCzX00JaZE2w7)DoLzlJ z2M|6Y$r)*<{Wk(PI)c!CEMzp4x+*mfm>UqXKXXmwH)%q2z=Rk|{#GYrWrV8%zLF!E zKTlw*#Wf(+`)@9s8ytQw9>bKnbc34N(ER}1&fc~CckGH3oIM2KgRRwF1?klK5i{!j z5mP3Z6Y%)v8Z)Z^ArKj9=xGr97fNI=G5)TL*|Ce722ktU!n5(vj-z-=QZ7)!K|zYQ z+9PgWLzsZC7l%rc^=)oCjkag0RZOQsv`_3u}Wjxw9PmGfatE@+2Z~K zR^y1H{6$X&kh$3Su4RKH4Ylh|&sM?4hDk3bD`H5>WZ0b5Hk&*h*gt>(d@Wu4fCV=4 zt;#@*nHBCR>lBgd_lkmCm4yv{lCGy`48%nNZ#sn5>Y~S$DV~C0I^@BFYA?#x=4AKh z=y4#743XRKRERzUDkjf~V6XNt(#`xZpktfwDRV~u|{&oO-tg*$n(7ImhJ-Ek^ExSn2z;EAz2R{c{VDUJT z=?&i)tc)8`#RGCwt-2;!X0|2)AcgTmp)91UR8-&Lz{`*#rODq+{FqZ9xEvNDNHTRs zzK$mZqp8rCPNY?}Yaee}R^MsPkf#HcX*FB2V 
zo!M<;^X4wEe9@BHHJkc=Ad(za8lFh(>*x5WKLi6Pc)-4+QznDv1LA{0N4NmC7k}&f+^!4?@tLmSjTrz+2KsSO0cq3XzdTnB zZ4wN}Ovre=V;Xqy)y+iT?RdI9YA_FZgAxt^f?w}e zv*bR4BdG$we_(Prm*?5(r!ukbZnD8lb1s;m$<~KfX%~di zGluEp$*dNE!$?kAGEu)N;REiB9LM*-2bhAR>XQOxCUCNoQ(9P3f^X4Wby*O39Ki&i ztxPyk)W%8)C*OetfyTKW-7Y2-YrCg+?8se7&eS2tnD6CmVRJFD89dGdFbpkp*NAz0 zM;@#+;3$xj-Yegqbc;3IK=tab|9`x)oSv!m>Qn&?$pObw1_*wNPqjolJ2)6e!uS8N z253ko!W$2?OtgS7vS#{zG>fq&fg7@3)x6?|?8P*X7CdGLZ*`mgcb zKbmWjH*DlOi%9Ya3i6p7u{5i&W61#77%>G7(!J}uZ7u_2sDGJm!k*9WtSct>_)Ce> z?VeVaGCwXzl9%sup7D9_&85*9Y9E33LnX-;1MX~)f8$bm*4o2vDm6xICVf1O5)HJtr# zus(oQC54xaOS=NCTIOV#K-JkQW;iSpW27ig;g<7`wM;_%r+B(m&0|lIngfyEq${4l z!sQ4*OMc^ylhPB%jDT$v=LU(|`U2(6E$JxO(?2gZOhp_y|9L|I>|L}+f7*$j`>E$Q zM_oMqU(fhA{jXLD{5_9iK7L0;z>_-7eOqWg&E=r;^S`RuzqU<=g`jn$f%mZLWRn?T zUY_HU?o%_XyNK_T54a$V6b!OHqb8=Vqs0GIR7c<-Q9jSN2CI9OBJJ=~>TO{D3ZfXn#w5(?d`Ce~N0{%c@svuKm$OsDVR zTut^k>cs!6aLAi?tRZ@=(|37snb+L<4Nk{ND9EA`?dn zWPe0qt4@D9hy9<>utc*hsk~ed7g(dBof@_I8ytoD!0tYH`ozDP^tt`hliCr(v5%8o z_CA0u7ndtbzwwSj2=%dGY2Oc~>YJzfgJV2V zCnTu&eETZCV%C1#YR#0xZ`} lyY>d~z3t4ex0}6pL?JGa7|Z_iFq6!2PetQ)!7cN^{{enJY-9ic literal 0 HcmV?d00001 diff --git a/config.json b/config.json new file mode 100644 index 0000000..445fb24 --- /dev/null +++ b/config.json @@ -0,0 +1,36 @@ +{ + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "bos_token_id": 128000, + "eos_token_id": [ + 128001, + 128009, + 220 + ], + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 4096, + "initializer_range": 0.02, + "intermediate_size": 14336, + "max_position_embeddings": 8192, + "mlp_bias": false, + "model_name": "kanana-safeguard-siren-8b", + "model_type": "llama", + "model_version": "1.0.0", + "num_attention_heads": 32, + "num_hidden_layers": 32, + "num_key_value_heads": 8, + "pad_token_id": 128009, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": null, + "rope_theta": 500000.0, + "tie_word_embeddings": false, + "torch_dtype": "bfloat16", + 
"transformers_version": "4.51.3", + "use_cache": true, + "vocab_size": 128261 +} diff --git a/configuration.json b/configuration.json new file mode 100644 index 0000000..bbeeda1 --- /dev/null +++ b/configuration.json @@ -0,0 +1 @@ +{"framework": "pytorch", "task": "text-generation", "allow_remote": true} \ No newline at end of file diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000..1cc459a --- /dev/null +++ b/generation_config.json @@ -0,0 +1,11 @@ +{ + "_from_model_config": true, + "bos_token_id": 128000, + "eos_token_id": [ + 128001, + 128009, + 220 + ], + "pad_token_id": 128009, + "transformers_version": "4.51.3" +} diff --git a/model-00001-of-00004.safetensors b/model-00001-of-00004.safetensors new file mode 100644 index 0000000..9b3ff5c --- /dev/null +++ b/model-00001-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d06490fe1303930a17d7ab7e7b6ee58366483aae2d7677f8191cf855690ee02 +size 4976739632 diff --git a/model-00002-of-00004.safetensors b/model-00002-of-00004.safetensors new file mode 100644 index 0000000..39cb762 --- /dev/null +++ b/model-00002-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8852d257a856ea39178af502daa949065f32f88036c658c6abcabd9515dfc047 +size 4999802720 diff --git a/model-00003-of-00004.safetensors b/model-00003-of-00004.safetensors new file mode 100644 index 0000000..1d6210b --- /dev/null +++ b/model-00003-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d27ed38b991ce936598b1054b66f9ccb3e1e04f0c90a25b6995ff19a7030f66 +size 4915916176 diff --git a/model-00004-of-00004.safetensors b/model-00004-of-00004.safetensors new file mode 100644 index 0000000..eea1bb1 --- /dev/null +++ b/model-00004-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb7b024e19d61a52bf412f68d33fede5678705a737e63037002a42bcc62a3d37 +size 
1168179768 diff --git a/model.safetensors.index.json b/model.safetensors.index.json new file mode 100644 index 0000000..7e1eae1 --- /dev/null +++ b/model.safetensors.index.json @@ -0,0 +1,298 @@ +{ + "metadata": { + "total_size": 16060604416 + }, + "weight_map": { + "lm_head.weight": "model-00004-of-00004.safetensors", + "model.embed_tokens.weight": "model-00001-of-00004.safetensors", + "model.layers.0.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.0.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.0.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.0.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.0.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.0.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.0.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.0.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.0.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.1.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.1.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.1.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.1.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.1.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.1.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.1.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.1.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.1.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.10.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.10.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + 
"model.layers.10.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.10.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.10.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.10.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.10.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.10.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.10.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.11.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.11.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.11.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.11.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.11.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.11.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.11.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.11.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.11.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.12.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.12.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.12.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.12.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.12.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.12.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.12.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.12.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.12.self_attn.v_proj.weight": 
"model-00002-of-00004.safetensors", + "model.layers.13.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.13.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.13.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.13.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.13.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.13.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.13.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.13.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.13.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.14.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.14.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.14.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.14.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.14.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.14.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.14.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.14.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.14.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.15.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.15.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.15.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.15.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.15.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.15.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + 
"model.layers.15.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.15.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.15.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.16.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.16.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.16.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.16.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.16.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.16.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.16.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.16.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.16.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.17.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.17.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.17.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.17.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.17.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.17.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.17.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.17.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.17.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.18.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.18.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.18.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.18.mlp.up_proj.weight": 
"model-00002-of-00004.safetensors", + "model.layers.18.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.18.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.18.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.18.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.18.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.19.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.19.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.19.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.19.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.19.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.19.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.19.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.19.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.19.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.2.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.2.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.2.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.2.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.2.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.2.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.2.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.2.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.2.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.20.input_layernorm.weight": "model-00003-of-00004.safetensors", + 
"model.layers.20.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.20.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.20.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.20.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.20.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.20.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.20.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.20.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.21.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.21.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.21.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.21.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.21.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.21.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.21.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.21.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.21.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.22.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.22.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.22.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.22.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.22.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.22.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.22.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.22.self_attn.q_proj.weight": 
"model-00003-of-00004.safetensors", + "model.layers.22.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.23.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.23.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.23.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.23.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.23.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.23.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.23.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.23.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.23.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.24.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.24.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.24.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.24.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.24.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.24.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.24.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.24.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.24.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.25.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.25.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.25.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.25.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.25.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + 
"model.layers.25.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.25.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.25.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.25.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.26.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.26.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.26.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.26.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.26.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.26.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.26.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.26.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.26.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.27.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.27.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.27.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.27.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.27.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.27.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.27.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.27.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.27.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.28.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.28.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.28.mlp.gate_proj.weight": 
"model-00003-of-00004.safetensors", + "model.layers.28.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.28.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.28.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.28.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.28.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.28.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.29.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.29.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.29.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.29.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.29.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.29.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.29.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.29.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.29.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.3.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.3.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.3.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.3.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.3.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.3.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.3.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.3.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.3.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + 
"model.layers.30.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.30.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.30.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.30.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.30.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.30.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.30.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.30.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.30.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.31.input_layernorm.weight": "model-00004-of-00004.safetensors", + "model.layers.31.mlp.down_proj.weight": "model-00004-of-00004.safetensors", + "model.layers.31.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.31.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.31.post_attention_layernorm.weight": "model-00004-of-00004.safetensors", + "model.layers.31.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.31.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.31.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.31.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.4.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.4.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.4.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.4.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.4.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.4.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.4.self_attn.o_proj.weight": 
"model-00001-of-00004.safetensors", + "model.layers.4.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.4.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.5.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.5.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.5.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.5.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.5.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.5.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.5.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.5.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.5.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.6.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.6.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.6.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.6.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.6.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.6.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.6.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.6.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.6.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.7.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.7.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.7.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.7.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.7.post_attention_layernorm.weight": 
"model-00001-of-00004.safetensors", + "model.layers.7.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.7.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.7.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.7.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.8.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.8.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.8.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.8.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.8.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.8.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.8.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.8.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.8.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.9.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.9.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.9.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.9.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.9.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.9.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.9.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.9.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.9.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.norm.weight": "model-00004-of-00004.safetensors" + } +} diff --git a/special_tokens_map.json b/special_tokens_map.json new file mode 100644 index 0000000..b43be96 --- /dev/null +++ 
b/special_tokens_map.json @@ -0,0 +1,17 @@ +{ + "bos_token": { + "content": "<|begin_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "eos_token": { + "content": "<|eot_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "pad_token": "<|eot_id|>" +} diff --git a/tokenizer.json b/tokenizer.json new file mode 100644 index 0000000..375ec00 --- /dev/null +++ b/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b3a1d203c0f5b877ab993325bb79547e8ba6fa4bd0bed12d6dc55c22966c1df +size 17210995 diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 0000000..2739431 --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1,2108 @@ +{ + "added_tokens_decoder": { + "128000": { + "content": "<|begin_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128001": { + "content": "<|end_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128002": { + "content": "<|reserved_special_token_0|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128003": { + "content": "<|reserved_special_token_1|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128004": { + "content": "<|reserved_special_token_2|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128005": { + "content": "<|reserved_special_token_3|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128006": { + "content": "<|start_header_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128007": { + "content": 
"<|end_header_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128008": { + "content": "<|reserved_special_token_4|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128009": { + "content": "<|eot_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128010": { + "content": "<|reserved_special_token_5|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128011": { + "content": "<|reserved_special_token_6|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128012": { + "content": "<|reserved_special_token_7|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128013": { + "content": "<|reserved_special_token_8|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128014": { + "content": "<|reserved_special_token_9|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128015": { + "content": "<|reserved_special_token_10|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128016": { + "content": "<|reserved_special_token_11|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128017": { + "content": "<|reserved_special_token_12|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128018": { + "content": "<|reserved_special_token_13|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128019": { + "content": 
"<|reserved_special_token_14|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128020": { + "content": "<|reserved_special_token_15|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128021": { + "content": "<|reserved_special_token_16|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128022": { + "content": "<|reserved_special_token_17|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128023": { + "content": "<|reserved_special_token_18|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128024": { + "content": "<|reserved_special_token_19|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128025": { + "content": "<|reserved_special_token_20|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128026": { + "content": "<|reserved_special_token_21|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128027": { + "content": "<|reserved_special_token_22|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128028": { + "content": "<|reserved_special_token_23|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128029": { + "content": "<|reserved_special_token_24|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128030": { + "content": "<|reserved_special_token_25|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + 
"128031": { + "content": "<|reserved_special_token_26|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128032": { + "content": "<|reserved_special_token_27|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128033": { + "content": "<|reserved_special_token_28|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128034": { + "content": "<|reserved_special_token_29|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128035": { + "content": "<|reserved_special_token_30|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128036": { + "content": "<|reserved_special_token_31|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128037": { + "content": "<|reserved_special_token_32|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128038": { + "content": "<|reserved_special_token_33|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128039": { + "content": "<|reserved_special_token_34|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128040": { + "content": "<|reserved_special_token_35|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128041": { + "content": "<|reserved_special_token_36|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128042": { + "content": "<|reserved_special_token_37|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + 
"special": true + }, + "128043": { + "content": "<|reserved_special_token_38|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128044": { + "content": "<|reserved_special_token_39|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128045": { + "content": "<|reserved_special_token_40|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128046": { + "content": "<|reserved_special_token_41|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128047": { + "content": "<|reserved_special_token_42|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128048": { + "content": "<|reserved_special_token_43|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128049": { + "content": "<|reserved_special_token_44|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128050": { + "content": "<|reserved_special_token_45|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128051": { + "content": "<|reserved_special_token_46|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128052": { + "content": "<|reserved_special_token_47|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128053": { + "content": "<|reserved_special_token_48|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128054": { + "content": "<|reserved_special_token_49|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + 
"single_word": false, + "special": true + }, + "128055": { + "content": "<|reserved_special_token_50|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128056": { + "content": "<|reserved_special_token_51|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128057": { + "content": "<|reserved_special_token_52|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128058": { + "content": "<|reserved_special_token_53|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128059": { + "content": "<|reserved_special_token_54|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128060": { + "content": "<|reserved_special_token_55|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128061": { + "content": "<|reserved_special_token_56|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128062": { + "content": "<|reserved_special_token_57|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128063": { + "content": "<|reserved_special_token_58|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128064": { + "content": "<|reserved_special_token_59|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128065": { + "content": "<|reserved_special_token_60|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128066": { + "content": "<|reserved_special_token_61|>", + "lstrip": false, + "normalized": false, + 
"rstrip": false, + "single_word": false, + "special": true + }, + "128067": { + "content": "<|reserved_special_token_62|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128068": { + "content": "<|reserved_special_token_63|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128069": { + "content": "<|reserved_special_token_64|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128070": { + "content": "<|reserved_special_token_65|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128071": { + "content": "<|reserved_special_token_66|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128072": { + "content": "<|reserved_special_token_67|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128073": { + "content": "<|reserved_special_token_68|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128074": { + "content": "<|reserved_special_token_69|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128075": { + "content": "<|reserved_special_token_70|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128076": { + "content": "<|reserved_special_token_71|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128077": { + "content": "<|reserved_special_token_72|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128078": { + "content": "<|reserved_special_token_73|>", + "lstrip": false, + 
"normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128079": { + "content": "<|reserved_special_token_74|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128080": { + "content": "<|reserved_special_token_75|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128081": { + "content": "<|reserved_special_token_76|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128082": { + "content": "<|reserved_special_token_77|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128083": { + "content": "<|reserved_special_token_78|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128084": { + "content": "<|reserved_special_token_79|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128085": { + "content": "<|reserved_special_token_80|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128086": { + "content": "<|reserved_special_token_81|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128087": { + "content": "<|reserved_special_token_82|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128088": { + "content": "<|reserved_special_token_83|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128089": { + "content": "<|reserved_special_token_84|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128090": { + "content": "<|reserved_special_token_85|>", + 
"lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128091": { + "content": "<|reserved_special_token_86|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128092": { + "content": "<|reserved_special_token_87|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128093": { + "content": "<|reserved_special_token_88|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128094": { + "content": "<|reserved_special_token_89|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128095": { + "content": "<|reserved_special_token_90|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128096": { + "content": "<|reserved_special_token_91|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128097": { + "content": "<|reserved_special_token_92|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128098": { + "content": "<|reserved_special_token_93|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128099": { + "content": "<|reserved_special_token_94|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128100": { + "content": "<|reserved_special_token_95|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128101": { + "content": "<|reserved_special_token_96|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128102": { + "content": 
"<|reserved_special_token_97|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128103": { + "content": "<|reserved_special_token_98|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128104": { + "content": "<|reserved_special_token_99|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128105": { + "content": "<|reserved_special_token_100|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128106": { + "content": "<|reserved_special_token_101|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128107": { + "content": "<|reserved_special_token_102|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128108": { + "content": "<|reserved_special_token_103|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128109": { + "content": "<|reserved_special_token_104|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128110": { + "content": "<|reserved_special_token_105|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128111": { + "content": "<|reserved_special_token_106|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128112": { + "content": "<|reserved_special_token_107|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128113": { + "content": "<|reserved_special_token_108|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + 
"128114": { + "content": "<|reserved_special_token_109|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128115": { + "content": "<|reserved_special_token_110|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128116": { + "content": "<|reserved_special_token_111|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128117": { + "content": "<|reserved_special_token_112|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128118": { + "content": "<|reserved_special_token_113|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128119": { + "content": "<|reserved_special_token_114|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128120": { + "content": "<|reserved_special_token_115|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128121": { + "content": "<|reserved_special_token_116|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128122": { + "content": "<|reserved_special_token_117|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128123": { + "content": "<|reserved_special_token_118|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128124": { + "content": "<|reserved_special_token_119|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128125": { + "content": "<|reserved_special_token_120|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": 
false, + "special": true + }, + "128126": { + "content": "<|reserved_special_token_121|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128127": { + "content": "<|reserved_special_token_122|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128128": { + "content": "<|reserved_special_token_123|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128129": { + "content": "<|reserved_special_token_124|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128130": { + "content": "<|reserved_special_token_125|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128131": { + "content": "<|reserved_special_token_126|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128132": { + "content": "<|reserved_special_token_127|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128133": { + "content": "<|reserved_special_token_128|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128134": { + "content": "<|reserved_special_token_129|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128135": { + "content": "<|reserved_special_token_130|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128136": { + "content": "<|reserved_special_token_131|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128137": { + "content": "<|reserved_special_token_132|>", + "lstrip": false, + "normalized": false, + 
"rstrip": false, + "single_word": false, + "special": true + }, + "128138": { + "content": "<|reserved_special_token_133|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128139": { + "content": "<|reserved_special_token_134|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128140": { + "content": "<|reserved_special_token_135|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128141": { + "content": "<|reserved_special_token_136|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128142": { + "content": "<|reserved_special_token_137|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128143": { + "content": "<|reserved_special_token_138|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128144": { + "content": "<|reserved_special_token_139|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128145": { + "content": "<|reserved_special_token_140|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128146": { + "content": "<|reserved_special_token_141|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128147": { + "content": "<|reserved_special_token_142|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128148": { + "content": "<|reserved_special_token_143|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128149": { + "content": "<|reserved_special_token_144|>", + "lstrip": 
false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128150": { + "content": "<|reserved_special_token_145|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128151": { + "content": "<|reserved_special_token_146|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128152": { + "content": "<|reserved_special_token_147|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128153": { + "content": "<|reserved_special_token_148|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128154": { + "content": "<|reserved_special_token_149|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128155": { + "content": "<|reserved_special_token_150|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128156": { + "content": "<|reserved_special_token_151|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128157": { + "content": "<|reserved_special_token_152|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128158": { + "content": "<|reserved_special_token_153|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128159": { + "content": "<|reserved_special_token_154|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128160": { + "content": "<|reserved_special_token_155|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128161": { + "content": 
"<|reserved_special_token_156|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128162": { + "content": "<|reserved_special_token_157|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128163": { + "content": "<|reserved_special_token_158|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128164": { + "content": "<|reserved_special_token_159|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128165": { + "content": "<|reserved_special_token_160|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128166": { + "content": "<|reserved_special_token_161|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128167": { + "content": "<|reserved_special_token_162|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128168": { + "content": "<|reserved_special_token_163|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128169": { + "content": "<|reserved_special_token_164|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128170": { + "content": "<|reserved_special_token_165|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128171": { + "content": "<|reserved_special_token_166|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128172": { + "content": "<|reserved_special_token_167|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + 
}, + "128173": { + "content": "<|reserved_special_token_168|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128174": { + "content": "<|reserved_special_token_169|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128175": { + "content": "<|reserved_special_token_170|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128176": { + "content": "<|reserved_special_token_171|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128177": { + "content": "<|reserved_special_token_172|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128178": { + "content": "<|reserved_special_token_173|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128179": { + "content": "<|reserved_special_token_174|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128180": { + "content": "<|reserved_special_token_175|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128181": { + "content": "<|reserved_special_token_176|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128182": { + "content": "<|reserved_special_token_177|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128183": { + "content": "<|reserved_special_token_178|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128184": { + "content": "<|reserved_special_token_179|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + 
"single_word": false, + "special": true + }, + "128185": { + "content": "<|reserved_special_token_180|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128186": { + "content": "<|reserved_special_token_181|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128187": { + "content": "<|reserved_special_token_182|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128188": { + "content": "<|reserved_special_token_183|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128189": { + "content": "<|reserved_special_token_184|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128190": { + "content": "<|reserved_special_token_185|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128191": { + "content": "<|reserved_special_token_186|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128192": { + "content": "<|reserved_special_token_187|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128193": { + "content": "<|reserved_special_token_188|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128194": { + "content": "<|reserved_special_token_189|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128195": { + "content": "<|reserved_special_token_190|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128196": { + "content": "<|reserved_special_token_191|>", + "lstrip": false, + "normalized": 
false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128197": { + "content": "<|reserved_special_token_192|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128198": { + "content": "<|reserved_special_token_193|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128199": { + "content": "<|reserved_special_token_194|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128200": { + "content": "<|reserved_special_token_195|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128201": { + "content": "<|reserved_special_token_196|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128202": { + "content": "<|reserved_special_token_197|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128203": { + "content": "<|reserved_special_token_198|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128204": { + "content": "<|reserved_special_token_199|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128205": { + "content": "<|reserved_special_token_200|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128206": { + "content": "<|reserved_special_token_201|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128207": { + "content": "<|reserved_special_token_202|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128208": { + "content": "<|reserved_special_token_203|>", + 
"lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128209": { + "content": "<|reserved_special_token_204|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128210": { + "content": "<|reserved_special_token_205|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128211": { + "content": "<|reserved_special_token_206|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128212": { + "content": "<|reserved_special_token_207|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128213": { + "content": "<|reserved_special_token_208|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128214": { + "content": "<|reserved_special_token_209|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128215": { + "content": "<|reserved_special_token_210|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128216": { + "content": "<|reserved_special_token_211|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128217": { + "content": "<|reserved_special_token_212|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128218": { + "content": "<|reserved_special_token_213|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128219": { + "content": "<|reserved_special_token_214|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128220": { + "content": 
"<|reserved_special_token_215|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128221": { + "content": "<|reserved_special_token_216|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128222": { + "content": "<|reserved_special_token_217|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128223": { + "content": "<|reserved_special_token_218|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128224": { + "content": "<|reserved_special_token_219|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128225": { + "content": "<|reserved_special_token_220|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128226": { + "content": "<|reserved_special_token_221|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128227": { + "content": "<|reserved_special_token_222|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128228": { + "content": "<|reserved_special_token_223|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128229": { + "content": "<|reserved_special_token_224|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128230": { + "content": "<|reserved_special_token_225|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128231": { + "content": "<|reserved_special_token_226|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + 
}, + "128232": { + "content": "<|reserved_special_token_227|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128233": { + "content": "<|reserved_special_token_228|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128234": { + "content": "<|reserved_special_token_229|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128235": { + "content": "<|reserved_special_token_230|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128236": { + "content": "<|reserved_special_token_231|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128237": { + "content": "<|reserved_special_token_232|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128238": { + "content": "<|reserved_special_token_233|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128239": { + "content": "<|reserved_special_token_234|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128240": { + "content": "<|reserved_special_token_235|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128241": { + "content": "<|reserved_special_token_236|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128242": { + "content": "<|reserved_special_token_237|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128243": { + "content": "<|reserved_special_token_238|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + 
"single_word": false, + "special": true + }, + "128244": { + "content": "<|reserved_special_token_239|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128245": { + "content": "<|reserved_special_token_240|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128246": { + "content": "<|reserved_special_token_241|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128247": { + "content": "<|reserved_special_token_242|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128248": { + "content": "<|reserved_special_token_243|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128249": { + "content": "<|reserved_special_token_244|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128250": { + "content": "<|reserved_special_token_245|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128251": { + "content": "<|reserved_special_token_246|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128252": { + "content": "<|reserved_special_token_247|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128253": { + "content": "<|reserved_special_token_248|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128254": { + "content": "<|reserved_special_token_249|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128255": { + "content": "<|reserved_special_token_250|>", + "lstrip": false, + "normalized": 
false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128256": { + "content": "", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "128257": { + "content": "", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "128258": { + "content": "", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "128259": { + "content": "", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "128260": { + "content": "", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + } + }, + "bos_token": "<|begin_of_text|>", + "chat_template": "{{ bos_token }}{% set ns = namespace(user_msg='', assistant_msg='') %}{% for m in messages %}{% if m.role == 'user' %}{% set ns.user_msg = m.content | trim %}{% elif m.role == 'assistant' %}{% set ns.assistant_msg = m.content | trim %}{% endif %}{% endfor %}<|start_header_id|>system<|end_header_id|>\n\nClassify the conversation between a human and an AI. Respond only with the taxonomy code.\n(taxonomy codes : ['', '', '', '', ''])<|eot_id|><|start_header_id|>user<|end_header_id|>\n\n{{ ns.user_msg }}\n{{ ns.assistant_msg }}<|eot_id|><|start_header_id|>assistant<|end_header_id|>\n\n\n", + "clean_up_tokenization_spaces": false, + "eos_token": "<|eot_id|>", + "extra_special_tokens": {}, + "max_length": 2048, + "model_input_names": [ + "input_ids", + "attention_mask" + ], + "model_max_length": 1000000000000000019884624838656, + "pad_token": "<|eot_id|>", + "stride": 0, + "tokenizer_class": "PreTrainedTokenizer", + "truncation_side": "right", + "truncation_strategy": "longest_first" +}