初始化项目，由ModelHub XC社区提供模型

Model: jekunz/Qwen3-1.7B-Base-sv-CPT-plus-IR-sv-SmolTalk Source: Original Platform
2026-05-12 20:41:22 +08:00
commit d0b6c0d927
35 changed files with 304056 additions and 0 deletions
--- a/.gitattributes
+++ b/.gitattributes
@@ -0,0 +1,37 @@
+*.7z filter=lfs diff=lfs merge=lfs -text
+*.arrow filter=lfs diff=lfs merge=lfs -text
+*.bin filter=lfs diff=lfs merge=lfs -text
+*.bz2 filter=lfs diff=lfs merge=lfs -text
+*.ckpt filter=lfs diff=lfs merge=lfs -text
+*.ftz filter=lfs diff=lfs merge=lfs -text
+*.gz filter=lfs diff=lfs merge=lfs -text
+*.h5 filter=lfs diff=lfs merge=lfs -text
+*.joblib filter=lfs diff=lfs merge=lfs -text
+*.lfs.* filter=lfs diff=lfs merge=lfs -text
+*.mlmodel filter=lfs diff=lfs merge=lfs -text
+*.model filter=lfs diff=lfs merge=lfs -text
+*.msgpack filter=lfs diff=lfs merge=lfs -text
+*.npy filter=lfs diff=lfs merge=lfs -text
+*.npz filter=lfs diff=lfs merge=lfs -text
+*.onnx filter=lfs diff=lfs merge=lfs -text
+*.ot filter=lfs diff=lfs merge=lfs -text
+*.parquet filter=lfs diff=lfs merge=lfs -text
+*.pb filter=lfs diff=lfs merge=lfs -text
+*.pickle filter=lfs diff=lfs merge=lfs -text
+*.pkl filter=lfs diff=lfs merge=lfs -text
+*.pt filter=lfs diff=lfs merge=lfs -text
+*.pth filter=lfs diff=lfs merge=lfs -text
+*.rar filter=lfs diff=lfs merge=lfs -text
+*.safetensors filter=lfs diff=lfs merge=lfs -text
+saved_model/**/* filter=lfs diff=lfs merge=lfs -text
+*.tar.* filter=lfs diff=lfs merge=lfs -text
+*.tar filter=lfs diff=lfs merge=lfs -text
+*.tflite filter=lfs diff=lfs merge=lfs -text
+*.tgz filter=lfs diff=lfs merge=lfs -text
+*.wasm filter=lfs diff=lfs merge=lfs -text
+*.xz filter=lfs diff=lfs merge=lfs -text
+*.zip filter=lfs diff=lfs merge=lfs -text
+*.zst filter=lfs diff=lfs merge=lfs -text
+*tfevents* filter=lfs diff=lfs merge=lfs -text
+checkpoint-2011/tokenizer.json filter=lfs diff=lfs merge=lfs -text
+tokenizer.json filter=lfs diff=lfs merge=lfs -text
--- a/README.md
+++ b/README.md
@@ -0,0 +1,57 @@
+---
+library_name: transformers
+model_name: qwen-sv10m-merged-sv-smoltalk
+tags:
+- generated_from_trainer
+- sft
+- trl
+licence: license
+---
+
+# Model Card for qwen-sv10m-merged-sv-smoltalk
+
+This model is a fine-tuned Qwen3 (`Qwen3ForCausalLM`) checkpoint; the base model ID was not recorded when this card was generated.
+It has been trained using [TRL](https://github.com/huggingface/trl).
+
+## Quick start
+
+```python
+from transformers import pipeline
+
+question = "If you had a time machine, but could only go to the past or the future once and never return, which would you choose and why?"
+generator = pipeline("text-generation", model="jekunz/Qwen3-1.7B-Base-sv-CPT-plus-IR-sv-SmolTalk", device="cuda")
+output = generator([{"role": "user", "content": question}], max_new_tokens=128, return_full_text=False)[0]
+print(output["generated_text"])
+```
+
+## Training procedure
+
+ 
+
+
+This model was trained with SFT.
+
+### Framework versions
+
+- TRL: 0.25.1
+- Transformers: 4.57.3
+- Pytorch: 2.9.1
+- Datasets: 4.4.1
+- Tokenizers: 0.22.1
+
+## Citations
+
+
+
+Cite TRL as:
+    
+```bibtex
+@misc{vonwerra2022trl,
+	title        = {{TRL: Transformer Reinforcement Learning}},
+	author       = {Leandro von Werra and Younes Belkada and Lewis Tunstall and Edward Beeching and Tristan Thrush and Nathan Lambert and Shengyi Huang and Kashif Rasul and Quentin Gallou{\'e}dec},
+	year         = 2020,
+	journal      = {GitHub repository},
+	publisher    = {GitHub},
+	howpublished = {\url{https://github.com/huggingface/trl}}
+}
+```
--- a/added_tokens.json
+++ b/added_tokens.json
@@ -0,0 +1,28 @@
+{
+  "</think>": 151668,
+  "</tool_call>": 151658,
+  "</tool_response>": 151666,
+  "<think>": 151667,
+  "<tool_call>": 151657,
+  "<tool_response>": 151665,
+  "<|box_end|>": 151649,
+  "<|box_start|>": 151648,
+  "<|endoftext|>": 151643,
+  "<|file_sep|>": 151664,
+  "<|fim_middle|>": 151660,
+  "<|fim_pad|>": 151662,
+  "<|fim_prefix|>": 151659,
+  "<|fim_suffix|>": 151661,
+  "<|im_end|>": 151645,
+  "<|im_start|>": 151644,
+  "<|image_pad|>": 151655,
+  "<|object_ref_end|>": 151647,
+  "<|object_ref_start|>": 151646,
+  "<|quad_end|>": 151651,
+  "<|quad_start|>": 151650,
+  "<|repo_name|>": 151663,
+  "<|video_pad|>": 151656,
+  "<|vision_end|>": 151653,
+  "<|vision_pad|>": 151654,
+  "<|vision_start|>": 151652
+}
--- a/chat_template.jinja
+++ b/chat_template.jinja
@@ -0,0 +1,4 @@
+{% for message in messages %}{{'<|im_start|>' + message['role'] + '
+' + message['content'] + '<|im_end|>' + '
+'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant
+' }}{% endif %}
--- a/checkpoint-2011/added_tokens.json
+++ b/checkpoint-2011/added_tokens.json
@@ -0,0 +1,28 @@
+{
+  "</think>": 151668,
+  "</tool_call>": 151658,
+  "</tool_response>": 151666,
+  "<think>": 151667,
+  "<tool_call>": 151657,
+  "<tool_response>": 151665,
+  "<|box_end|>": 151649,
+  "<|box_start|>": 151648,
+  "<|endoftext|>": 151643,
+  "<|file_sep|>": 151664,
+  "<|fim_middle|>": 151660,
+  "<|fim_pad|>": 151662,
+  "<|fim_prefix|>": 151659,
+  "<|fim_suffix|>": 151661,
+  "<|im_end|>": 151645,
+  "<|im_start|>": 151644,
+  "<|image_pad|>": 151655,
+  "<|object_ref_end|>": 151647,
+  "<|object_ref_start|>": 151646,
+  "<|quad_end|>": 151651,
+  "<|quad_start|>": 151650,
+  "<|repo_name|>": 151663,
+  "<|video_pad|>": 151656,
+  "<|vision_end|>": 151653,
+  "<|vision_pad|>": 151654,
+  "<|vision_start|>": 151652
+}
--- a/checkpoint-2011/chat_template.jinja
+++ b/checkpoint-2011/chat_template.jinja
@@ -0,0 +1,4 @@
+{% for message in messages %}{{'<|im_start|>' + message['role'] + '
+' + message['content'] + '<|im_end|>' + '
+'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant
+' }}{% endif %}
--- a/checkpoint-2011/config.json
+++ b/checkpoint-2011/config.json
@@ -0,0 +1,61 @@
+{
+  "architectures": [
+    "Qwen3ForCausalLM"
+  ],
+  "attention_bias": false,
+  "attention_dropout": 0.0,
+  "bos_token_id": 151644,
+  "dtype": "bfloat16",
+  "eos_token_id": 151645,
+  "head_dim": 128,
+  "hidden_act": "silu",
+  "hidden_size": 2048,
+  "initializer_range": 0.02,
+  "intermediate_size": 6144,
+  "layer_types": [
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention"
+  ],
+  "max_position_embeddings": 32768,
+  "max_window_layers": 28,
+  "model_type": "qwen3",
+  "num_attention_heads": 16,
+  "num_hidden_layers": 28,
+  "num_key_value_heads": 8,
+  "pad_token_id": 151645,
+  "rms_norm_eps": 1e-06,
+  "rope_scaling": null,
+  "rope_theta": 1000000,
+  "sliding_window": null,
+  "tie_word_embeddings": true,
+  "transformers_version": "4.57.3",
+  "use_cache": true,
+  "use_sliding_window": false,
+  "vocab_size": 151669
+}
--- a/checkpoint-2011/generation_config.json
+++ b/checkpoint-2011/generation_config.json
@@ -0,0 +1,9 @@
+{
+  "bos_token_id": 151644,
+  "eos_token_id": [
+    151645
+  ],
+  "max_new_tokens": 2048,
+  "pad_token_id": 151645,
+  "transformers_version": "4.57.3"
+}
--- a/checkpoint-2011/merges.txt
+++ b/checkpoint-2011/merges.txt
--- a/checkpoint-2011/model.safetensors
+++ b/checkpoint-2011/model.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f78fd28d6162fd41392fe469bb68cfc323d68863e59cf6c86ea5ad31af34e2d2
+size 3440091976
--- a/checkpoint-2011/optimizer.pt
+++ b/checkpoint-2011/optimizer.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:95e040e16b57c0024f411ef2f1e13ad5656276bfd99fbe6f7857024d34d99efb
+size 6880384943
--- a/checkpoint-2011/rng_state_0.pth
+++ b/checkpoint-2011/rng_state_0.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7350b59a307e1d89d4515e24325811dc1aa8deab5b5b4635887adaaf78ea1dc5
+size 16389
--- a/checkpoint-2011/rng_state_1.pth
+++ b/checkpoint-2011/rng_state_1.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:af262eaf45f7c1f39099b694376de497429ab46c1046a1d9afe70a315f1b6d81
+size 16389
--- a/checkpoint-2011/rng_state_2.pth
+++ b/checkpoint-2011/rng_state_2.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:57f833fda5ff0e7e566107275c268625e3eb07e8475116fe109d9c667809d469
+size 16389
--- a/checkpoint-2011/rng_state_3.pth
+++ b/checkpoint-2011/rng_state_3.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2a6e6037388bc56484982620075eea8724b4696f67f60603b9c448e44f41705c
+size 16389
--- a/checkpoint-2011/rng_state_4.pth
+++ b/checkpoint-2011/rng_state_4.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d2bf73391bb68f0fffcb931501656f3679db7d996fe258d8287099b6cb7a23a2
+size 16389
--- a/checkpoint-2011/rng_state_5.pth
+++ b/checkpoint-2011/rng_state_5.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:222199bb7faa2ce2cb817e7f870ac7c364fb0f0872e17d8a9280f38596da9a06
+size 16389
--- a/checkpoint-2011/rng_state_6.pth
+++ b/checkpoint-2011/rng_state_6.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ca3accfbfe6616f878cfeda3df23f4418e00b348760c584e397d6c92081cb5c4
+size 16389
--- a/checkpoint-2011/rng_state_7.pth
+++ b/checkpoint-2011/rng_state_7.pth
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a64b41c5668afda0c862d9774a14b1c0a390fe6a57086de71f9fdfb00edb457e
+size 16389
--- a/checkpoint-2011/scheduler.pt
+++ b/checkpoint-2011/scheduler.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2b41df694f4954c1e053affa08a57688d639f9026ab853a930f869e4a2a775e1
+size 1465
--- a/checkpoint-2011/special_tokens_map.json
+++ b/checkpoint-2011/special_tokens_map.json
@@ -0,0 +1,21 @@
+{
+  "additional_special_tokens": [
+    {
+      "content": "<|im_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "<|im_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false
+    }
+  ],
+  "bos_token": "<|im_start|>",
+  "eos_token": "<|im_end|>",
+  "pad_token": "<|im_end|>"
+}
--- a/checkpoint-2011/tokenizer.json
+++ b/checkpoint-2011/tokenizer.json
--- a/checkpoint-2011/tokenizer_config.json
+++ b/checkpoint-2011/tokenizer_config.json
@@ -0,0 +1,228 @@
+{
+  "add_bos_token": false,
+  "add_prefix_space": false,
+  "added_tokens_decoder": {
+    "151643": {
+      "content": "<|endoftext|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151644": {
+      "content": "<|im_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151645": {
+      "content": "<|im_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151646": {
+      "content": "<|object_ref_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151647": {
+      "content": "<|object_ref_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151648": {
+      "content": "<|box_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151649": {
+      "content": "<|box_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151650": {
+      "content": "<|quad_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151651": {
+      "content": "<|quad_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151652": {
+      "content": "<|vision_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151653": {
+      "content": "<|vision_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151654": {
+      "content": "<|vision_pad|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151655": {
+      "content": "<|image_pad|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151656": {
+      "content": "<|video_pad|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151657": {
+      "content": "<tool_call>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151658": {
+      "content": "</tool_call>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151659": {
+      "content": "<|fim_prefix|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151660": {
+      "content": "<|fim_middle|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151661": {
+      "content": "<|fim_suffix|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151662": {
+      "content": "<|fim_pad|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151663": {
+      "content": "<|repo_name|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151664": {
+      "content": "<|file_sep|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151665": {
+      "content": "<tool_response>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151666": {
+      "content": "</tool_response>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151667": {
+      "content": "<think>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151668": {
+      "content": "</think>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    }
+  },
+  "additional_special_tokens": [
+    "<|im_start|>",
+    "<|im_end|>"
+  ],
+  "bos_token": "<|im_start|>",
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "<|im_end|>",
+  "errors": "replace",
+  "extra_special_tokens": {},
+  "model_max_length": 131072,
+  "pad_token": "<|im_end|>",
+  "split_special_tokens": false,
+  "tokenizer_class": "Qwen2Tokenizer",
+  "unk_token": null
+}
--- a/checkpoint-2011/trainer_state.json
+++ b/checkpoint-2011/trainer_state.json
@@ -0,0 +1,434 @@
+{
+  "best_global_step": null,
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 2011,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "entropy": 0.8093053457140923,
+      "epoch": 0.02486325211337643,
+      "grad_norm": 3.875,
+      "learning_rate": 7.277227722772277e-06,
+      "loss": 1.7423,
+      "mean_token_accuracy": 0.671543929874897,
+      "num_tokens": 12997394.0,
+      "step": 50
+    },
+    {
+      "entropy": 1.2584100252389907,
+      "epoch": 0.04972650422675286,
+      "grad_norm": 0.62109375,
+      "learning_rate": 1.4702970297029704e-05,
+      "loss": 1.3055,
+      "mean_token_accuracy": 0.7016283966600895,
+      "num_tokens": 25982466.0,
+      "step": 100
+    },
+    {
+      "entropy": 1.1815398697555066,
+      "epoch": 0.07458975634012929,
+      "grad_norm": 0.5625,
+      "learning_rate": 2.212871287128713e-05,
+      "loss": 1.1874,
+      "mean_token_accuracy": 0.7216299413144589,
+      "num_tokens": 38965230.0,
+      "step": 150
+    },
+    {
+      "entropy": 1.1402550649642944,
+      "epoch": 0.09945300845350571,
+      "grad_norm": 0.5390625,
+      "learning_rate": 2.9554455445544555e-05,
+      "loss": 1.142,
+      "mean_token_accuracy": 0.7295443145930767,
+      "num_tokens": 51948935.0,
+      "step": 200
+    },
+    {
+      "entropy": 1.110574235022068,
+      "epoch": 0.12431626056688215,
+      "grad_norm": 0.5546875,
+      "learning_rate": 2.9950061158395005e-05,
+      "loss": 1.1098,
+      "mean_token_accuracy": 0.7351739694178104,
+      "num_tokens": 64951043.0,
+      "step": 250
+    },
+    {
+      "entropy": 1.0846257837116717,
+      "epoch": 0.14917951268025859,
+      "grad_norm": 0.5390625,
+      "learning_rate": 2.9787675503104344e-05,
+      "loss": 1.0836,
+      "mean_token_accuracy": 0.7398869113624096,
+      "num_tokens": 77936279.0,
+      "step": 300
+    },
+    {
+      "entropy": 1.0673179541528226,
+      "epoch": 0.174042764793635,
+      "grad_norm": 0.54296875,
+      "learning_rate": 2.9513863052820796e-05,
+      "loss": 1.0648,
+      "mean_token_accuracy": 0.7432914447784423,
+      "num_tokens": 90932336.0,
+      "step": 350
+    },
+    {
+      "entropy": 1.052229733467102,
+      "epoch": 0.19890601690701143,
+      "grad_norm": 0.5703125,
+      "learning_rate": 2.913068701509568e-05,
+      "loss": 1.049,
+      "mean_token_accuracy": 0.746162725687027,
+      "num_tokens": 103921567.0,
+      "step": 400
+    },
+    {
+      "entropy": 1.0345054648816585,
+      "epoch": 0.22376926902038788,
+      "grad_norm": 0.53515625,
+      "learning_rate": 2.864103466438891e-05,
+      "loss": 1.0312,
+      "mean_token_accuracy": 0.7494943365454674,
+      "num_tokens": 116912063.0,
+      "step": 450
+    },
+    {
+      "entropy": 1.0316937543451785,
+      "epoch": 0.2486325211337643,
+      "grad_norm": 0.53125,
+      "learning_rate": 2.8048595586131855e-05,
+      "loss": 1.0284,
+      "mean_token_accuracy": 0.7500163938105107,
+      "num_tokens": 129905218.0,
+      "step": 500
+    },
+    {
+      "entropy": 1.0241920906305313,
+      "epoch": 0.27349577324714075,
+      "grad_norm": 0.55078125,
+      "learning_rate": 2.7357833875286894e-05,
+      "loss": 1.0203,
+      "mean_token_accuracy": 0.7514490978419781,
+      "num_tokens": 142885565.0,
+      "step": 550
+    },
+    {
+      "entropy": 1.0306694743037224,
+      "epoch": 0.29835902536051717,
+      "grad_norm": 0.54296875,
+      "learning_rate": 2.6573954498890738e-05,
+      "loss": 1.0269,
+      "mean_token_accuracy": 0.750104363411665,
+      "num_tokens": 155872064.0,
+      "step": 600
+    },
+    {
+      "entropy": 1.0152570338547229,
+      "epoch": 0.3232222774738936,
+      "grad_norm": 0.5234375,
+      "learning_rate": 2.5702864076043493e-05,
+      "loss": 1.0108,
+      "mean_token_accuracy": 0.7531800110638142,
+      "num_tokens": 168867280.0,
+      "step": 650
+    },
+    {
+      "entropy": 1.0094216690957547,
+      "epoch": 0.34808552958727,
+      "grad_norm": 0.53125,
+      "learning_rate": 2.4751126370870668e-05,
+      "loss": 1.005,
+      "mean_token_accuracy": 0.7541881857812405,
+      "num_tokens": 181860562.0,
+      "step": 700
+    },
+    {
+      "entropy": 1.0075355672836304,
+      "epoch": 0.37294878170064644,
+      "grad_norm": 0.5703125,
+      "learning_rate": 2.3725912833823623e-05,
+      "loss": 1.0029,
+      "mean_token_accuracy": 0.7544908618927002,
+      "num_tokens": 194857393.0,
+      "step": 750
+    },
+    {
+      "entropy": 1.0026545779407023,
+      "epoch": 0.39781203381402286,
+      "grad_norm": 0.54296875,
+      "learning_rate": 2.263494856399534e-05,
+      "loss": 0.9983,
+      "mean_token_accuracy": 0.7555115695297718,
+      "num_tokens": 207830748.0,
+      "step": 800
+    },
+    {
+      "entropy": 0.9955900900065899,
+      "epoch": 0.4226752859273993,
+      "grad_norm": 0.55859375,
+      "learning_rate": 2.148645409963155e-05,
+      "loss": 0.991,
+      "mean_token_accuracy": 0.7569138373434544,
+      "num_tokens": 220811854.0,
+      "step": 850
+    },
+    {
+      "entropy": 0.9966490264236927,
+      "epoch": 0.44753853804077576,
+      "grad_norm": 0.5234375,
+      "learning_rate": 2.0289083475452206e-05,
+      "loss": 0.9917,
+      "mean_token_accuracy": 0.7566816800832749,
+      "num_tokens": 233809152.0,
+      "step": 900
+    },
+    {
+      "entropy": 0.9946993951499462,
+      "epoch": 0.4724017901541522,
+      "grad_norm": 0.5703125,
+      "learning_rate": 1.9051859013528333e-05,
+      "loss": 0.9902,
+      "mean_token_accuracy": 0.7567966990172863,
+      "num_tokens": 246795198.0,
+      "step": 950
+    },
+    {
+      "entropy": 0.9998035056889057,
+      "epoch": 0.4972650422675286,
+      "grad_norm": 0.50390625,
+      "learning_rate": 1.7784103339072398e-05,
+      "loss": 0.9943,
+      "mean_token_accuracy": 0.7560001449286937,
+      "num_tokens": 259785941.0,
+      "step": 1000
+    },
+    {
+      "entropy": 0.991586543917656,
+      "epoch": 0.522128294380905,
+      "grad_norm": 0.515625,
+      "learning_rate": 1.649536913341075e-05,
+      "loss": 0.9866,
+      "mean_token_accuracy": 0.7574710394442081,
+      "num_tokens": 272778072.0,
+      "step": 1050
+    },
+    {
+      "entropy": 0.9825779674947261,
+      "epoch": 0.5469915464942815,
+      "grad_norm": 0.5234375,
+      "learning_rate": 1.5195367153457442e-05,
+      "loss": 0.9782,
+      "mean_token_accuracy": 0.7593892233073711,
+      "num_tokens": 285763198.0,
+      "step": 1100
+    },
+    {
+      "entropy": 0.9868022166192532,
+      "epoch": 0.5718547986076579,
+      "grad_norm": 0.52734375,
+      "learning_rate": 1.3893893060070753e-05,
+      "loss": 0.982,
+      "mean_token_accuracy": 0.7586962369084358,
+      "num_tokens": 298755470.0,
+      "step": 1150
+    },
+    {
+      "entropy": 0.9881981492042542,
+      "epoch": 0.5967180507210343,
+      "grad_norm": 0.51953125,
+      "learning_rate": 1.260075360664893e-05,
+      "loss": 0.983,
+      "mean_token_accuracy": 0.7583484600484371,
+      "num_tokens": 311732964.0,
+      "step": 1200
+    },
+    {
+      "entropy": 0.990956412255764,
+      "epoch": 0.6215813028344107,
+      "grad_norm": 0.54296875,
+      "learning_rate": 1.1325692744142444e-05,
+      "loss": 0.9855,
+      "mean_token_accuracy": 0.7576845416426659,
+      "num_tokens": 324722969.0,
+      "step": 1250
+    },
+    {
+      "entropy": 0.9845810621976853,
+      "epoch": 0.6464445549477872,
+      "grad_norm": 0.5234375,
+      "learning_rate": 1.0078318199289694e-05,
+      "loss": 0.98,
+      "mean_token_accuracy": 0.7590868937969207,
+      "num_tokens": 337708515.0,
+      "step": 1300
+    },
+    {
+      "entropy": 0.9848950608074665,
+      "epoch": 0.6713078070611636,
+      "grad_norm": 0.51171875,
+      "learning_rate": 8.868029079317466e-06,
+      "loss": 0.9794,
+      "mean_token_accuracy": 0.7590427026152611,
+      "num_tokens": 350694304.0,
+      "step": 1350
+    },
+    {
+      "entropy": 0.9880955889821053,
+      "epoch": 0.69617105917454,
+      "grad_norm": 0.5234375,
+      "learning_rate": 7.703945048612838e-06,
+      "loss": 0.9829,
+      "mean_token_accuracy": 0.758459353595972,
+      "num_tokens": 363687831.0,
+      "step": 1400
+    },
+    {
+      "entropy": 0.9795867702364922,
+      "epoch": 0.7210343112879165,
+      "grad_norm": 0.5,
+      "learning_rate": 6.594837611028224e-06,
+      "loss": 0.9748,
+      "mean_token_accuracy": 0.760101655125618,
+      "num_tokens": 376685856.0,
+      "step": 1450
+    },
+    {
+      "entropy": 0.9814675351977349,
+      "epoch": 0.7458975634012929,
+      "grad_norm": 0.51171875,
+      "learning_rate": 5.549064015615166e-06,
+      "loss": 0.9759,
+      "mean_token_accuracy": 0.7595324893295765,
+      "num_tokens": 389669946.0,
+      "step": 1500
+    },
+    {
+      "entropy": 0.9784578867256641,
+      "epoch": 0.7707608155146694,
+      "grad_norm": 0.515625,
+      "learning_rate": 4.574504283814536e-06,
+      "loss": 0.9735,
+      "mean_token_accuracy": 0.7601935516297817,
+      "num_tokens": 402664698.0,
+      "step": 1550
+    },
+    {
+      "entropy": 0.9806207512319088,
+      "epoch": 0.7956240676280457,
+      "grad_norm": 0.52734375,
+      "learning_rate": 3.67850183261035e-06,
+      "loss": 0.9754,
+      "mean_token_accuracy": 0.7597657778859138,
+      "num_tokens": 415650519.0,
+      "step": 1600
+    },
+    {
+      "entropy": 0.981166479587555,
+      "epoch": 0.8204873197414222,
+      "grad_norm": 0.498046875,
+      "learning_rate": 2.8678081410584267e-06,
+      "loss": 0.9759,
+      "mean_token_accuracy": 0.7597530463337898,
+      "num_tokens": 428641539.0,
+      "step": 1650
+    },
+    {
+      "entropy": 0.9809097257256508,
+      "epoch": 0.8453505718547986,
+      "grad_norm": 0.50390625,
+      "learning_rate": 2.1485318771337776e-06,
+      "loss": 0.9757,
+      "mean_token_accuracy": 0.7594838063418865,
+      "num_tokens": 441636832.0,
+      "step": 1700
+    },
+    {
+      "entropy": 0.9838246862590313,
+      "epoch": 0.870213823968175,
+      "grad_norm": 0.4921875,
+      "learning_rate": 1.5260928682316267e-06,
+      "loss": 0.9788,
+      "mean_token_accuracy": 0.7591392694413662,
+      "num_tokens": 454630338.0,
+      "step": 1750
+    },
+    {
+      "entropy": 0.9816241288185119,
+      "epoch": 0.8950770760815515,
+      "grad_norm": 0.51171875,
+      "learning_rate": 1.0051812621595896e-06,
+      "loss": 0.9763,
+      "mean_token_accuracy": 0.7593851044774056,
+      "num_tokens": 467615642.0,
+      "step": 1800
+    },
+    {
+      "entropy": 0.9775546994805336,
+      "epoch": 0.9199403281949279,
+      "grad_norm": 0.51953125,
+      "learning_rate": 5.89722186347399e-07,
+      "loss": 0.9727,
+      "mean_token_accuracy": 0.7600829027593136,
+      "num_tokens": 480607840.0,
+      "step": 1850
+    },
+    {
+      "entropy": 0.9843708150088787,
+      "epoch": 0.9448035803083044,
+      "grad_norm": 0.498046875,
+      "learning_rate": 2.828461715710806e-07,
+      "loss": 0.9798,
+      "mean_token_accuracy": 0.7588261432945729,
+      "num_tokens": 493591064.0,
+      "step": 1900
+    },
+    {
+      "entropy": 0.9855945162475109,
+      "epoch": 0.9696668324216807,
+      "grad_norm": 0.5234375,
+      "learning_rate": 8.686556305214144e-08,
+      "loss": 0.9812,
+      "mean_token_accuracy": 0.7586447390913963,
+      "num_tokens": 506570590.0,
+      "step": 1950
+    },
+    {
+      "entropy": 0.9880490954220295,
+      "epoch": 0.9945300845350572,
+      "grad_norm": 0.51171875,
+      "learning_rate": 3.2570966767209166e-09,
+      "loss": 0.9837,
+      "mean_token_accuracy": 0.7583207984268665,
+      "num_tokens": 519553398.0,
+      "step": 2000
+    }
+  ],
+  "logging_steps": 50,
+  "max_steps": 2011,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 50000,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 4.417734959016444e+18,
+  "train_batch_size": 2,
+  "trial_name": null,
+  "trial_params": null
+}
--- a/checkpoint-2011/training_args.bin
+++ b/checkpoint-2011/training_args.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b7a70dbcd5c125fa9f57226dc92a2c81002b1337229a9e2a085e4ad26fa46511
+size 6289
--- a/checkpoint-2011/vocab.json
+++ b/checkpoint-2011/vocab.json
--- a/config.json
+++ b/config.json
@@ -0,0 +1,61 @@
+{
+  "architectures": [
+    "Qwen3ForCausalLM"
+  ],
+  "attention_bias": false,
+  "attention_dropout": 0.0,
+  "bos_token_id": 151644,
+  "dtype": "bfloat16",
+  "eos_token_id": 151645,
+  "head_dim": 128,
+  "hidden_act": "silu",
+  "hidden_size": 2048,
+  "initializer_range": 0.02,
+  "intermediate_size": 6144,
+  "layer_types": [
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention"
+  ],
+  "max_position_embeddings": 32768,
+  "max_window_layers": 28,
+  "model_type": "qwen3",
+  "num_attention_heads": 16,
+  "num_hidden_layers": 28,
+  "num_key_value_heads": 8,
+  "pad_token_id": 151645,
+  "rms_norm_eps": 1e-06,
+  "rope_scaling": null,
+  "rope_theta": 1000000,
+  "sliding_window": null,
+  "tie_word_embeddings": true,
+  "transformers_version": "4.57.3",
+  "use_cache": true,
+  "use_sliding_window": false,
+  "vocab_size": 151669
+}
--- a/generation_config.json
+++ b/generation_config.json
@@ -0,0 +1,9 @@
+{
+  "bos_token_id": 151644,
+  "eos_token_id": [
+    151645
+  ],
+  "max_new_tokens": 2048,
+  "pad_token_id": 151645,
+  "transformers_version": "4.57.3"
+}
--- a/merges.txt
+++ b/merges.txt
--- a/model.safetensors
+++ b/model.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f78fd28d6162fd41392fe469bb68cfc323d68863e59cf6c86ea5ad31af34e2d2
+size 3440091976
--- a/special_tokens_map.json
+++ b/special_tokens_map.json
@@ -0,0 +1,21 @@
+{
+  "additional_special_tokens": [
+    {
+      "content": "<|im_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "<|im_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false
+    }
+  ],
+  "bos_token": "<|im_start|>",
+  "eos_token": "<|im_end|>",
+  "pad_token": "<|im_end|>"
+}
--- a/tokenizer.json
+++ b/tokenizer.json
--- a/tokenizer_config.json
+++ b/tokenizer_config.json
@@ -0,0 +1,228 @@
+{
+  "add_bos_token": false,
+  "add_prefix_space": false,
+  "added_tokens_decoder": {
+    "151643": {
+      "content": "<|endoftext|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151644": {
+      "content": "<|im_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151645": {
+      "content": "<|im_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151646": {
+      "content": "<|object_ref_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151647": {
+      "content": "<|object_ref_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151648": {
+      "content": "<|box_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151649": {
+      "content": "<|box_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151650": {
+      "content": "<|quad_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151651": {
+      "content": "<|quad_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151652": {
+      "content": "<|vision_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151653": {
+      "content": "<|vision_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151654": {
+      "content": "<|vision_pad|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151655": {
+      "content": "<|image_pad|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151656": {
+      "content": "<|video_pad|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151657": {
+      "content": "<tool_call>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151658": {
+      "content": "</tool_call>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151659": {
+      "content": "<|fim_prefix|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151660": {
+      "content": "<|fim_middle|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151661": {
+      "content": "<|fim_suffix|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151662": {
+      "content": "<|fim_pad|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151663": {
+      "content": "<|repo_name|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151664": {
+      "content": "<|file_sep|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151665": {
+      "content": "<tool_response>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151666": {
+      "content": "</tool_response>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151667": {
+      "content": "<think>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151668": {
+      "content": "</think>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    }
+  },
+  "additional_special_tokens": [
+    "<|im_start|>",
+    "<|im_end|>"
+  ],
+  "bos_token": "<|im_start|>",
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "<|im_end|>",
+  "errors": "replace",
+  "extra_special_tokens": {},
+  "model_max_length": 131072,
+  "pad_token": "<|im_end|>",
+  "split_special_tokens": false,
+  "tokenizer_class": "Qwen2Tokenizer",
+  "unk_token": null
+}
--- a/training_args.bin
+++ b/training_args.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b7a70dbcd5c125fa9f57226dc92a2c81002b1337229a9e2a085e4ad26fa46511
+size 6289
--- a/vocab.json
+++ b/vocab.json