commit 30b5c65275cde55251aae0669c9f7bf951143e2f Author: ModelHub XC Date: Tue Jun 16 08:09:17 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: eventhorizon28/cadforge-grpo-Qwen3-1.7B Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..52373fe --- /dev/null +++ b/.gitattributes @@ -0,0 +1,36 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +tokenizer.json filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 
100644 index 0000000..bebff19 --- /dev/null +++ b/README.md @@ -0,0 +1,68 @@ +--- +base_model: Qwen/Qwen3-1.7B +library_name: transformers +model_name: cadforge-grpo-Qwen3-1.7B +tags: +- generated_from_trainer +- grpo +- trl +- trackio:https://eventhorizon28-cadforge-grpo-Qwen3-1.7B.hf.space?project=huggingface&runs=eventhorizon28-1777197565&sidebar=collapsed +licence: license +--- + +# Model Card for cadforge-grpo-Qwen3-1.7B + +This model is a fine-tuned version of [Qwen/Qwen3-1.7B](https://huggingface.co/Qwen/Qwen3-1.7B). +It has been trained using [TRL](https://github.com/huggingface/trl). + +## Quick start + +```python +from transformers import pipeline + +question = "If you had a time machine, but could only go to the past or the future once and never return, which would you choose and why?" +generator = pipeline("text-generation", model="eventhorizon28/cadforge-grpo-Qwen3-1.7B", device="cuda") +output = generator([{"role": "user", "content": question}], max_new_tokens=128, return_full_text=False)[0] +print(output["generated_text"]) +``` + +## Training procedure + + +[Visualize in Trackio](https://eventhorizon28-cadforge-grpo-Qwen3-1.7B.hf.space?project=huggingface&runs=eventhorizon28-1777197565&sidebar=collapsed) + + +This model was trained with GRPO, a method introduced in [DeepSeekMath: Pushing the Limits of Mathematical Reasoning in Open Language Models](https://huggingface.co/papers/2402.03300). + +### Framework versions + +- TRL: 1.2.0 +- Transformers: 5.7.0.dev0 +- Pytorch: 2.8.0 +- Datasets: 4.8.4 +- Tokenizers: 0.22.2 + +## Citations + +Cite GRPO as: + +```bibtex +@article{shao2024deepseekmath, + title = {{DeepSeekMath: Pushing the Limits of Mathematical Reasoning in Open Language Models}}, + author = {Zhihong Shao and Peiyi Wang and Qihao Zhu and Runxin Xu and Junxiao Song and Mingchuan Zhang and Y. K. Li and Y. 
Wu and Daya Guo}, + year = 2024, + eprint = {arXiv:2402.03300}, +} +``` + +Cite TRL as: + +```bibtex +@software{vonwerra2020trl, + title = {{TRL: Transformers Reinforcement Learning}}, + author = {von Werra, Leandro and Belkada, Younes and Tunstall, Lewis and Beeching, Edward and Thrush, Tristan and Lambert, Nathan and Huang, Shengyi and Rasul, Kashif and Gallouédec, Quentin}, + license = {Apache-2.0}, + url = {https://github.com/huggingface/trl}, + year = {2020} +} +``` \ No newline at end of file diff --git a/chat_template.jinja b/chat_template.jinja new file mode 100644 index 0000000..01be9b3 --- /dev/null +++ b/chat_template.jinja @@ -0,0 +1,89 @@ +{%- if tools %} + {{- '<|im_start|>system\n' }} + {%- if messages[0].role == 'system' %} + {{- messages[0].content + '\n\n' }} + {%- endif %} + {{- "# Tools\n\nYou may call one or more functions to assist with the user query.\n\nYou are provided with function signatures within <tools></tools> XML tags:\n<tools>" }} + {%- for tool in tools %} + {{- "\n" }} + {{- tool | tojson }} + {%- endfor %} + {{- "\n</tools>\n\nFor each function call, return a json object with function name and arguments within <tool_call></tool_call> XML tags:\n<tool_call>\n{\"name\": <function-name>, \"arguments\": <args-json-object>}\n</tool_call><|im_end|>\n" }} +{%- else %} + {%- if messages[0].role == 'system' %} + {{- '<|im_start|>system\n' + messages[0].content + '<|im_end|>\n' }} + {%- endif %} +{%- endif %} +{%- set ns = namespace(multi_step_tool=true, last_query_index=messages|length - 1) %} +{%- for message in messages[::-1] %} + {%- set index = (messages|length - 1) - loop.index0 %} + {%- if ns.multi_step_tool and message.role == "user" and message.content is string and not(message.content.startswith('<tool_response>') and message.content.endswith('</tool_response>')) %} + {%- set ns.multi_step_tool = false %} + {%- set ns.last_query_index = index %} + {%- endif %} +{%- endfor %} +{%- for message in messages %} + {%- if message.content is string %} + {%- set content = message.content %} + {%- else %} + {%- set content = '' %} + {%- endif %} + {%- if (message.role == "user") 
or (message.role == "system" and not loop.first) %} + {{- '<|im_start|>' + message.role + '\n' + content + '<|im_end|>' + '\n' }} + {%- elif message.role == "assistant" %} + {%- set reasoning_content = '' %} + {%- if message.reasoning_content is string %} + {%- set reasoning_content = message.reasoning_content %} + {%- else %} + {%- if '</think>' in content %} + {%- set reasoning_content = content.split('</think>')[0].rstrip('\n').split('<think>')[-1].lstrip('\n') %} + {%- set content = content.split('</think>')[-1].lstrip('\n') %} + {%- endif %} + {%- endif %} + {%- if loop.index0 > ns.last_query_index %} + {%- if loop.last or (not loop.last and reasoning_content) %} + {{- '<|im_start|>' + message.role + '\n<think>\n' + reasoning_content.strip('\n') + '\n</think>\n\n' + content.lstrip('\n') }} + {%- else %} + {{- '<|im_start|>' + message.role + '\n' + content }} + {%- endif %} + {%- else %} + {{- '<|im_start|>' + message.role + '\n' + content }} + {%- endif %} + {%- if message.tool_calls %} + {%- for tool_call in message.tool_calls %} + {%- if (loop.first and content) or (not loop.first) %} + {{- '\n' }} + {%- endif %} + {%- if tool_call.function %} + {%- set tool_call = tool_call.function %} + {%- endif %} + {{- '<tool_call>\n{"name": "' }} + {{- tool_call.name }} + {{- '", "arguments": ' }} + {%- if tool_call.arguments is string %} + {{- tool_call.arguments }} + {%- else %} + {{- tool_call.arguments | tojson }} + {%- endif %} + {{- '}\n</tool_call>' }} + {%- endfor %} + {%- endif %} + {{- '<|im_end|>\n' }} + {%- elif message.role == "tool" %} + {%- if loop.first or (messages[loop.index0 - 1].role != "tool") %} + {{- '<|im_start|>user' }} + {%- endif %} + {{- '\n<tool_response>\n' }} + {{- content }} + {{- '\n</tool_response>' }} + {%- if loop.last or (messages[loop.index0 + 1].role != "tool") %} + {{- '<|im_end|>\n' }} + {%- endif %} + {%- endif %} +{%- endfor %} +{%- if add_generation_prompt %} + {{- '<|im_start|>assistant\n' }} + {%- if enable_thinking is defined and enable_thinking is false %} + {{- '<think>\n\n</think>\n\n' }} + {%- endif %} +{%- endif %} \ No newline at 
end of file diff --git a/completions/completions_00001.parquet b/completions/completions_00001.parquet new file mode 100644 index 0000000..fc27bbf --- /dev/null +++ b/completions/completions_00001.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29d168bbe02b531d00a3898090291b7ac8a6e366c0f50793d13c084bf65ea9ab +size 10380 diff --git a/completions/completions_00002.parquet b/completions/completions_00002.parquet new file mode 100644 index 0000000..fd4492b --- /dev/null +++ b/completions/completions_00002.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:164b22442c464059c3ad387ae2e604fa357005929b8aeab70d5e36cd78a0cbda +size 16670 diff --git a/completions/completions_00003.parquet b/completions/completions_00003.parquet new file mode 100644 index 0000000..76f05d9 --- /dev/null +++ b/completions/completions_00003.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f95591d239371409249301027e856abdf3ba42177612a3e711f135b94204c246 +size 11446 diff --git a/completions/completions_00004.parquet b/completions/completions_00004.parquet new file mode 100644 index 0000000..0fb6526 --- /dev/null +++ b/completions/completions_00004.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7768f19d0175e14fc36d3a78a92095bb33618fff2566d3e913502e3b3725a722 +size 12263 diff --git a/completions/completions_00005.parquet b/completions/completions_00005.parquet new file mode 100644 index 0000000..7f2a867 --- /dev/null +++ b/completions/completions_00005.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ae54b84c0ce883d9824d85b8a20a1e06d9b3704252557ddbec8fdd15d9ec3c5 +size 13318 diff --git a/completions/completions_00006.parquet b/completions/completions_00006.parquet new file mode 100644 index 0000000..5facd4e --- /dev/null +++ b/completions/completions_00006.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:015da04b5b6418162177e79c2f616a539a0994e9b6c31d914a43eeabd8a620de +size 10999 diff --git a/completions/completions_00007.parquet b/completions/completions_00007.parquet new file mode 100644 index 0000000..9660840 --- /dev/null +++ b/completions/completions_00007.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3387ea7e16edb45eceaf2fe5475fc98357c47bebd30aca003587af4e5764ac68 +size 15046 diff --git a/completions/completions_00008.parquet b/completions/completions_00008.parquet new file mode 100644 index 0000000..7a4020e --- /dev/null +++ b/completions/completions_00008.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8de9ac613e9267542f4763b7857fb79cf720e54e75080032928e2c796adb0a02 +size 13830 diff --git a/completions/completions_00009.parquet b/completions/completions_00009.parquet new file mode 100644 index 0000000..40737f6 --- /dev/null +++ b/completions/completions_00009.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:688ba1182b18f2adc16a7bb60eb68ea268e0b72cc5319743e88ce2d3da6de5f0 +size 9145 diff --git a/completions/completions_00010.parquet b/completions/completions_00010.parquet new file mode 100644 index 0000000..21aec46 --- /dev/null +++ b/completions/completions_00010.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1da2932509d08a4647141bd9f188d797294c05264a83a9952d5e6df42d5ec624 +size 11055 diff --git a/completions/completions_00011.parquet b/completions/completions_00011.parquet new file mode 100644 index 0000000..f1b3695 --- /dev/null +++ b/completions/completions_00011.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d1d39169119d2201ffa7255eafbe88fdb32f4dbd2f7e64a1d70a31d129d58f9 +size 13935 diff --git a/completions/completions_00012.parquet b/completions/completions_00012.parquet new file mode 100644 index 0000000..7715c08 --- /dev/null +++ b/completions/completions_00012.parquet @@ -0,0 +1,3 
@@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87f5ecab1e30be9f04c7aae4705cdd42f2b5e023c915e7e935e524abeb464bcd +size 13103 diff --git a/completions/completions_00013.parquet b/completions/completions_00013.parquet new file mode 100644 index 0000000..807ee1f --- /dev/null +++ b/completions/completions_00013.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fa4b7643ff7373328f763569fc0b7eccd7b411fe846a57f1acc719ef9fe21bc +size 13763 diff --git a/completions/completions_00014.parquet b/completions/completions_00014.parquet new file mode 100644 index 0000000..2c80b5a --- /dev/null +++ b/completions/completions_00014.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:383a13f545857ce52c1909b92786ff32e0fc1a2b0b6b348601d5a62da7c56ade +size 9259 diff --git a/completions/completions_00015.parquet b/completions/completions_00015.parquet new file mode 100644 index 0000000..bde276a --- /dev/null +++ b/completions/completions_00015.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6a8ef2a68099313de9c2c62cf8fa35f9fda022f3ede19304ce66d775ea69a63 +size 11477 diff --git a/completions/completions_00016.parquet b/completions/completions_00016.parquet new file mode 100644 index 0000000..54ebcc1 --- /dev/null +++ b/completions/completions_00016.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8447fd2403179741d98566320247271bee45cd7ee9ee7ea4cbebd02604864c5 +size 12742 diff --git a/completions/completions_00017.parquet b/completions/completions_00017.parquet new file mode 100644 index 0000000..f43141a --- /dev/null +++ b/completions/completions_00017.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f42b25f1d94a4d53394dd6821826a4213cb138c08b98b6ccc9ddd006215fa56 +size 14401 diff --git a/completions/completions_00018.parquet b/completions/completions_00018.parquet new file mode 100644 index 0000000..73c95f1 --- /dev/null +++ 
b/completions/completions_00018.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7200dd2bcdfc891e06edfa16e3798b4a8255ae33b0b67370f2e5860a231d3a9 +size 13418 diff --git a/completions/completions_00019.parquet b/completions/completions_00019.parquet new file mode 100644 index 0000000..4793565 --- /dev/null +++ b/completions/completions_00019.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ae478be552902a76783bc2b844e824e8104ba88696080026a30a31945b6b0c6 +size 13962 diff --git a/completions/completions_00020.parquet b/completions/completions_00020.parquet new file mode 100644 index 0000000..3bc35a6 --- /dev/null +++ b/completions/completions_00020.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dd231974c70961efe15d8767273a540dc02168d5b32e7c644798879459b92b1 +size 13457 diff --git a/completions/completions_00021.parquet b/completions/completions_00021.parquet new file mode 100644 index 0000000..d2768f9 --- /dev/null +++ b/completions/completions_00021.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3914a7fdd5b37040e61ac6793e37e3dab09fbd784f67ede29e1827c0858f474 +size 13838 diff --git a/completions/completions_00022.parquet b/completions/completions_00022.parquet new file mode 100644 index 0000000..bd1f7f7 --- /dev/null +++ b/completions/completions_00022.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7374bf355717a5c68f9514fc40d474e29d6493291ef65dbe416a5a56906fa0cb +size 14869 diff --git a/completions/completions_00023.parquet b/completions/completions_00023.parquet new file mode 100644 index 0000000..3ae18da --- /dev/null +++ b/completions/completions_00023.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76e4c2960cfccc5246200268d8607f677125642bb4b36d93112792fcd83d625e +size 12877 diff --git a/completions/completions_00024.parquet b/completions/completions_00024.parquet new file 
mode 100644 index 0000000..f79ed05 --- /dev/null +++ b/completions/completions_00024.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b76c30af6405323f6459a781760943373b9ce786c31c51ba891217694a1f7331 +size 13684 diff --git a/completions/completions_00025.parquet b/completions/completions_00025.parquet new file mode 100644 index 0000000..12fcd6e --- /dev/null +++ b/completions/completions_00025.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fb5dbf36afbb3dc2e26ea7aea8bf3fadcd558b9a17f49ba37fc40078f114515 +size 11339 diff --git a/completions/completions_00026.parquet b/completions/completions_00026.parquet new file mode 100644 index 0000000..e29378c --- /dev/null +++ b/completions/completions_00026.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8950ed6a1b603667f4a4ffe4c824f47a8f135c2b0ef2d9c5406d5ed525d17106 +size 15189 diff --git a/completions/completions_00027.parquet b/completions/completions_00027.parquet new file mode 100644 index 0000000..1c8bf37 --- /dev/null +++ b/completions/completions_00027.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b08ce1979cba1f9252100aff4fb5e1efbf2ee33e660a33d93b945c720a566d09 +size 14639 diff --git a/completions/completions_00028.parquet b/completions/completions_00028.parquet new file mode 100644 index 0000000..9a5e7d8 --- /dev/null +++ b/completions/completions_00028.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7ecdbaa3c699257e38b0e4abf436ae2c692f775e2993a83665a272cb56dccec +size 13694 diff --git a/completions/completions_00029.parquet b/completions/completions_00029.parquet new file mode 100644 index 0000000..714c530 --- /dev/null +++ b/completions/completions_00029.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7dd7500152d38ba2b91a0c11529a0a50b34df8f3edd3ba6731f634c204051b9 +size 12554 diff --git 
a/completions/completions_00030.parquet b/completions/completions_00030.parquet new file mode 100644 index 0000000..999e1cb --- /dev/null +++ b/completions/completions_00030.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b5df92a199dee08917a1fba275c4f5293c0664508711f10ef13674247f8b5e8 +size 13167 diff --git a/completions/completions_00031.parquet b/completions/completions_00031.parquet new file mode 100644 index 0000000..9cc07ff --- /dev/null +++ b/completions/completions_00031.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:056b2abd4ad3cff38bb315da108064d04ee846b508d509d8afff0263050fc178 +size 12380 diff --git a/completions/completions_00032.parquet b/completions/completions_00032.parquet new file mode 100644 index 0000000..7eabcee --- /dev/null +++ b/completions/completions_00032.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd4d12f4daaad1183cc1f3572e17c76beabeded350ef22e9b391c67f0705e44b +size 13149 diff --git a/completions/completions_00033.parquet b/completions/completions_00033.parquet new file mode 100644 index 0000000..fe7d89d --- /dev/null +++ b/completions/completions_00033.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2271050008989ffdb0630b25232e396977e18b5c2f416bdcaa8c724407328102 +size 12949 diff --git a/completions/completions_00034.parquet b/completions/completions_00034.parquet new file mode 100644 index 0000000..66cccc4 --- /dev/null +++ b/completions/completions_00034.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12d74f2c88213da97743ea5612d9cbc7d77ec63b5a78d92f14963a2f2994724e +size 12630 diff --git a/completions/completions_00035.parquet b/completions/completions_00035.parquet new file mode 100644 index 0000000..e1d1e06 --- /dev/null +++ b/completions/completions_00035.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:f7202705dbcbeda3a910583381c43579b8b2a32766063be8904ba4fecd00d0bf +size 13310 diff --git a/completions/completions_00036.parquet b/completions/completions_00036.parquet new file mode 100644 index 0000000..475c2fc --- /dev/null +++ b/completions/completions_00036.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:226f1ca1e16d9eb27d075c178815d34835d95dfefcfa5fdb4e23a7cead7fb6d8 +size 11494 diff --git a/completions/completions_00037.parquet b/completions/completions_00037.parquet new file mode 100644 index 0000000..6ea6179 --- /dev/null +++ b/completions/completions_00037.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94859de31d641b671deba29f649609c9718d5e423b02ff55694f5a9b268b2416 +size 13021 diff --git a/completions/completions_00038.parquet b/completions/completions_00038.parquet new file mode 100644 index 0000000..874bbec --- /dev/null +++ b/completions/completions_00038.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2dd8be427915a3887a7a1f5e01a8a2bb118bd25e9d18ed0661c76b790ff6bda +size 15063 diff --git a/completions/completions_00039.parquet b/completions/completions_00039.parquet new file mode 100644 index 0000000..b49415e --- /dev/null +++ b/completions/completions_00039.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:003c361a8ca944463629f8a914de52e71a7800f22bdd6d22d330f6dff132860f +size 13453 diff --git a/completions/completions_00040.parquet b/completions/completions_00040.parquet new file mode 100644 index 0000000..07e255a --- /dev/null +++ b/completions/completions_00040.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df52457366da6fa7dceb0b5ea9d550fdd308552cfdd755787be62ca333968a09 +size 13924 diff --git a/completions/completions_00041.parquet b/completions/completions_00041.parquet new file mode 100644 index 0000000..bab22de --- /dev/null +++ b/completions/completions_00041.parquet @@ -0,0 +1,3 
@@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d00422bbf4a13a6e2b69fce14de534016e30c27134035dbb1a993b7f92da88bb +size 13210 diff --git a/completions/completions_00042.parquet b/completions/completions_00042.parquet new file mode 100644 index 0000000..e7e0ff8 --- /dev/null +++ b/completions/completions_00042.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f692493bfa872a6fd080d7d25549d1e576f628a6e0defcfe48c924f20a6790a +size 12426 diff --git a/completions/completions_00043.parquet b/completions/completions_00043.parquet new file mode 100644 index 0000000..85ed345 --- /dev/null +++ b/completions/completions_00043.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:949e194312c28d98145d7e58ce757d374c6b10bdd7ea332c212d7c928e376d94 +size 12756 diff --git a/completions/completions_00044.parquet b/completions/completions_00044.parquet new file mode 100644 index 0000000..e29ea03 --- /dev/null +++ b/completions/completions_00044.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c9814b1e311a0b2006bf6e55bdf89b32054adf0d0335ed7635b341c360e4fda +size 15387 diff --git a/completions/completions_00045.parquet b/completions/completions_00045.parquet new file mode 100644 index 0000000..f894c1c --- /dev/null +++ b/completions/completions_00045.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cea1241984dc5e73db91c7c44e67eec4b1b86990f1f2efe39dcef1ccd3f3da5 +size 11264 diff --git a/completions/completions_00046.parquet b/completions/completions_00046.parquet new file mode 100644 index 0000000..8f94d5f --- /dev/null +++ b/completions/completions_00046.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2be4effe7ea7d70efcf1b39299d33c59d1d480961753008f0f253ba1a0379778 +size 15357 diff --git a/completions/completions_00047.parquet b/completions/completions_00047.parquet new file mode 100644 index 0000000..a49d8c0 --- /dev/null +++ 
b/completions/completions_00047.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93e45d4ee82d5c8989bc600a589d6a514bfb83443830805a0e3bb150ab790108 +size 14468 diff --git a/completions/completions_00048.parquet b/completions/completions_00048.parquet new file mode 100644 index 0000000..59e0615 --- /dev/null +++ b/completions/completions_00048.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58700f0e88bc141ecff4e35c34a9ae38b4211ab4c483e82074f73b1f63d2b3fa +size 11206 diff --git a/completions/completions_00049.parquet b/completions/completions_00049.parquet new file mode 100644 index 0000000..79c78c0 --- /dev/null +++ b/completions/completions_00049.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cab183d20a939e38a6929fb1e474262c4fccdc09f6580d9074ca2bcd3c7ee17 +size 13377 diff --git a/completions/completions_00050.parquet b/completions/completions_00050.parquet new file mode 100644 index 0000000..8a51436 --- /dev/null +++ b/completions/completions_00050.parquet @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43b684834bf557b6289b727cf154bf3c49805790de506de1dfa3e321c8021fae +size 14240 diff --git a/config.json b/config.json new file mode 100644 index 0000000..a59d6e2 --- /dev/null +++ b/config.json @@ -0,0 +1,63 @@ +{ + "architectures": [ + "Qwen3ForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "bos_token_id": null, + "dtype": "float32", + "eos_token_id": 151645, + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 2048, + "initializer_range": 0.02, + "intermediate_size": 6144, + "layer_types": [ + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + 
"full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention" + ], + "max_position_embeddings": 40960, + "max_window_layers": 28, + "model_type": "qwen3", + "num_attention_heads": 16, + "num_hidden_layers": 28, + "num_key_value_heads": 8, + "pad_token_id": 151643, + "rms_norm_eps": 1e-06, + "rope_parameters": { + "rope_theta": 1000000, + "rope_type": "default" + }, + "sliding_window": null, + "tie_word_embeddings": true, + "transformers_version": "5.7.0.dev0", + "use_cache": false, + "use_sliding_window": false, + "vocab_size": 151936 +} diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000..9787484 --- /dev/null +++ b/generation_config.json @@ -0,0 +1,12 @@ +{ + "do_sample": true, + "eos_token_id": [ + 151645, + 151643 + ], + "pad_token_id": 151643, + "temperature": 0.6, + "top_k": 20, + "top_p": 0.95, + "transformers_version": "5.7.0.dev0" +} diff --git a/model.safetensors b/model.safetensors new file mode 100644 index 0000000..4307640 --- /dev/null +++ b/model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:188780cf8cb6b1294d50e09593d60ecb4cf640f4da7d834eeaa2c303b6f207e1 +size 6882335328 diff --git a/tokenizer.json b/tokenizer.json new file mode 100644 index 0000000..c7afbed --- /dev/null +++ b/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be75606093db2094d7cd20f3c2f385c212750648bd6ea4fb2bf507a6a4c55506 +size 11422650 diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 0000000..af5f35b --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1,75 @@ +{ + "add_prefix_space": false, + "backend": "tokenizers", + "bos_token": null, + "clean_up_tokenization_spaces": false, + "eos_token": "<|im_end|>", + "errors": "replace", + "extra_special_tokens": [ 
+ "<|im_start|>", + "<|im_end|>", + "<|object_ref_start|>", + "<|object_ref_end|>", + "<|box_start|>", + "<|box_end|>", + "<|quad_start|>", + "<|quad_end|>", + "<|vision_start|>", + "<|vision_end|>", + "<|vision_pad|>", + "<|image_pad|>", + "<|video_pad|>" + ], + "is_local": false, + "local_files_only": false, + "model_max_length": 131072, + "pad_token": "<|endoftext|>", + "padding_side": "left", + "response_schema": { + "properties": { + "content": { + "type": "string" + }, + "reasoning_content": { + "type": "string" + }, + "role": { + "const": "assistant" + }, + "tool_calls": { + "items": { + "properties": { + "function": { + "properties": { + "arguments": { + "additionalProperties": {}, + "type": "object" + }, + "name": { + "type": "string" + } + }, + "type": "object" + }, + "type": { + "const": "function" + } + }, + "type": "object", + "x-parser": "json", + "x-parser-args": { + "transform": "{type: 'function', function: @}" + } + }, + "type": "array", + "x-regex-iterator": "<tool_call>\\s*(.+?)\\s*</tool_call>" + } + }, + "type": "object", + "x-regex": "^(?:<think>\\n?(?:(?P<reasoning_content>.*?\\S.*?)\\n?|[\\s]*)</think>\\s*)?(?P<content>.*?)(?:\\n(?=<tool_call>))?(?=(?:<tool_call>|<\\|im_end\\|>|$))(?P<tool_calls>(?:<tool_call>.+?</tool_call>\\s*)+)?\\s*(?:<\\|im_end\\|>|$)" + }, + "split_special_tokens": false, + "tokenizer_class": "Qwen2Tokenizer", + "truncation_side": "left", + "unk_token": null +} diff --git a/training_args.bin b/training_args.bin new file mode 100644 index 0000000..93d3fff --- /dev/null +++ b/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e1153ef6b3a156ebfad3dd3aa112c057874f0b3037b3c21a5fd20f367f9cfa0 +size 7185