初始化项目,由ModelHub XC社区提供模型
Model: agarwalanu3103/clarify-rl-grpo-qwen3-1-7b Source: Original Platform
This commit is contained in:
15
training_summary.json
Normal file
15
training_summary.json
Normal file
@@ -0,0 +1,15 @@
|
||||
{
|
||||
"model": "Qwen/Qwen3-1.7B",
|
||||
"max_steps": 400,
|
||||
"num_generations": 8,
|
||||
"vllm_gpu_memory_utilization": 0.55,
|
||||
"max_completion_length": 1536,
|
||||
"train_seconds": 3238.236308813095,
|
||||
"stats": "TrainOutput(global_step=400, training_loss=0.018298895093612374, metrics={'train_runtime': 3189.1606, 'train_samples_per_second': 1.003, 'train_steps_per_second': 0.125, 'total_flos': 0.0, 'train_loss': 0.018298895093612374})",
|
||||
"failed": false,
|
||||
"failure_reason": "",
|
||||
"output_dir": "clarify-rl-grpo-qwen3-1-7b",
|
||||
"trackio_space_id": "clarify-rl-grpo-qwen3-1-7b",
|
||||
"num_log_entries": 401,
|
||||
"smoke_test": false
|
||||
}
|
||||
Reference in New Issue
Block a user