Model: Hyeongwon/PS_only_answer_Qwen3-4B-Base_0328-01-1e-5-seed43 Source: Original Platform
9 lines
231 B
JSON
9 lines
231 B
JSON
{
    "epoch": 6.0,
    "total_flos": 475851760140288.0,
    "train_loss": 0.4284659847488502,
    "train_runtime": 50380.648,
    "train_samples": 18626,
    "train_samples_per_second": 2.218,
    "train_steps_per_second": 0.011
}