Model: mlfoundations-dev/openthoughts3_100k_qwen25_1b_bsz256_lr16e5_epochs5 Source: Original Platform
8 lines
206 B
JSON
{
    "epoch": 5.0,
    "total_flos": 7122204608430080.0,
    "train_loss": 1.0036099467436066,
    "train_runtime": 36219.8634,
    "train_samples_per_second": 13.805,
    "train_steps_per_second": 0.054
}