Model: mlfoundations-dev/openthoughts3_100k_qwen25_1b_bsz256_lr2e5_epochs7 Source: Original Platform
8 lines
204 B
JSON
8 lines
204 B
JSON
{
    "epoch": 7.0,
    "total_flos": 9969287656374272.0,
    "train_loss": 1.063590354692078,
    "train_runtime": 97730.0822,
    "train_samples_per_second": 7.163,
    "train_steps_per_second": 0.028
}