Model: mlfoundations-dev/openthoughts3_100k_qwen25_1b_bsz512_lr4e5_epochs5 Source: Original Platform
8 lines
220 B
JSON
8 lines
220 B
JSON
{
|
|
"epoch": 4.987212276214834,
|
|
"total_flos": 7100358600687616.0,
|
|
"train_loss": 1.0860105241261995,
|
|
"train_runtime": 35157.9071,
|
|
"train_samples_per_second": 14.222,
|
|
"train_steps_per_second": 0.028
|
|
} |