Model: mlfoundations-dev/openthoughts3_100k_qwen25_1b_bsz1024_lr16e5_epochs5 Source: Original Platform
8 lines
217 B
JSON
8 lines
217 B
JSON
{
  "epoch": 4.961636828644501,
  "total_flos": 7065760181780480.0,
  "train_loss": 1.075610858509221,
  "train_runtime": 69151.8205,
  "train_samples_per_second": 7.23,
  "train_steps_per_second": 0.007
}