Model: xd2010/OLMoE-1B-7B-0125-sft-math7k-2epochs-frozen-router Source: Original Platform
8 lines
210 B
JSON
8 lines
210 B
JSON
{
  "total_flos": 6812915466240.0,
  "train_loss": 0.3203352055983779,
  "train_runtime": 2102.8589,
  "train_samples": 6851,
  "train_samples_per_second": 9.774,
  "train_steps_per_second": 0.077
}