Model: laion/nemosci-tasrep-a1mfc-gfistaqc-dev1-scaff-maxeps-swes-r2eg__Qwen3-8B Source: Original Platform
16 lines
541 B
JSON
16 lines
541 B
JSON
{
|
|
"achieved_tflops_per_gpu": 20.323151459284283,
|
|
"achieved_tflops_per_gpu_theoretical": 741.9510992582738,
|
|
"epoch": 5.0,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.21446937322616577,
|
|
"mfu_percent": 1.436265120797476,
|
|
"mfu_percent_theoretical": 52.4347066613621,
|
|
"total_flos": 1.3771174172166193e+19,
|
|
"train_loss": 0.058854675498723724,
|
|
"train_runtime": 21175.3179,
|
|
"train_samples_per_second": 21.0,
|
|
"train_steps_per_second": 0.219,
|
|
"valid_targets_mean": 6732.3,
|
|
"valid_targets_min": 192
|
|
} |