Model: ali-elganzory/open-sci-ref-v0.02-1.7b-nemotron-hq-300B-16k-SFT-Tulu3-decontaminated Source: Original Platform
8 lines
219 B
JSON
8 lines
219 B
JSON
{
|
|
"total_flos": 2.197196595737395e+16,
|
|
"train_loss": 0.7360902870387283,
|
|
"train_runtime": 33470.8922,
|
|
"train_samples": 936509,
|
|
"train_samples_per_second": 55.96,
|
|
"train_steps_per_second": 0.437
|
|
} |