Model: ali-elganzory/Baguettotron-longsft_16k-SFT-Tulu3-decontaminated Source: Original Platform
8 lines
217 B
JSON
8 lines
217 B
JSON
{
|
|
"total_flos": 2710644215513088.0,
|
|
"train_loss": 1.6633207928015101,
|
|
"train_runtime": 25736.6854,
|
|
"train_samples": 936509,
|
|
"train_samples_per_second": 72.776,
|
|
"train_steps_per_second": 0.569
|
|
} |