Model: ali-elganzory/1.7b-MixtureVitae-web_curated-100BT-longsft_16k-SFT-Tulu3-decontaminated Source: Original Platform
8 lines
219 B
JSON
8 lines
219 B
JSON
{
|
|
"total_flos": 2.19812273324032e+16,
|
|
"train_loss": 0.2031160936633208,
|
|
"train_runtime": 9356.8224,
|
|
"train_samples": 936509,
|
|
"train_samples_per_second": 200.177,
|
|
"train_steps_per_second": 1.564
|
|
} |