Model: ali-elganzory/Baguettotron-longsft_16k-DPO-Tulu3-decontaminated Source: Original Platform
9 lines
216 B
JSON
9 lines
216 B
JSON
{
|
|
"epoch": 1.0,
|
|
"total_flos": 0.0,
|
|
"train_loss": 4.194636241930751,
|
|
"train_runtime": 7092.6143,
|
|
"train_samples": 272585,
|
|
"train_samples_per_second": 38.432,
|
|
"train_steps_per_second": 0.3
|
|
} |