Model: xd2010/Qwen1.5-MOE-aux-free-sft-math7k-1e-3-gamma-part2-test Source: Original Platform
8 lines
216 B
JSON
8 lines
216 B
JSON
{
|
|
"total_flos": 2.0144468407196058e+17,
|
|
"train_loss": 0.17723823002604552,
|
|
"train_runtime": 1262.477,
|
|
"train_samples": 6851,
|
|
"train_samples_per_second": 5.427,
|
|
"train_steps_per_second": 0.17
|
|
} |