131 lines
2.8 KiB
JSON
131 lines
2.8 KiB
JSON
{
|
|
"best_metric": null,
|
|
"best_model_checkpoint": null,
|
|
"epoch": 13.791738382099828,
|
|
"global_step": 2000,
|
|
"is_hyper_param_search": false,
|
|
"is_local_process_zero": true,
|
|
"is_world_process_zero": true,
|
|
"log_history": [
|
|
{
|
|
"epoch": 1.03,
|
|
"learning_rate": 9.99965514863094e-07,
|
|
"loss": 0.0333,
|
|
"step": 150
|
|
},
|
|
{
|
|
"epoch": 2.07,
|
|
"learning_rate": 9.99862059452376e-07,
|
|
"loss": 0.0332,
|
|
"step": 300
|
|
},
|
|
{
|
|
"epoch": 3.1,
|
|
"learning_rate": 9.99758604041658e-07,
|
|
"loss": 0.0336,
|
|
"step": 450
|
|
},
|
|
{
|
|
"epoch": 3.45,
|
|
"eval_loss": 0.21229705214500427,
|
|
"eval_runtime": 487.1939,
|
|
"eval_samples_per_second": 10.649,
|
|
"eval_steps_per_second": 1.332,
|
|
"eval_wer": 0.1448122092799754,
|
|
"step": 500
|
|
},
|
|
{
|
|
"epoch": 4.14,
|
|
"learning_rate": 9.9965514863094e-07,
|
|
"loss": 0.0329,
|
|
"step": 600
|
|
},
|
|
{
|
|
"epoch": 5.17,
|
|
"learning_rate": 9.995516932202221e-07,
|
|
"loss": 0.0323,
|
|
"step": 750
|
|
},
|
|
{
|
|
"epoch": 6.21,
|
|
"learning_rate": 9.99448237809504e-07,
|
|
"loss": 0.0317,
|
|
"step": 900
|
|
},
|
|
{
|
|
"epoch": 6.9,
|
|
"eval_loss": 0.20801204442977905,
|
|
"eval_runtime": 282.77,
|
|
"eval_samples_per_second": 18.347,
|
|
"eval_steps_per_second": 2.295,
|
|
"eval_wer": 0.14550417099142737,
|
|
"step": 1000
|
|
},
|
|
{
|
|
"epoch": 7.24,
|
|
"learning_rate": 9.993454721015242e-07,
|
|
"loss": 0.0323,
|
|
"step": 1050
|
|
},
|
|
{
|
|
"epoch": 8.28,
|
|
"learning_rate": 9.992420166908062e-07,
|
|
"loss": 0.031,
|
|
"step": 1200
|
|
},
|
|
{
|
|
"epoch": 9.31,
|
|
"learning_rate": 9.991385612800883e-07,
|
|
"loss": 0.0314,
|
|
"step": 1350
|
|
},
|
|
{
|
|
"epoch": 10.34,
|
|
"learning_rate": 9.990351058693703e-07,
|
|
"loss": 0.0317,
|
|
"step": 1500
|
|
},
|
|
{
|
|
"epoch": 10.34,
|
|
"eval_loss": 0.2071654200553894,
|
|
"eval_runtime": 303.1157,
|
|
"eval_samples_per_second": 17.116,
|
|
"eval_steps_per_second": 2.141,
|
|
"eval_wer": 0.14465844001076386,
|
|
"step": 1500
|
|
},
|
|
{
|
|
"epoch": 11.38,
|
|
"learning_rate": 9.989316504586522e-07,
|
|
"loss": 0.031,
|
|
"step": 1650
|
|
},
|
|
{
|
|
"epoch": 12.41,
|
|
"learning_rate": 9.988281950479342e-07,
|
|
"loss": 0.0318,
|
|
"step": 1800
|
|
},
|
|
{
|
|
"epoch": 13.45,
|
|
"learning_rate": 9.987247396372162e-07,
|
|
"loss": 0.0314,
|
|
"step": 1950
|
|
},
|
|
{
|
|
"epoch": 13.79,
|
|
"eval_loss": 0.20706616342067719,
|
|
"eval_runtime": 287.3918,
|
|
"eval_samples_per_second": 18.052,
|
|
"eval_steps_per_second": 2.258,
|
|
"eval_wer": 0.1442355745204321,
|
|
"step": 2000
|
|
}
|
|
],
|
|
"max_steps": 1450000,
|
|
"num_train_epochs": 10000,
|
|
"total_flos": 5.652539665735567e+19,
|
|
"trial_name": null,
|
|
"trial_params": null
|
|
}
|