617 lines
14 KiB
JSON
617 lines
14 KiB
JSON
|
|
{
|
||
|
|
"best_metric": 0.472552783109405,
|
||
|
|
"best_model_checkpoint": "/content/drive/MyDrive/new_dataset/wav2vec2-large-xlsr-53-thai-finetune/checkpoint-500",
|
||
|
|
"epoch": 99.98765432098766,
|
||
|
|
"global_step": 2000,
|
||
|
|
"is_hyper_param_search": false,
|
||
|
|
"is_local_process_zero": true,
|
||
|
|
"is_world_process_zero": true,
|
||
|
|
"log_history": [
|
||
|
|
{
|
||
|
|
"epoch": 2.49,
|
||
|
|
"learning_rate": 0.0001,
|
||
|
|
"loss": 1.9911,
|
||
|
|
"step": 50
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 2.49,
|
||
|
|
"eval_loss": 1.2750070095062256,
|
||
|
|
"eval_runtime": 34.892,
|
||
|
|
"eval_samples_per_second": 12.238,
|
||
|
|
"eval_steps_per_second": 0.774,
|
||
|
|
"eval_wer": 0.6767754318618042,
|
||
|
|
"step": 50
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 4.99,
|
||
|
|
"learning_rate": 9.743589743589744e-05,
|
||
|
|
"loss": 1.2107,
|
||
|
|
"step": 100
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 4.99,
|
||
|
|
"eval_loss": 1.1088056564331055,
|
||
|
|
"eval_runtime": 34.7796,
|
||
|
|
"eval_samples_per_second": 12.277,
|
||
|
|
"eval_steps_per_second": 0.776,
|
||
|
|
"eval_wer": 0.5927063339731286,
|
||
|
|
"step": 100
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 7.49,
|
||
|
|
"learning_rate": 9.487179487179487e-05,
|
||
|
|
"loss": 0.9686,
|
||
|
|
"step": 150
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 7.49,
|
||
|
|
"eval_loss": 1.0476980209350586,
|
||
|
|
"eval_runtime": 34.6203,
|
||
|
|
"eval_samples_per_second": 12.334,
|
||
|
|
"eval_steps_per_second": 0.78,
|
||
|
|
"eval_wer": 0.5712092130518234,
|
||
|
|
"step": 150
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 9.99,
|
||
|
|
"learning_rate": 9.230769230769232e-05,
|
||
|
|
"loss": 0.7504,
|
||
|
|
"step": 200
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 9.99,
|
||
|
|
"eval_loss": 1.0640665292739868,
|
||
|
|
"eval_runtime": 34.843,
|
||
|
|
"eval_samples_per_second": 12.255,
|
||
|
|
"eval_steps_per_second": 0.775,
|
||
|
|
"eval_wer": 0.5504798464491363,
|
||
|
|
"step": 200
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 12.49,
|
||
|
|
"learning_rate": 8.974358974358975e-05,
|
||
|
|
"loss": 0.6352,
|
||
|
|
"step": 250
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 12.49,
|
||
|
|
"eval_loss": 1.095747709274292,
|
||
|
|
"eval_runtime": 33.9281,
|
||
|
|
"eval_samples_per_second": 12.585,
|
||
|
|
"eval_steps_per_second": 0.796,
|
||
|
|
"eval_wer": 0.5324376199616123,
|
||
|
|
"step": 250
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 14.99,
|
||
|
|
"learning_rate": 8.717948717948718e-05,
|
||
|
|
"loss": 0.5313,
|
||
|
|
"step": 300
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 14.99,
|
||
|
|
"eval_loss": 1.0491594076156616,
|
||
|
|
"eval_runtime": 33.7693,
|
||
|
|
"eval_samples_per_second": 12.645,
|
||
|
|
"eval_steps_per_second": 0.8,
|
||
|
|
"eval_wer": 0.5163147792706334,
|
||
|
|
"step": 300
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 17.49,
|
||
|
|
"learning_rate": 8.461538461538461e-05,
|
||
|
|
"loss": 0.4461,
|
||
|
|
"step": 350
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 17.49,
|
||
|
|
"eval_loss": 1.0721960067749023,
|
||
|
|
"eval_runtime": 33.9128,
|
||
|
|
"eval_samples_per_second": 12.591,
|
||
|
|
"eval_steps_per_second": 0.796,
|
||
|
|
"eval_wer": 0.5124760076775432,
|
||
|
|
"step": 350
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 19.99,
|
||
|
|
"learning_rate": 8.205128205128205e-05,
|
||
|
|
"loss": 0.4094,
|
||
|
|
"step": 400
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 19.99,
|
||
|
|
"eval_loss": 1.057926058769226,
|
||
|
|
"eval_runtime": 34.0347,
|
||
|
|
"eval_samples_per_second": 12.546,
|
||
|
|
"eval_steps_per_second": 0.793,
|
||
|
|
"eval_wer": 0.49750479846449136,
|
||
|
|
"step": 400
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 22.49,
|
||
|
|
"learning_rate": 7.948717948717948e-05,
|
||
|
|
"loss": 0.3467,
|
||
|
|
"step": 450
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 22.49,
|
||
|
|
"eval_loss": 1.0208101272583008,
|
||
|
|
"eval_runtime": 34.3752,
|
||
|
|
"eval_samples_per_second": 12.422,
|
||
|
|
"eval_steps_per_second": 0.785,
|
||
|
|
"eval_wer": 0.491362763915547,
|
||
|
|
"step": 450
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 24.99,
|
||
|
|
"learning_rate": 7.692307692307693e-05,
|
||
|
|
"loss": 0.3195,
|
||
|
|
"step": 500
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 24.99,
|
||
|
|
"eval_loss": 1.0337833166122437,
|
||
|
|
"eval_runtime": 33.8794,
|
||
|
|
"eval_samples_per_second": 12.604,
|
||
|
|
"eval_steps_per_second": 0.797,
|
||
|
|
"eval_wer": 0.472552783109405,
|
||
|
|
"step": 500
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 27.49,
|
||
|
|
"learning_rate": 7.435897435897436e-05,
|
||
|
|
"loss": 0.3005,
|
||
|
|
"step": 550
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 27.49,
|
||
|
|
"eval_loss": 1.0594605207443237,
|
||
|
|
"eval_runtime": 33.9955,
|
||
|
|
"eval_samples_per_second": 12.56,
|
||
|
|
"eval_steps_per_second": 0.794,
|
||
|
|
"eval_wer": 0.47946257197696734,
|
||
|
|
"step": 550
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 29.99,
|
||
|
|
"learning_rate": 7.17948717948718e-05,
|
||
|
|
"loss": 0.2933,
|
||
|
|
"step": 600
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 29.99,
|
||
|
|
"eval_loss": 1.017477035522461,
|
||
|
|
"eval_runtime": 33.8622,
|
||
|
|
"eval_samples_per_second": 12.61,
|
||
|
|
"eval_steps_per_second": 0.797,
|
||
|
|
"eval_wer": 0.472936660268714,
|
||
|
|
"step": 600
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 32.49,
|
||
|
|
"learning_rate": 6.923076923076924e-05,
|
||
|
|
"loss": 0.2601,
|
||
|
|
"step": 650
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 32.49,
|
||
|
|
"eval_loss": 1.099133014678955,
|
||
|
|
"eval_runtime": 34.4437,
|
||
|
|
"eval_samples_per_second": 12.397,
|
||
|
|
"eval_steps_per_second": 0.784,
|
||
|
|
"eval_wer": 0.4652591170825336,
|
||
|
|
"step": 650
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 34.99,
|
||
|
|
"learning_rate": 6.666666666666667e-05,
|
||
|
|
"loss": 0.2226,
|
||
|
|
"step": 700
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 34.99,
|
||
|
|
"eval_loss": 1.1290050745010376,
|
||
|
|
"eval_runtime": 34.6356,
|
||
|
|
"eval_samples_per_second": 12.328,
|
||
|
|
"eval_steps_per_second": 0.78,
|
||
|
|
"eval_wer": 0.47063339731285986,
|
||
|
|
"step": 700
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 37.49,
|
||
|
|
"learning_rate": 6.410256410256412e-05,
|
||
|
|
"loss": 0.2262,
|
||
|
|
"step": 750
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 37.49,
|
||
|
|
"eval_loss": 1.0954631567001343,
|
||
|
|
"eval_runtime": 35.3666,
|
||
|
|
"eval_samples_per_second": 12.074,
|
||
|
|
"eval_steps_per_second": 0.763,
|
||
|
|
"eval_wer": 0.45681381957773515,
|
||
|
|
"step": 750
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 39.99,
|
||
|
|
"learning_rate": 6.153846153846155e-05,
|
||
|
|
"loss": 0.2236,
|
||
|
|
"step": 800
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 39.99,
|
||
|
|
"eval_loss": 1.1119202375411987,
|
||
|
|
"eval_runtime": 35.0365,
|
||
|
|
"eval_samples_per_second": 12.187,
|
||
|
|
"eval_steps_per_second": 0.771,
|
||
|
|
"eval_wer": 0.4491362763915547,
|
||
|
|
"step": 800
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 42.49,
|
||
|
|
"learning_rate": 5.897435897435898e-05,
|
||
|
|
"loss": 0.2029,
|
||
|
|
"step": 850
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 42.49,
|
||
|
|
"eval_loss": 1.1375640630722046,
|
||
|
|
"eval_runtime": 35.2676,
|
||
|
|
"eval_samples_per_second": 12.107,
|
||
|
|
"eval_steps_per_second": 0.766,
|
||
|
|
"eval_wer": 0.45220729366602685,
|
||
|
|
"step": 850
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 44.99,
|
||
|
|
"learning_rate": 5.6410256410256414e-05,
|
||
|
|
"loss": 0.1876,
|
||
|
|
"step": 900
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 44.99,
|
||
|
|
"eval_loss": 1.142003059387207,
|
||
|
|
"eval_runtime": 35.6836,
|
||
|
|
"eval_samples_per_second": 11.966,
|
||
|
|
"eval_steps_per_second": 0.757,
|
||
|
|
"eval_wer": 0.4476007677543186,
|
||
|
|
"step": 900
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 47.49,
|
||
|
|
"learning_rate": 5.384615384615385e-05,
|
||
|
|
"loss": 0.1733,
|
||
|
|
"step": 950
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 47.49,
|
||
|
|
"eval_loss": 1.1137712001800537,
|
||
|
|
"eval_runtime": 34.9014,
|
||
|
|
"eval_samples_per_second": 12.234,
|
||
|
|
"eval_steps_per_second": 0.774,
|
||
|
|
"eval_wer": 0.44337811900191937,
|
||
|
|
"step": 950
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 49.99,
|
||
|
|
"learning_rate": 5.128205128205128e-05,
|
||
|
|
"loss": 0.161,
|
||
|
|
"step": 1000
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 49.99,
|
||
|
|
"eval_loss": 1.195468783378601,
|
||
|
|
"eval_runtime": 35.1209,
|
||
|
|
"eval_samples_per_second": 12.158,
|
||
|
|
"eval_steps_per_second": 0.769,
|
||
|
|
"eval_wer": 0.44798464491362766,
|
||
|
|
"step": 1000
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 52.49,
|
||
|
|
"learning_rate": 4.871794871794872e-05,
|
||
|
|
"loss": 0.1661,
|
||
|
|
"step": 1050
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 52.49,
|
||
|
|
"eval_loss": 1.1598896980285645,
|
||
|
|
"eval_runtime": 34.8413,
|
||
|
|
"eval_samples_per_second": 12.256,
|
||
|
|
"eval_steps_per_second": 0.775,
|
||
|
|
"eval_wer": 0.44606525911708256,
|
||
|
|
"step": 1050
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 54.99,
|
||
|
|
"learning_rate": 4.615384615384616e-05,
|
||
|
|
"loss": 0.1533,
|
||
|
|
"step": 1100
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 54.99,
|
||
|
|
"eval_loss": 1.143904447555542,
|
||
|
|
"eval_runtime": 34.3532,
|
||
|
|
"eval_samples_per_second": 12.43,
|
||
|
|
"eval_steps_per_second": 0.786,
|
||
|
|
"eval_wer": 0.4383877159309021,
|
||
|
|
"step": 1100
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 57.49,
|
||
|
|
"learning_rate": 4.358974358974359e-05,
|
||
|
|
"loss": 0.1565,
|
||
|
|
"step": 1150
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 57.49,
|
||
|
|
"eval_loss": 1.1354175806045532,
|
||
|
|
"eval_runtime": 34.4974,
|
||
|
|
"eval_samples_per_second": 12.378,
|
||
|
|
"eval_steps_per_second": 0.783,
|
||
|
|
"eval_wer": 0.4418426103646833,
|
||
|
|
"step": 1150
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 59.99,
|
||
|
|
"learning_rate": 4.1025641025641023e-05,
|
||
|
|
"loss": 0.1476,
|
||
|
|
"step": 1200
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 59.99,
|
||
|
|
"eval_loss": 1.1580840349197388,
|
||
|
|
"eval_runtime": 34.4611,
|
||
|
|
"eval_samples_per_second": 12.391,
|
||
|
|
"eval_steps_per_second": 0.783,
|
||
|
|
"eval_wer": 0.4410748560460653,
|
||
|
|
"step": 1200
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 62.49,
|
||
|
|
"learning_rate": 3.846153846153846e-05,
|
||
|
|
"loss": 0.1378,
|
||
|
|
"step": 1250
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 62.49,
|
||
|
|
"eval_loss": 1.1266977787017822,
|
||
|
|
"eval_runtime": 34.2613,
|
||
|
|
"eval_samples_per_second": 12.463,
|
||
|
|
"eval_steps_per_second": 0.788,
|
||
|
|
"eval_wer": 0.4303262955854127,
|
||
|
|
"step": 1250
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 64.99,
|
||
|
|
"learning_rate": 3.58974358974359e-05,
|
||
|
|
"loss": 0.1214,
|
||
|
|
"step": 1300
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 64.99,
|
||
|
|
"eval_loss": 1.165766716003418,
|
||
|
|
"eval_runtime": 33.9904,
|
||
|
|
"eval_samples_per_second": 12.562,
|
||
|
|
"eval_steps_per_second": 0.794,
|
||
|
|
"eval_wer": 0.42879078694817657,
|
||
|
|
"step": 1300
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 67.49,
|
||
|
|
"learning_rate": 3.3333333333333335e-05,
|
||
|
|
"loss": 0.133,
|
||
|
|
"step": 1350
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 67.49,
|
||
|
|
"eval_loss": 1.137351632118225,
|
||
|
|
"eval_runtime": 34.008,
|
||
|
|
"eval_samples_per_second": 12.556,
|
||
|
|
"eval_steps_per_second": 0.794,
|
||
|
|
"eval_wer": 0.43339731285988486,
|
||
|
|
"step": 1350
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 69.99,
|
||
|
|
"learning_rate": 3.0769230769230774e-05,
|
||
|
|
"loss": 0.1147,
|
||
|
|
"step": 1400
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 69.99,
|
||
|
|
"eval_loss": 1.1521999835968018,
|
||
|
|
"eval_runtime": 33.8683,
|
||
|
|
"eval_samples_per_second": 12.608,
|
||
|
|
"eval_steps_per_second": 0.797,
|
||
|
|
"eval_wer": 0.4245681381957774,
|
||
|
|
"step": 1400
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 72.49,
|
||
|
|
"learning_rate": 2.8205128205128207e-05,
|
||
|
|
"loss": 0.125,
|
||
|
|
"step": 1450
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 72.49,
|
||
|
|
"eval_loss": 1.1379369497299194,
|
||
|
|
"eval_runtime": 34.1582,
|
||
|
|
"eval_samples_per_second": 12.501,
|
||
|
|
"eval_steps_per_second": 0.79,
|
||
|
|
"eval_wer": 0.43570057581573896,
|
||
|
|
"step": 1450
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 74.99,
|
||
|
|
"learning_rate": 2.564102564102564e-05,
|
||
|
|
"loss": 0.1189,
|
||
|
|
"step": 1500
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 74.99,
|
||
|
|
"eval_loss": 1.1502233743667603,
|
||
|
|
"eval_runtime": 33.9539,
|
||
|
|
"eval_samples_per_second": 12.576,
|
||
|
|
"eval_steps_per_second": 0.795,
|
||
|
|
"eval_wer": 0.4284069097888676,
|
||
|
|
"step": 1500
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 77.49,
|
||
|
|
"learning_rate": 2.307692307692308e-05,
|
||
|
|
"loss": 0.1122,
|
||
|
|
"step": 1550
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 77.49,
|
||
|
|
"eval_loss": 1.1575168371200562,
|
||
|
|
"eval_runtime": 34.1792,
|
||
|
|
"eval_samples_per_second": 12.493,
|
||
|
|
"eval_steps_per_second": 0.79,
|
||
|
|
"eval_wer": 0.4314779270633397,
|
||
|
|
"step": 1550
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 79.99,
|
||
|
|
"learning_rate": 2.0512820512820512e-05,
|
||
|
|
"loss": 0.1235,
|
||
|
|
"step": 1600
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 79.99,
|
||
|
|
"eval_loss": 1.142774224281311,
|
||
|
|
"eval_runtime": 33.8121,
|
||
|
|
"eval_samples_per_second": 12.629,
|
||
|
|
"eval_steps_per_second": 0.799,
|
||
|
|
"eval_wer": 0.42610364683301344,
|
||
|
|
"step": 1600
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 82.49,
|
||
|
|
"learning_rate": 1.794871794871795e-05,
|
||
|
|
"loss": 0.1092,
|
||
|
|
"step": 1650
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 82.49,
|
||
|
|
"eval_loss": 1.1530485153198242,
|
||
|
|
"eval_runtime": 33.6852,
|
||
|
|
"eval_samples_per_second": 12.676,
|
||
|
|
"eval_steps_per_second": 0.802,
|
||
|
|
"eval_wer": 0.4341650671785029,
|
||
|
|
"step": 1650
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 84.99,
|
||
|
|
"learning_rate": 1.5384615384615387e-05,
|
||
|
|
"loss": 0.1185,
|
||
|
|
"step": 1700
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 84.99,
|
||
|
|
"eval_loss": 1.1284310817718506,
|
||
|
|
"eval_runtime": 33.8486,
|
||
|
|
"eval_samples_per_second": 12.615,
|
||
|
|
"eval_steps_per_second": 0.798,
|
||
|
|
"eval_wer": 0.42994241842610365,
|
||
|
|
"step": 1700
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 87.49,
|
||
|
|
"learning_rate": 1.282051282051282e-05,
|
||
|
|
"loss": 0.1048,
|
||
|
|
"step": 1750
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 87.49,
|
||
|
|
"eval_loss": 1.1434178352355957,
|
||
|
|
"eval_runtime": 33.9335,
|
||
|
|
"eval_samples_per_second": 12.583,
|
||
|
|
"eval_steps_per_second": 0.796,
|
||
|
|
"eval_wer": 0.4276391554702495,
|
||
|
|
"step": 1750
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 89.99,
|
||
|
|
"learning_rate": 1.0256410256410256e-05,
|
||
|
|
"loss": 0.1038,
|
||
|
|
"step": 1800
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 89.99,
|
||
|
|
"eval_loss": 1.1609505414962769,
|
||
|
|
"eval_runtime": 34.1384,
|
||
|
|
"eval_samples_per_second": 12.508,
|
||
|
|
"eval_steps_per_second": 0.791,
|
||
|
|
"eval_wer": 0.42418426103646834,
|
||
|
|
"step": 1800
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 92.49,
|
||
|
|
"learning_rate": 7.692307692307694e-06,
|
||
|
|
"loss": 0.1073,
|
||
|
|
"step": 1850
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 92.49,
|
||
|
|
"eval_loss": 1.1562278270721436,
|
||
|
|
"eval_runtime": 33.8455,
|
||
|
|
"eval_samples_per_second": 12.616,
|
||
|
|
"eval_steps_per_second": 0.798,
|
||
|
|
"eval_wer": 0.4238003838771593,
|
||
|
|
"step": 1850
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 94.99,
|
||
|
|
"learning_rate": 5.128205128205128e-06,
|
||
|
|
"loss": 0.1055,
|
||
|
|
"step": 1900
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 94.99,
|
||
|
|
"eval_loss": 1.1589001417160034,
|
||
|
|
"eval_runtime": 34.1041,
|
||
|
|
"eval_samples_per_second": 12.52,
|
||
|
|
"eval_steps_per_second": 0.792,
|
||
|
|
"eval_wer": 0.4214971209213052,
|
||
|
|
"step": 1900
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 97.49,
|
||
|
|
"learning_rate": 2.564102564102564e-06,
|
||
|
|
"loss": 0.1133,
|
||
|
|
"step": 1950
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 97.49,
|
||
|
|
"eval_loss": 1.1536645889282227,
|
||
|
|
"eval_runtime": 33.9701,
|
||
|
|
"eval_samples_per_second": 12.57,
|
||
|
|
"eval_steps_per_second": 0.795,
|
||
|
|
"eval_wer": 0.4238003838771593,
|
||
|
|
"step": 1950
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 99.99,
|
||
|
|
"learning_rate": 0.0,
|
||
|
|
"loss": 0.0992,
|
||
|
|
"step": 2000
|
||
|
|
},
|
||
|
|
{
|
||
|
|
"epoch": 99.99,
|
||
|
|
"eval_loss": 1.1553977727890015,
|
||
|
|
"eval_runtime": 33.8655,
|
||
|
|
"eval_samples_per_second": 12.609,
|
||
|
|
"eval_steps_per_second": 0.797,
|
||
|
|
"eval_wer": 0.42418426103646834,
|
||
|
|
"step": 2000
|
||
|
|
}
|
||
|
|
],
|
||
|
|
"max_steps": 2000,
|
||
|
|
"num_train_epochs": 100,
|
||
|
|
"total_flos": 1.6479245346890066e+19,
|
||
|
|
"trial_name": null,
|
||
|
|
"trial_params": null
|
||
|
|
}
|