Files
wav2vec2-large-xlsr-mecita-…/trainer_state.json
ModelHub XC 36f8fe9f41 初始化项目,由ModelHub XC社区提供模型
Model: alinerodrigues/wav2vec2-large-xlsr-mecita-coraa-portuguese-2-all-03
Source: Original Platform
2026-05-19 07:18:58 +08:00

986 lines
24 KiB
JSON

{
"best_metric": 0.1349739283323288,
"best_model_checkpoint": "wav2vec2-large-xlsr-mecita-coraa-portuguese-2-all-03/checkpoint-3698",
"epoch": 63.0,
"global_step": 5418,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.01,
"learning_rate": 3e-05,
"loss": 28.65,
"step": 1
},
{
"epoch": 1.0,
"eval_cer": 1.0,
"eval_loss": 3.1940298080444336,
"eval_runtime": 19.0983,
"eval_samples_per_second": 17.855,
"eval_steps_per_second": 2.252,
"eval_wer": 1.0,
"step": 86
},
{
"epoch": 1.16,
"learning_rate": 2.966511627906977e-05,
"loss": 8.1771,
"step": 100
},
{
"epoch": 2.0,
"eval_cer": 1.0,
"eval_loss": 2.9853453636169434,
"eval_runtime": 18.8941,
"eval_samples_per_second": 18.048,
"eval_steps_per_second": 2.276,
"eval_wer": 1.0,
"step": 172
},
{
"epoch": 2.33,
"learning_rate": 2.9316279069767443e-05,
"loss": 3.0358,
"step": 200
},
{
"epoch": 3.0,
"eval_cer": 1.0,
"eval_loss": 2.895540237426758,
"eval_runtime": 19.0821,
"eval_samples_per_second": 17.87,
"eval_steps_per_second": 2.253,
"eval_wer": 1.0,
"step": 258
},
{
"epoch": 3.49,
"learning_rate": 2.8967441860465116e-05,
"loss": 2.9359,
"step": 300
},
{
"epoch": 4.0,
"eval_cer": 1.0,
"eval_loss": 2.9086179733276367,
"eval_runtime": 19.1659,
"eval_samples_per_second": 17.792,
"eval_steps_per_second": 2.244,
"eval_wer": 1.0,
"step": 344
},
{
"epoch": 4.65,
"learning_rate": 2.861860465116279e-05,
"loss": 2.9026,
"step": 400
},
{
"epoch": 5.0,
"eval_cer": 0.9998215162197135,
"eval_loss": 2.694617509841919,
"eval_runtime": 18.8982,
"eval_samples_per_second": 18.044,
"eval_steps_per_second": 2.275,
"eval_wer": 0.9997623009270263,
"step": 430
},
{
"epoch": 5.81,
"learning_rate": 2.8269767441860464e-05,
"loss": 2.4934,
"step": 500
},
{
"epoch": 6.0,
"eval_cer": 0.1256525813216724,
"eval_loss": 0.9106346964836121,
"eval_runtime": 18.9322,
"eval_samples_per_second": 18.012,
"eval_steps_per_second": 2.271,
"eval_wer": 0.49441407178512004,
"step": 516
},
{
"epoch": 6.98,
"learning_rate": 2.7920930232558138e-05,
"loss": 1.1576,
"step": 600
},
{
"epoch": 7.0,
"eval_cer": 0.06273704877069296,
"eval_loss": 0.4618076980113983,
"eval_runtime": 19.1545,
"eval_samples_per_second": 17.803,
"eval_steps_per_second": 2.245,
"eval_wer": 0.22914190634656526,
"step": 602
},
{
"epoch": 8.0,
"eval_cer": 0.05381285975636964,
"eval_loss": 0.3426876664161682,
"eval_runtime": 19.3029,
"eval_samples_per_second": 17.666,
"eval_steps_per_second": 2.228,
"eval_wer": 0.18706917043023533,
"step": 688
},
{
"epoch": 8.14,
"learning_rate": 2.7572093023255812e-05,
"loss": 0.7498,
"step": 700
},
{
"epoch": 9.0,
"eval_cer": 0.04801213689705948,
"eval_loss": 0.283805251121521,
"eval_runtime": 18.9222,
"eval_samples_per_second": 18.021,
"eval_steps_per_second": 2.272,
"eval_wer": 0.16734014737342523,
"step": 774
},
{
"epoch": 9.3,
"learning_rate": 2.722325581395349e-05,
"loss": 0.5493,
"step": 800
},
{
"epoch": 10.0,
"eval_cer": 0.04417473562090045,
"eval_loss": 0.25037863850593567,
"eval_runtime": 19.1667,
"eval_samples_per_second": 17.791,
"eval_steps_per_second": 2.243,
"eval_wer": 0.14903731875445686,
"step": 860
},
{
"epoch": 10.47,
"learning_rate": 2.6874418604651163e-05,
"loss": 0.4735,
"step": 900
},
{
"epoch": 11.0,
"eval_cer": 0.041185132301102136,
"eval_loss": 0.23181051015853882,
"eval_runtime": 18.9289,
"eval_samples_per_second": 18.015,
"eval_steps_per_second": 2.272,
"eval_wer": 0.1388162586165914,
"step": 946
},
{
"epoch": 11.63,
"learning_rate": 2.6525581395348837e-05,
"loss": 0.4183,
"step": 1000
},
{
"epoch": 12.0,
"eval_cer": 0.037392351970014726,
"eval_loss": 0.2174120843410492,
"eval_runtime": 18.9003,
"eval_samples_per_second": 18.042,
"eval_steps_per_second": 2.275,
"eval_wer": 0.12146422628951747,
"step": 1032
},
{
"epoch": 12.79,
"learning_rate": 2.617674418604651e-05,
"loss": 0.3924,
"step": 1100
},
{
"epoch": 13.0,
"eval_cer": 0.03565213511222168,
"eval_loss": 0.20193208754062653,
"eval_runtime": 19.1675,
"eval_samples_per_second": 17.791,
"eval_steps_per_second": 2.243,
"eval_wer": 0.1126693605894937,
"step": 1118
},
{
"epoch": 13.95,
"learning_rate": 2.5827906976744185e-05,
"loss": 0.3497,
"step": 1200
},
{
"epoch": 14.0,
"eval_cer": 0.03431350676007318,
"eval_loss": 0.18761980533599854,
"eval_runtime": 19.269,
"eval_samples_per_second": 17.697,
"eval_steps_per_second": 2.232,
"eval_wer": 0.11124316615165201,
"step": 1204
},
{
"epoch": 15.0,
"eval_cer": 0.03507206282629066,
"eval_loss": 0.18645305931568146,
"eval_runtime": 18.9659,
"eval_samples_per_second": 17.98,
"eval_steps_per_second": 2.267,
"eval_wer": 0.1110054670786784,
"step": 1290
},
{
"epoch": 15.12,
"learning_rate": 2.5479069767441862e-05,
"loss": 0.3335,
"step": 1300
},
{
"epoch": 16.0,
"eval_cer": 0.0327517736825666,
"eval_loss": 0.17586949467658997,
"eval_runtime": 19.1261,
"eval_samples_per_second": 17.829,
"eval_steps_per_second": 2.248,
"eval_wer": 0.1064891846921797,
"step": 1376
},
{
"epoch": 16.28,
"learning_rate": 2.5130232558139536e-05,
"loss": 0.3259,
"step": 1400
},
{
"epoch": 17.0,
"eval_cer": 0.031011556824773547,
"eval_loss": 0.17175641655921936,
"eval_runtime": 18.8952,
"eval_samples_per_second": 18.047,
"eval_steps_per_second": 2.276,
"eval_wer": 0.0941288328975517,
"step": 1462
},
{
"epoch": 17.44,
"learning_rate": 2.478139534883721e-05,
"loss": 0.2822,
"step": 1500
},
{
"epoch": 18.0,
"eval_cer": 0.03074383115434385,
"eval_loss": 0.1663752645254135,
"eval_runtime": 19.0306,
"eval_samples_per_second": 17.919,
"eval_steps_per_second": 2.26,
"eval_wer": 0.09650582362728785,
"step": 1548
},
{
"epoch": 18.6,
"learning_rate": 2.4432558139534884e-05,
"loss": 0.2689,
"step": 1600
},
{
"epoch": 19.0,
"eval_cer": 0.030163758868412834,
"eval_loss": 0.16375425457954407,
"eval_runtime": 19.1028,
"eval_samples_per_second": 17.851,
"eval_steps_per_second": 2.251,
"eval_wer": 0.09507962918944617,
"step": 1634
},
{
"epoch": 19.77,
"learning_rate": 2.4083720930232558e-05,
"loss": 0.262,
"step": 1700
},
{
"epoch": 20.0,
"eval_cer": 0.030699210209272233,
"eval_loss": 0.1615932136774063,
"eval_runtime": 18.925,
"eval_samples_per_second": 18.019,
"eval_steps_per_second": 2.272,
"eval_wer": 0.09365343475160447,
"step": 1720
},
{
"epoch": 20.93,
"learning_rate": 2.373488372093023e-05,
"loss": 0.2623,
"step": 1800
},
{
"epoch": 21.0,
"eval_cer": 0.029896033197983132,
"eval_loss": 0.1573890894651413,
"eval_runtime": 18.8701,
"eval_samples_per_second": 18.071,
"eval_steps_per_second": 2.279,
"eval_wer": 0.09270263845971001,
"step": 1806
},
{
"epoch": 22.0,
"eval_cer": 0.030565347374057382,
"eval_loss": 0.15589450299739838,
"eval_runtime": 19.0532,
"eval_samples_per_second": 17.897,
"eval_steps_per_second": 2.257,
"eval_wer": 0.09436653197052532,
"step": 1892
},
{
"epoch": 22.09,
"learning_rate": 2.338604651162791e-05,
"loss": 0.2344,
"step": 1900
},
{
"epoch": 23.0,
"eval_cer": 0.029315960912052116,
"eval_loss": 0.15381626784801483,
"eval_runtime": 19.0478,
"eval_samples_per_second": 17.902,
"eval_steps_per_second": 2.257,
"eval_wer": 0.09198954124078916,
"step": 1978
},
{
"epoch": 23.26,
"learning_rate": 2.3037209302325583e-05,
"loss": 0.2315,
"step": 2000
},
{
"epoch": 24.0,
"eval_cer": 0.0298067913078399,
"eval_loss": 0.1532616764307022,
"eval_runtime": 19.3337,
"eval_samples_per_second": 17.638,
"eval_steps_per_second": 2.224,
"eval_wer": 0.09270263845971001,
"step": 2064
},
{
"epoch": 24.42,
"learning_rate": 2.2688372093023257e-05,
"loss": 0.2411,
"step": 2100
},
{
"epoch": 25.0,
"eval_cer": 0.029360581857123733,
"eval_loss": 0.15203775465488434,
"eval_runtime": 18.8831,
"eval_samples_per_second": 18.058,
"eval_steps_per_second": 2.277,
"eval_wer": 0.09080104587592108,
"step": 2150
},
{
"epoch": 25.58,
"learning_rate": 2.233953488372093e-05,
"loss": 0.2102,
"step": 2200
},
{
"epoch": 26.0,
"eval_cer": 0.02971754941769667,
"eval_loss": 0.14963804185390472,
"eval_runtime": 18.9765,
"eval_samples_per_second": 17.97,
"eval_steps_per_second": 2.266,
"eval_wer": 0.09222724031376278,
"step": 2236
},
{
"epoch": 26.74,
"learning_rate": 2.1990697674418605e-05,
"loss": 0.2115,
"step": 2300
},
{
"epoch": 27.0,
"eval_cer": 0.029762170362768285,
"eval_loss": 0.1473499834537506,
"eval_runtime": 18.9863,
"eval_samples_per_second": 17.96,
"eval_steps_per_second": 2.265,
"eval_wer": 0.09793201806512955,
"step": 2322
},
{
"epoch": 27.91,
"learning_rate": 2.1641860465116282e-05,
"loss": 0.2139,
"step": 2400
},
{
"epoch": 28.0,
"eval_cer": 0.029985275088126366,
"eval_loss": 0.14958611130714417,
"eval_runtime": 18.9624,
"eval_samples_per_second": 17.983,
"eval_steps_per_second": 2.268,
"eval_wer": 0.095792726408367,
"step": 2408
},
{
"epoch": 29.0,
"eval_cer": 0.02886975146133595,
"eval_loss": 0.14455682039260864,
"eval_runtime": 19.1059,
"eval_samples_per_second": 17.848,
"eval_steps_per_second": 2.251,
"eval_wer": 0.09032564772997385,
"step": 2494
},
{
"epoch": 29.07,
"learning_rate": 2.1293023255813956e-05,
"loss": 0.2218,
"step": 2500
},
{
"epoch": 30.0,
"eval_cer": 0.029137477131765652,
"eval_loss": 0.1481563001871109,
"eval_runtime": 19.0476,
"eval_samples_per_second": 17.903,
"eval_steps_per_second": 2.258,
"eval_wer": 0.09127644402186831,
"step": 2580
},
{
"epoch": 30.23,
"learning_rate": 2.094418604651163e-05,
"loss": 0.1982,
"step": 2600
},
{
"epoch": 31.0,
"eval_cer": 0.02837892106554817,
"eval_loss": 0.14385315775871277,
"eval_runtime": 18.9549,
"eval_samples_per_second": 17.99,
"eval_steps_per_second": 2.269,
"eval_wer": 0.08913715236510578,
"step": 2666
},
{
"epoch": 31.4,
"learning_rate": 2.0595348837209304e-05,
"loss": 0.196,
"step": 2700
},
{
"epoch": 32.0,
"eval_cer": 0.02860202579090625,
"eval_loss": 0.14276552200317383,
"eval_runtime": 19.1086,
"eval_samples_per_second": 17.845,
"eval_steps_per_second": 2.25,
"eval_wer": 0.09341573567863086,
"step": 2752
},
{
"epoch": 32.56,
"learning_rate": 2.0246511627906977e-05,
"loss": 0.1846,
"step": 2800
},
{
"epoch": 33.0,
"eval_cer": 0.028111195395118468,
"eval_loss": 0.14039289951324463,
"eval_runtime": 19.1208,
"eval_samples_per_second": 17.834,
"eval_steps_per_second": 2.249,
"eval_wer": 0.09056334680294748,
"step": 2838
},
{
"epoch": 33.72,
"learning_rate": 1.9897674418604655e-05,
"loss": 0.1873,
"step": 2900
},
{
"epoch": 34.0,
"eval_cer": 0.02717415554861452,
"eval_loss": 0.1395137906074524,
"eval_runtime": 19.1432,
"eval_samples_per_second": 17.813,
"eval_steps_per_second": 2.246,
"eval_wer": 0.08557166627050154,
"step": 2924
},
{
"epoch": 34.88,
"learning_rate": 1.954883720930233e-05,
"loss": 0.1854,
"step": 3000
},
{
"epoch": 35.0,
"eval_cer": 0.02677256704296997,
"eval_loss": 0.1353740692138672,
"eval_runtime": 19.2143,
"eval_samples_per_second": 17.747,
"eval_steps_per_second": 2.238,
"eval_wer": 0.08462086997860709,
"step": 3010
},
{
"epoch": 36.0,
"eval_cer": 0.027129534603542903,
"eval_loss": 0.1359284222126007,
"eval_runtime": 19.183,
"eval_samples_per_second": 17.776,
"eval_steps_per_second": 2.242,
"eval_wer": 0.08580936534347516,
"step": 3096
},
{
"epoch": 36.05,
"learning_rate": 1.9200000000000003e-05,
"loss": 0.1851,
"step": 3100
},
{
"epoch": 37.0,
"eval_cer": 0.027620364999330686,
"eval_loss": 0.13563700020313263,
"eval_runtime": 19.0319,
"eval_samples_per_second": 17.917,
"eval_steps_per_second": 2.259,
"eval_wer": 0.09032564772997385,
"step": 3182
},
{
"epoch": 37.21,
"learning_rate": 1.8851162790697673e-05,
"loss": 0.1733,
"step": 3200
},
{
"epoch": 38.0,
"eval_cer": 0.02704029271339967,
"eval_loss": 0.13802382349967957,
"eval_runtime": 19.2183,
"eval_samples_per_second": 17.744,
"eval_steps_per_second": 2.237,
"eval_wer": 0.08509626812455431,
"step": 3268
},
{
"epoch": 38.37,
"learning_rate": 1.8502325581395347e-05,
"loss": 0.1781,
"step": 3300
},
{
"epoch": 39.0,
"eval_cer": 0.02583552719646602,
"eval_loss": 0.13587680459022522,
"eval_runtime": 19.0209,
"eval_samples_per_second": 17.928,
"eval_steps_per_second": 2.261,
"eval_wer": 0.08129308295697647,
"step": 3354
},
{
"epoch": 39.53,
"learning_rate": 1.815348837209302e-05,
"loss": 0.1821,
"step": 3400
},
{
"epoch": 40.0,
"eval_cer": 0.027441881219044218,
"eval_loss": 0.13828882575035095,
"eval_runtime": 19.1283,
"eval_samples_per_second": 17.827,
"eval_steps_per_second": 2.248,
"eval_wer": 0.08628476348942239,
"step": 3440
},
{
"epoch": 40.7,
"learning_rate": 1.7804651162790698e-05,
"loss": 0.1724,
"step": 3500
},
{
"epoch": 41.0,
"eval_cer": 0.02650484137254027,
"eval_loss": 0.13766087591648102,
"eval_runtime": 19.2872,
"eval_samples_per_second": 17.68,
"eval_steps_per_second": 2.229,
"eval_wer": 0.08224387924887093,
"step": 3526
},
{
"epoch": 41.86,
"learning_rate": 1.7455813953488372e-05,
"loss": 0.1591,
"step": 3600
},
{
"epoch": 42.0,
"eval_cer": 0.026594083262683504,
"eval_loss": 0.13794943690299988,
"eval_runtime": 19.0157,
"eval_samples_per_second": 17.933,
"eval_steps_per_second": 2.261,
"eval_wer": 0.08438317090563346,
"step": 3612
},
{
"epoch": 43.0,
"eval_cer": 0.026103252866895722,
"eval_loss": 0.1349739283323288,
"eval_runtime": 18.9996,
"eval_samples_per_second": 17.948,
"eval_steps_per_second": 2.263,
"eval_wer": 0.08414547183265986,
"step": 3698
},
{
"epoch": 43.02,
"learning_rate": 1.7106976744186046e-05,
"loss": 0.168,
"step": 3700
},
{
"epoch": 44.0,
"eval_cer": 0.02650484137254027,
"eval_loss": 0.1362057477235794,
"eval_runtime": 19.2987,
"eval_samples_per_second": 17.67,
"eval_steps_per_second": 2.228,
"eval_wer": 0.08462086997860709,
"step": 3784
},
{
"epoch": 44.19,
"learning_rate": 1.675813953488372e-05,
"loss": 0.162,
"step": 3800
},
{
"epoch": 45.0,
"eval_cer": 0.02663870420775512,
"eval_loss": 0.13529056310653687,
"eval_runtime": 19.8929,
"eval_samples_per_second": 17.142,
"eval_steps_per_second": 2.162,
"eval_wer": 0.08200618017589731,
"step": 3870
},
{
"epoch": 45.35,
"learning_rate": 1.6409302325581394e-05,
"loss": 0.145,
"step": 3900
},
{
"epoch": 46.0,
"eval_cer": 0.026995671768328053,
"eval_loss": 0.14138084650039673,
"eval_runtime": 19.2935,
"eval_samples_per_second": 17.674,
"eval_steps_per_second": 2.229,
"eval_wer": 0.08485856905158069,
"step": 3956
},
{
"epoch": 46.51,
"learning_rate": 1.606046511627907e-05,
"loss": 0.1639,
"step": 4000
},
{
"epoch": 47.0,
"eval_cer": 0.026594083262683504,
"eval_loss": 0.13999956846237183,
"eval_runtime": 19.0568,
"eval_samples_per_second": 17.894,
"eval_steps_per_second": 2.256,
"eval_wer": 0.08367007368671261,
"step": 4042
},
{
"epoch": 47.67,
"learning_rate": 1.5711627906976745e-05,
"loss": 0.1572,
"step": 4100
},
{
"epoch": 48.0,
"eval_cer": 0.026058631921824105,
"eval_loss": 0.1387248933315277,
"eval_runtime": 19.0666,
"eval_samples_per_second": 17.885,
"eval_steps_per_second": 2.255,
"eval_wer": 0.08153078202995008,
"step": 4128
},
{
"epoch": 48.84,
"learning_rate": 1.536279069767442e-05,
"loss": 0.14,
"step": 4200
},
{
"epoch": 49.0,
"eval_cer": 0.02583552719646602,
"eval_loss": 0.1383592039346695,
"eval_runtime": 19.025,
"eval_samples_per_second": 17.924,
"eval_steps_per_second": 2.26,
"eval_wer": 0.08224387924887093,
"step": 4214
},
{
"epoch": 50.0,
"learning_rate": 1.5013953488372093e-05,
"loss": 0.1473,
"step": 4300
},
{
"epoch": 50.0,
"eval_cer": 0.026549462317611888,
"eval_loss": 0.13988161087036133,
"eval_runtime": 19.1678,
"eval_samples_per_second": 17.79,
"eval_steps_per_second": 2.243,
"eval_wer": 0.08271927739481816,
"step": 4300
},
{
"epoch": 51.0,
"eval_cer": 0.02650484137254027,
"eval_loss": 0.14077438414096832,
"eval_runtime": 19.0777,
"eval_samples_per_second": 17.874,
"eval_steps_per_second": 2.254,
"eval_wer": 0.08224387924887093,
"step": 4386
},
{
"epoch": 51.16,
"learning_rate": 1.4665116279069768e-05,
"loss": 0.1722,
"step": 4400
},
{
"epoch": 52.0,
"eval_cer": 0.026683325152826738,
"eval_loss": 0.1410902589559555,
"eval_runtime": 19.0905,
"eval_samples_per_second": 17.862,
"eval_steps_per_second": 2.252,
"eval_wer": 0.08509626812455431,
"step": 4472
},
{
"epoch": 52.33,
"learning_rate": 1.4316279069767442e-05,
"loss": 0.1518,
"step": 4500
},
{
"epoch": 53.0,
"eval_cer": 0.02730801838382937,
"eval_loss": 0.14102402329444885,
"eval_runtime": 19.0143,
"eval_samples_per_second": 17.934,
"eval_steps_per_second": 2.261,
"eval_wer": 0.08604706441644877,
"step": 4558
},
{
"epoch": 53.49,
"learning_rate": 1.3967441860465116e-05,
"loss": 0.1506,
"step": 4600
},
{
"epoch": 54.0,
"eval_cer": 0.02704029271339967,
"eval_loss": 0.14034318923950195,
"eval_runtime": 19.0734,
"eval_samples_per_second": 17.878,
"eval_steps_per_second": 2.254,
"eval_wer": 0.08580936534347516,
"step": 4644
},
{
"epoch": 54.65,
"learning_rate": 1.3618604651162792e-05,
"loss": 0.1442,
"step": 4700
},
{
"epoch": 55.0,
"eval_cer": 0.02623711570211057,
"eval_loss": 0.1380011886358261,
"eval_runtime": 19.092,
"eval_samples_per_second": 17.861,
"eval_steps_per_second": 2.252,
"eval_wer": 0.08319467554076539,
"step": 4730
},
{
"epoch": 55.81,
"learning_rate": 1.3269767441860466e-05,
"loss": 0.1427,
"step": 4800
},
{
"epoch": 56.0,
"eval_cer": 0.026549462317611888,
"eval_loss": 0.13952679932117462,
"eval_runtime": 19.0512,
"eval_samples_per_second": 17.899,
"eval_steps_per_second": 2.257,
"eval_wer": 0.08153078202995008,
"step": 4816
},
{
"epoch": 56.98,
"learning_rate": 1.292093023255814e-05,
"loss": 0.132,
"step": 4900
},
{
"epoch": 57.0,
"eval_cer": 0.025924769086609255,
"eval_loss": 0.13835428655147552,
"eval_runtime": 19.1303,
"eval_samples_per_second": 17.825,
"eval_steps_per_second": 2.248,
"eval_wer": 0.08129308295697647,
"step": 4902
},
{
"epoch": 58.0,
"eval_cer": 0.026058631921824105,
"eval_loss": 0.1352924406528473,
"eval_runtime": 19.3096,
"eval_samples_per_second": 17.66,
"eval_steps_per_second": 2.227,
"eval_wer": 0.0817684811029237,
"step": 4988
},
{
"epoch": 58.14,
"learning_rate": 1.2572093023255815e-05,
"loss": 0.1374,
"step": 5000
},
{
"epoch": 59.0,
"eval_cer": 0.02650484137254027,
"eval_loss": 0.140494242310524,
"eval_runtime": 19.0811,
"eval_samples_per_second": 17.871,
"eval_steps_per_second": 2.254,
"eval_wer": 0.08343237461373901,
"step": 5074
},
{
"epoch": 59.3,
"learning_rate": 1.2223255813953489e-05,
"loss": 0.1318,
"step": 5100
},
{
"epoch": 60.0,
"eval_cer": 0.02583552719646602,
"eval_loss": 0.1383277028799057,
"eval_runtime": 19.2077,
"eval_samples_per_second": 17.753,
"eval_steps_per_second": 2.239,
"eval_wer": 0.08105538388400285,
"step": 5160
},
{
"epoch": 60.47,
"learning_rate": 1.1874418604651165e-05,
"loss": 0.1339,
"step": 5200
},
{
"epoch": 61.0,
"eval_cer": 0.026058631921824105,
"eval_loss": 0.1385628879070282,
"eval_runtime": 19.3076,
"eval_samples_per_second": 17.661,
"eval_steps_per_second": 2.227,
"eval_wer": 0.08129308295697647,
"step": 5246
},
{
"epoch": 61.63,
"learning_rate": 1.1525581395348838e-05,
"loss": 0.1346,
"step": 5300
},
{
"epoch": 62.0,
"eval_cer": 0.025255454910535005,
"eval_loss": 0.13994893431663513,
"eval_runtime": 19.1977,
"eval_samples_per_second": 17.763,
"eval_steps_per_second": 2.24,
"eval_wer": 0.0801045875921084,
"step": 5332
},
{
"epoch": 62.79,
"learning_rate": 1.117674418604651e-05,
"loss": 0.1261,
"step": 5400
},
{
"epoch": 63.0,
"eval_cer": 0.026326357592253803,
"eval_loss": 0.14302104711532593,
"eval_runtime": 19.1245,
"eval_samples_per_second": 17.831,
"eval_steps_per_second": 2.248,
"eval_wer": 0.08319467554076539,
"step": 5418
},
{
"epoch": 63.0,
"step": 5418,
"total_flos": 4.528287283105284e+19,
"train_loss": 0.5869265782432654,
"train_runtime": 15592.601,
"train_samples_per_second": 17.592,
"train_steps_per_second": 0.552
}
],
"max_steps": 8600,
"num_train_epochs": 100,
"total_flos": 4.528287283105284e+19,
"trial_name": null,
"trial_params": null
}