wav2vec2-xls-r-300m-zh-CN / trainer_state.json
anantoj's picture
End of training
703b1d9
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 99.99963086009598,
"global_step": 67700,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.15,
"learning_rate": 3.6375e-06,
"loss": 135.2123,
"step": 100
},
{
"epoch": 0.3,
"learning_rate": 7.3875e-06,
"loss": 102.0052,
"step": 200
},
{
"epoch": 0.44,
"learning_rate": 1.1099999999999999e-05,
"loss": 85.3955,
"step": 300
},
{
"epoch": 0.59,
"learning_rate": 1.485e-05,
"loss": 78.0905,
"step": 400
},
{
"epoch": 0.74,
"learning_rate": 1.8599999999999998e-05,
"loss": 69.215,
"step": 500
},
{
"epoch": 0.74,
"eval_cer": 1.0,
"eval_loss": 74.97510528564453,
"eval_runtime": 128.2289,
"eval_samples_per_second": 15.761,
"eval_steps_per_second": 1.973,
"eval_wer": 1.0,
"step": 500
},
{
"epoch": 0.89,
"learning_rate": 2.2349999999999998e-05,
"loss": 58.6672,
"step": 600
},
{
"epoch": 1.03,
"learning_rate": 2.6099999999999997e-05,
"loss": 44.0383,
"step": 700
},
{
"epoch": 1.18,
"learning_rate": 2.985e-05,
"loss": 29.3981,
"step": 800
},
{
"epoch": 1.33,
"learning_rate": 3.36e-05,
"loss": 15.4855,
"step": 900
},
{
"epoch": 1.48,
"learning_rate": 3.735e-05,
"loss": 8.2109,
"step": 1000
},
{
"epoch": 1.48,
"eval_cer": 1.0,
"eval_loss": 7.061740875244141,
"eval_runtime": 114.3157,
"eval_samples_per_second": 17.679,
"eval_steps_per_second": 2.213,
"eval_wer": 1.0,
"step": 1000
},
{
"epoch": 1.62,
"learning_rate": 4.11e-05,
"loss": 6.7787,
"step": 1100
},
{
"epoch": 1.77,
"learning_rate": 4.484999999999999e-05,
"loss": 6.5334,
"step": 1200
},
{
"epoch": 1.92,
"learning_rate": 4.8599999999999995e-05,
"loss": 6.4625,
"step": 1300
},
{
"epoch": 2.07,
"learning_rate": 5.234999999999999e-05,
"loss": 6.4425,
"step": 1400
},
{
"epoch": 2.22,
"learning_rate": 5.6099999999999995e-05,
"loss": 6.4277,
"step": 1500
},
{
"epoch": 2.22,
"eval_cer": 1.0,
"eval_loss": 6.3811211585998535,
"eval_runtime": 113.5954,
"eval_samples_per_second": 17.791,
"eval_steps_per_second": 2.227,
"eval_wer": 1.0,
"step": 1500
},
{
"epoch": 2.36,
"learning_rate": 5.985e-05,
"loss": 6.403,
"step": 1600
},
{
"epoch": 2.51,
"learning_rate": 6.359999999999999e-05,
"loss": 6.3874,
"step": 1700
},
{
"epoch": 2.66,
"learning_rate": 6.735e-05,
"loss": 6.3883,
"step": 1800
},
{
"epoch": 2.81,
"learning_rate": 7.11e-05,
"loss": 6.3725,
"step": 1900
},
{
"epoch": 2.95,
"learning_rate": 7.484999999999999e-05,
"loss": 6.3513,
"step": 2000
},
{
"epoch": 2.95,
"eval_cer": 1.0,
"eval_loss": 6.306080341339111,
"eval_runtime": 112.6769,
"eval_samples_per_second": 17.936,
"eval_steps_per_second": 2.245,
"eval_wer": 1.0,
"step": 2000
},
{
"epoch": 3.1,
"learning_rate": 7.489041095890411e-05,
"loss": 6.3448,
"step": 2100
},
{
"epoch": 3.25,
"learning_rate": 7.477625570776254e-05,
"loss": 6.3001,
"step": 2200
},
{
"epoch": 3.4,
"learning_rate": 7.466210045662099e-05,
"loss": 6.299,
"step": 2300
},
{
"epoch": 3.54,
"learning_rate": 7.454794520547944e-05,
"loss": 6.2702,
"step": 2400
},
{
"epoch": 3.69,
"learning_rate": 7.443378995433789e-05,
"loss": 6.2522,
"step": 2500
},
{
"epoch": 3.69,
"eval_cer": 1.0,
"eval_loss": 6.214696884155273,
"eval_runtime": 112.5168,
"eval_samples_per_second": 17.962,
"eval_steps_per_second": 2.249,
"eval_wer": 1.0,
"step": 2500
},
{
"epoch": 3.84,
"learning_rate": 7.431963470319634e-05,
"loss": 6.2413,
"step": 2600
},
{
"epoch": 3.99,
"learning_rate": 7.420547945205478e-05,
"loss": 6.2068,
"step": 2700
},
{
"epoch": 4.14,
"learning_rate": 7.409132420091323e-05,
"loss": 6.1637,
"step": 2800
},
{
"epoch": 4.28,
"learning_rate": 7.397716894977168e-05,
"loss": 6.0668,
"step": 2900
},
{
"epoch": 4.43,
"learning_rate": 7.386301369863013e-05,
"loss": 5.9757,
"step": 3000
},
{
"epoch": 4.43,
"eval_cer": 0.992371009837382,
"eval_loss": 5.7906413078308105,
"eval_runtime": 112.7465,
"eval_samples_per_second": 17.925,
"eval_steps_per_second": 2.244,
"eval_wer": 1.1004453240969816,
"step": 3000
},
{
"epoch": 4.58,
"learning_rate": 7.374885844748858e-05,
"loss": 5.8919,
"step": 3100
},
{
"epoch": 4.73,
"learning_rate": 7.363470319634702e-05,
"loss": 5.7631,
"step": 3200
},
{
"epoch": 4.87,
"learning_rate": 7.352054794520547e-05,
"loss": 5.4749,
"step": 3300
},
{
"epoch": 5.02,
"learning_rate": 7.340639269406392e-05,
"loss": 5.2423,
"step": 3400
},
{
"epoch": 5.17,
"learning_rate": 7.329223744292237e-05,
"loss": 5.0642,
"step": 3500
},
{
"epoch": 5.17,
"eval_cer": 0.8214414776149368,
"eval_loss": 4.2983784675598145,
"eval_runtime": 113.4295,
"eval_samples_per_second": 17.817,
"eval_steps_per_second": 2.23,
"eval_wer": 1.772884710539337,
"step": 3500
},
{
"epoch": 5.32,
"learning_rate": 7.317808219178082e-05,
"loss": 4.9084,
"step": 3600
},
{
"epoch": 5.47,
"learning_rate": 7.306392694063926e-05,
"loss": 4.8479,
"step": 3700
},
{
"epoch": 5.61,
"learning_rate": 7.294977168949771e-05,
"loss": 4.7123,
"step": 3800
},
{
"epoch": 5.76,
"learning_rate": 7.283561643835616e-05,
"loss": 4.6807,
"step": 3900
},
{
"epoch": 5.91,
"learning_rate": 7.272146118721461e-05,
"loss": 4.6346,
"step": 4000
},
{
"epoch": 5.91,
"eval_cer": 0.7727765508933949,
"eval_loss": 3.7128512859344482,
"eval_runtime": 112.7717,
"eval_samples_per_second": 17.921,
"eval_steps_per_second": 2.243,
"eval_wer": 1.8946066303809994,
"step": 4000
},
{
"epoch": 6.06,
"learning_rate": 7.260730593607306e-05,
"loss": 4.5142,
"step": 4100
},
{
"epoch": 6.2,
"learning_rate": 7.249315068493149e-05,
"loss": 4.4345,
"step": 4200
},
{
"epoch": 6.35,
"learning_rate": 7.237899543378995e-05,
"loss": 4.3973,
"step": 4300
},
{
"epoch": 6.5,
"learning_rate": 7.226484018264839e-05,
"loss": 4.3012,
"step": 4400
},
{
"epoch": 6.65,
"learning_rate": 7.215068493150685e-05,
"loss": 4.267,
"step": 4500
},
{
"epoch": 6.65,
"eval_cer": 0.6921501706484642,
"eval_loss": 3.217658042907715,
"eval_runtime": 113.1901,
"eval_samples_per_second": 17.855,
"eval_steps_per_second": 2.235,
"eval_wer": 1.7525977238990598,
"step": 4500
},
{
"epoch": 6.79,
"learning_rate": 7.203767123287671e-05,
"loss": 4.2237,
"step": 4600
},
{
"epoch": 6.94,
"learning_rate": 7.192351598173514e-05,
"loss": 4.1326,
"step": 4700
},
{
"epoch": 7.09,
"learning_rate": 7.18093607305936e-05,
"loss": 4.0728,
"step": 4800
},
{
"epoch": 7.24,
"learning_rate": 7.169520547945204e-05,
"loss": 4.0127,
"step": 4900
},
{
"epoch": 7.39,
"learning_rate": 7.15810502283105e-05,
"loss": 3.9964,
"step": 5000
},
{
"epoch": 7.39,
"eval_cer": 0.6546476611122265,
"eval_loss": 2.8337087631225586,
"eval_runtime": 112.9864,
"eval_samples_per_second": 17.887,
"eval_steps_per_second": 2.239,
"eval_wer": 1.805541810984661,
"step": 5000
},
{
"epoch": 7.53,
"learning_rate": 7.146689497716894e-05,
"loss": 3.9397,
"step": 5100
},
{
"epoch": 7.68,
"learning_rate": 7.13527397260274e-05,
"loss": 3.8843,
"step": 5200
},
{
"epoch": 7.83,
"learning_rate": 7.123972602739726e-05,
"loss": 3.8829,
"step": 5300
},
{
"epoch": 7.98,
"learning_rate": 7.112557077625571e-05,
"loss": 3.8111,
"step": 5400
},
{
"epoch": 8.12,
"learning_rate": 7.101141552511414e-05,
"loss": 3.8035,
"step": 5500
},
{
"epoch": 8.12,
"eval_cer": 0.6992170246938366,
"eval_loss": 2.572591543197632,
"eval_runtime": 113.1543,
"eval_samples_per_second": 17.861,
"eval_steps_per_second": 2.236,
"eval_wer": 2.1850569025235034,
"step": 5500
},
{
"epoch": 8.27,
"learning_rate": 7.08972602739726e-05,
"loss": 3.7678,
"step": 5600
},
{
"epoch": 8.42,
"learning_rate": 7.078310502283104e-05,
"loss": 3.7781,
"step": 5700
},
{
"epoch": 8.57,
"learning_rate": 7.06689497716895e-05,
"loss": 3.7481,
"step": 5800
},
{
"epoch": 8.71,
"learning_rate": 7.055479452054793e-05,
"loss": 3.6356,
"step": 5900
},
{
"epoch": 8.86,
"learning_rate": 7.04406392694064e-05,
"loss": 3.6273,
"step": 6000
},
{
"epoch": 8.86,
"eval_cer": 0.651074081509737,
"eval_loss": 2.3390893936157227,
"eval_runtime": 111.201,
"eval_samples_per_second": 18.174,
"eval_steps_per_second": 2.275,
"eval_wer": 2.102919346857991,
"step": 6000
},
{
"epoch": 9.01,
"learning_rate": 7.032648401826483e-05,
"loss": 3.5851,
"step": 6100
},
{
"epoch": 9.16,
"learning_rate": 7.021232876712329e-05,
"loss": 3.5359,
"step": 6200
},
{
"epoch": 9.31,
"learning_rate": 7.009817351598173e-05,
"loss": 3.5385,
"step": 6300
},
{
"epoch": 9.45,
"learning_rate": 6.998401826484017e-05,
"loss": 3.5492,
"step": 6400
},
{
"epoch": 9.6,
"learning_rate": 6.986986301369862e-05,
"loss": 3.5248,
"step": 6500
},
{
"epoch": 9.6,
"eval_cer": 0.6858863681991568,
"eval_loss": 2.1943578720092773,
"eval_runtime": 112.8084,
"eval_samples_per_second": 17.915,
"eval_steps_per_second": 2.243,
"eval_wer": 2.3617021276595747,
"step": 6500
},
{
"epoch": 9.75,
"learning_rate": 6.975570776255707e-05,
"loss": 3.4791,
"step": 6600
},
{
"epoch": 9.9,
"learning_rate": 6.964269406392693e-05,
"loss": 3.4611,
"step": 6700
},
{
"epoch": 10.04,
"learning_rate": 6.952853881278538e-05,
"loss": 3.4418,
"step": 6800
},
{
"epoch": 10.19,
"learning_rate": 6.941438356164383e-05,
"loss": 3.4109,
"step": 6900
},
{
"epoch": 10.34,
"learning_rate": 6.930022831050228e-05,
"loss": 3.3683,
"step": 7000
},
{
"epoch": 10.34,
"eval_cer": 0.6063039550291106,
"eval_loss": 1.982745885848999,
"eval_runtime": 112.9729,
"eval_samples_per_second": 17.889,
"eval_steps_per_second": 2.239,
"eval_wer": 2.1014349332013853,
"step": 7000
},
{
"epoch": 10.49,
"learning_rate": 6.918721461187214e-05,
"loss": 3.3105,
"step": 7100
},
{
"epoch": 10.63,
"learning_rate": 6.907305936073059e-05,
"loss": 3.3242,
"step": 7200
},
{
"epoch": 10.78,
"learning_rate": 6.895890410958903e-05,
"loss": 3.3008,
"step": 7300
},
{
"epoch": 10.93,
"learning_rate": 6.884474885844748e-05,
"loss": 3.236,
"step": 7400
},
{
"epoch": 11.08,
"learning_rate": 6.873059360730593e-05,
"loss": 3.2411,
"step": 7500
},
{
"epoch": 11.08,
"eval_cer": 0.5135113431037944,
"eval_loss": 1.8609611988067627,
"eval_runtime": 112.6,
"eval_samples_per_second": 17.948,
"eval_steps_per_second": 2.247,
"eval_wer": 1.6160316674913409,
"step": 7500
},
{
"epoch": 11.23,
"learning_rate": 6.861643835616438e-05,
"loss": 3.2234,
"step": 7600
},
{
"epoch": 11.37,
"learning_rate": 6.850228310502283e-05,
"loss": 3.2441,
"step": 7700
},
{
"epoch": 11.52,
"learning_rate": 6.838812785388127e-05,
"loss": 3.2143,
"step": 7800
},
{
"epoch": 11.67,
"learning_rate": 6.827511415525114e-05,
"loss": 3.1661,
"step": 7900
},
{
"epoch": 11.82,
"learning_rate": 6.816095890410958e-05,
"loss": 3.1299,
"step": 8000
},
{
"epoch": 11.82,
"eval_cer": 0.4946396305962658,
"eval_loss": 1.744581937789917,
"eval_runtime": 113.3696,
"eval_samples_per_second": 17.827,
"eval_steps_per_second": 2.232,
"eval_wer": 1.59475507174666,
"step": 8000
},
{
"epoch": 11.96,
"learning_rate": 6.804680365296803e-05,
"loss": 3.1423,
"step": 8100
},
{
"epoch": 12.11,
"learning_rate": 6.793264840182648e-05,
"loss": 3.0895,
"step": 8200
},
{
"epoch": 12.26,
"learning_rate": 6.781849315068493e-05,
"loss": 3.0671,
"step": 8300
},
{
"epoch": 12.41,
"learning_rate": 6.770433789954338e-05,
"loss": 3.0724,
"step": 8400
},
{
"epoch": 12.56,
"learning_rate": 6.759018264840182e-05,
"loss": 3.0574,
"step": 8500
},
{
"epoch": 12.56,
"eval_cer": 0.4051395302148163,
"eval_loss": 1.6454455852508545,
"eval_runtime": 113.3175,
"eval_samples_per_second": 17.835,
"eval_steps_per_second": 2.233,
"eval_wer": 1.1291439881246907,
"step": 8500
},
{
"epoch": 12.7,
"learning_rate": 6.747602739726027e-05,
"loss": 3.047,
"step": 8600
},
{
"epoch": 12.85,
"learning_rate": 6.736187214611872e-05,
"loss": 3.0417,
"step": 8700
},
{
"epoch": 13.0,
"learning_rate": 6.724771689497717e-05,
"loss": 3.0791,
"step": 8800
},
{
"epoch": 13.15,
"learning_rate": 6.713356164383562e-05,
"loss": 3.0183,
"step": 8900
},
{
"epoch": 13.29,
"learning_rate": 6.701940639269405e-05,
"loss": 2.985,
"step": 9000
},
{
"epoch": 13.29,
"eval_cer": 0.38931941377233487,
"eval_loss": 1.5918797254562378,
"eval_runtime": 113.1024,
"eval_samples_per_second": 17.869,
"eval_steps_per_second": 2.237,
"eval_wer": 1.0672934190994556,
"step": 9000
},
{
"epoch": 13.44,
"learning_rate": 6.690525114155251e-05,
"loss": 3.001,
"step": 9100
},
{
"epoch": 13.59,
"learning_rate": 6.679109589041095e-05,
"loss": 2.9494,
"step": 9200
},
{
"epoch": 13.74,
"learning_rate": 6.667694063926941e-05,
"loss": 2.966,
"step": 9300
},
{
"epoch": 13.88,
"learning_rate": 6.656278538812784e-05,
"loss": 2.931,
"step": 9400
},
{
"epoch": 14.03,
"learning_rate": 6.64486301369863e-05,
"loss": 2.9573,
"step": 9500
},
{
"epoch": 14.03,
"eval_cer": 0.3765910459747039,
"eval_loss": 1.4903326034545898,
"eval_runtime": 113.3108,
"eval_samples_per_second": 17.836,
"eval_steps_per_second": 2.233,
"eval_wer": 1.0603661553686294,
"step": 9500
},
{
"epoch": 14.18,
"learning_rate": 6.633447488584474e-05,
"loss": 2.9104,
"step": 9600
},
{
"epoch": 14.33,
"learning_rate": 6.622031963470319e-05,
"loss": 2.9196,
"step": 9700
},
{
"epoch": 14.48,
"learning_rate": 6.610616438356163e-05,
"loss": 2.9326,
"step": 9800
},
{
"epoch": 14.62,
"learning_rate": 6.599200913242008e-05,
"loss": 2.9378,
"step": 9900
},
{
"epoch": 14.77,
"learning_rate": 6.587785388127853e-05,
"loss": 2.8897,
"step": 10000
},
{
"epoch": 14.77,
"eval_cer": 0.3652680184701867,
"eval_loss": 1.4614206552505493,
"eval_runtime": 113.6791,
"eval_samples_per_second": 17.778,
"eval_steps_per_second": 2.226,
"eval_wer": 1.0059376546264225,
"step": 10000
},
{
"epoch": 14.92,
"learning_rate": 6.576369863013698e-05,
"loss": 2.8819,
"step": 10100
},
{
"epoch": 15.07,
"learning_rate": 6.564954337899543e-05,
"loss": 2.8727,
"step": 10200
},
{
"epoch": 15.21,
"learning_rate": 6.553538812785387e-05,
"loss": 2.8518,
"step": 10300
},
{
"epoch": 15.36,
"learning_rate": 6.542123287671232e-05,
"loss": 2.8674,
"step": 10400
},
{
"epoch": 15.51,
"learning_rate": 6.530707762557077e-05,
"loss": 2.8169,
"step": 10500
},
{
"epoch": 15.51,
"eval_cer": 0.3549889580405541,
"eval_loss": 1.3997114896774292,
"eval_runtime": 113.6295,
"eval_samples_per_second": 17.786,
"eval_steps_per_second": 2.227,
"eval_wer": 1.0029688273132114,
"step": 10500
},
{
"epoch": 15.66,
"learning_rate": 6.519292237442922e-05,
"loss": 2.8574,
"step": 10600
},
{
"epoch": 15.8,
"learning_rate": 6.507876712328767e-05,
"loss": 2.813,
"step": 10700
},
{
"epoch": 15.95,
"learning_rate": 6.496461187214611e-05,
"loss": 2.8157,
"step": 10800
},
{
"epoch": 16.1,
"learning_rate": 6.485045662100456e-05,
"loss": 2.7573,
"step": 10900
},
{
"epoch": 16.25,
"learning_rate": 6.473630136986301e-05,
"loss": 2.8155,
"step": 11000
},
{
"epoch": 16.25,
"eval_cer": 0.344147761493676,
"eval_loss": 1.344403862953186,
"eval_runtime": 114.1268,
"eval_samples_per_second": 17.708,
"eval_steps_per_second": 2.217,
"eval_wer": 0.9980207817911925,
"step": 11000
},
{
"epoch": 16.4,
"learning_rate": 6.462214611872146e-05,
"loss": 2.7492,
"step": 11100
},
{
"epoch": 16.54,
"learning_rate": 6.45079908675799e-05,
"loss": 2.7507,
"step": 11200
},
{
"epoch": 16.69,
"learning_rate": 6.439383561643835e-05,
"loss": 2.7498,
"step": 11300
},
{
"epoch": 16.84,
"learning_rate": 6.42796803652968e-05,
"loss": 2.7684,
"step": 11400
},
{
"epoch": 16.99,
"learning_rate": 6.416552511415525e-05,
"loss": 2.7595,
"step": 11500
},
{
"epoch": 16.99,
"eval_cer": 0.332543665930536,
"eval_loss": 1.291101098060608,
"eval_runtime": 113.7438,
"eval_samples_per_second": 17.768,
"eval_steps_per_second": 2.224,
"eval_wer": 0.9703117268678871,
"step": 11500
},
{
"epoch": 17.13,
"learning_rate": 6.405136986301368e-05,
"loss": 2.6838,
"step": 11600
},
{
"epoch": 17.28,
"learning_rate": 6.393721461187215e-05,
"loss": 2.7349,
"step": 11700
},
{
"epoch": 17.43,
"learning_rate": 6.382305936073058e-05,
"loss": 2.6699,
"step": 11800
},
{
"epoch": 17.58,
"learning_rate": 6.370890410958904e-05,
"loss": 2.6713,
"step": 11900
},
{
"epoch": 17.72,
"learning_rate": 6.359474885844748e-05,
"loss": 2.7107,
"step": 12000
},
{
"epoch": 17.72,
"eval_cer": 0.32274643645854245,
"eval_loss": 1.246199369430542,
"eval_runtime": 113.0259,
"eval_samples_per_second": 17.881,
"eval_steps_per_second": 2.238,
"eval_wer": 0.9564571994062345,
"step": 12000
},
{
"epoch": 17.87,
"learning_rate": 6.348059360730594e-05,
"loss": 2.6684,
"step": 12100
},
{
"epoch": 18.02,
"learning_rate": 6.336643835616437e-05,
"loss": 2.6952,
"step": 12200
},
{
"epoch": 18.17,
"learning_rate": 6.325228310502283e-05,
"loss": 2.674,
"step": 12300
},
{
"epoch": 18.32,
"learning_rate": 6.313812785388127e-05,
"loss": 2.6453,
"step": 12400
},
{
"epoch": 18.46,
"learning_rate": 6.302397260273972e-05,
"loss": 2.6358,
"step": 12500
},
{
"epoch": 18.46,
"eval_cer": 0.3333467175266011,
"eval_loss": 1.2466477155685425,
"eval_runtime": 113.2849,
"eval_samples_per_second": 17.84,
"eval_steps_per_second": 2.233,
"eval_wer": 0.9955467590301831,
"step": 12500
},
{
"epoch": 18.61,
"learning_rate": 6.290981735159816e-05,
"loss": 2.6803,
"step": 12600
},
{
"epoch": 18.76,
"learning_rate": 6.279566210045661e-05,
"loss": 2.65,
"step": 12700
},
{
"epoch": 18.91,
"learning_rate": 6.268150684931506e-05,
"loss": 2.6329,
"step": 12800
},
{
"epoch": 19.05,
"learning_rate": 6.256735159817351e-05,
"loss": 2.6163,
"step": 12900
},
{
"epoch": 19.2,
"learning_rate": 6.245319634703196e-05,
"loss": 2.5801,
"step": 13000
},
{
"epoch": 19.2,
"eval_cer": 0.3226259787191327,
"eval_loss": 1.2059358358383179,
"eval_runtime": 112.9979,
"eval_samples_per_second": 17.885,
"eval_steps_per_second": 2.239,
"eval_wer": 1.0009896091044037,
"step": 13000
},
{
"epoch": 19.35,
"learning_rate": 6.23390410958904e-05,
"loss": 2.5665,
"step": 13100
},
{
"epoch": 19.5,
"learning_rate": 6.222602739726027e-05,
"loss": 2.6008,
"step": 13200
},
{
"epoch": 19.65,
"learning_rate": 6.211187214611871e-05,
"loss": 2.6289,
"step": 13300
},
{
"epoch": 19.79,
"learning_rate": 6.199771689497716e-05,
"loss": 2.5758,
"step": 13400
},
{
"epoch": 19.94,
"learning_rate": 6.188356164383561e-05,
"loss": 2.5554,
"step": 13500
},
{
"epoch": 19.94,
"eval_cer": 0.32234491066050996,
"eval_loss": 1.1918950080871582,
"eval_runtime": 113.3722,
"eval_samples_per_second": 17.826,
"eval_steps_per_second": 2.232,
"eval_wer": 1.0094012864918358,
"step": 13500
},
{
"epoch": 20.09,
"learning_rate": 6.176940639269406e-05,
"loss": 2.5404,
"step": 13600
},
{
"epoch": 20.24,
"learning_rate": 6.16552511415525e-05,
"loss": 2.4976,
"step": 13700
},
{
"epoch": 20.38,
"learning_rate": 6.154109589041095e-05,
"loss": 2.5373,
"step": 13800
},
{
"epoch": 20.53,
"learning_rate": 6.14269406392694e-05,
"loss": 2.5567,
"step": 13900
},
{
"epoch": 20.68,
"learning_rate": 6.131278538812785e-05,
"loss": 2.5314,
"step": 14000
},
{
"epoch": 20.68,
"eval_cer": 0.3155591246737603,
"eval_loss": 1.1703130006790161,
"eval_runtime": 113.4999,
"eval_samples_per_second": 17.806,
"eval_steps_per_second": 2.229,
"eval_wer": 0.9846610588817417,
"step": 14000
},
{
"epoch": 20.83,
"learning_rate": 6.11986301369863e-05,
"loss": 2.5179,
"step": 14100
},
{
"epoch": 20.97,
"learning_rate": 6.108447488584475e-05,
"loss": 2.5583,
"step": 14200
},
{
"epoch": 21.12,
"learning_rate": 6.097031963470319e-05,
"loss": 2.5269,
"step": 14300
},
{
"epoch": 21.27,
"learning_rate": 6.085616438356164e-05,
"loss": 2.5432,
"step": 14400
},
{
"epoch": 21.42,
"learning_rate": 6.074200913242008e-05,
"loss": 2.509,
"step": 14500
},
{
"epoch": 21.42,
"eval_cer": 0.3177273639831359,
"eval_loss": 1.173261284828186,
"eval_runtime": 113.3988,
"eval_samples_per_second": 17.822,
"eval_steps_per_second": 2.231,
"eval_wer": 0.9896091044037605,
"step": 14500
},
{
"epoch": 21.57,
"learning_rate": 6.062785388127854e-05,
"loss": 2.5077,
"step": 14600
},
{
"epoch": 21.71,
"learning_rate": 6.051369863013698e-05,
"loss": 2.4927,
"step": 14700
},
{
"epoch": 21.86,
"learning_rate": 6.039954337899543e-05,
"loss": 2.5003,
"step": 14800
},
{
"epoch": 22.01,
"learning_rate": 6.0285388127853875e-05,
"loss": 2.4673,
"step": 14900
},
{
"epoch": 22.16,
"learning_rate": 6.017123287671232e-05,
"loss": 2.4391,
"step": 15000
},
{
"epoch": 22.16,
"eval_cer": 0.3164023288496286,
"eval_loss": 1.181095838546753,
"eval_runtime": 113.7552,
"eval_samples_per_second": 17.766,
"eval_steps_per_second": 2.224,
"eval_wer": 0.9722909450766947,
"step": 15000
},
{
"epoch": 22.3,
"learning_rate": 6.005707762557077e-05,
"loss": 2.5065,
"step": 15100
},
{
"epoch": 22.45,
"learning_rate": 5.994292237442922e-05,
"loss": 2.4362,
"step": 15200
},
{
"epoch": 22.6,
"learning_rate": 5.982876712328766e-05,
"loss": 2.4788,
"step": 15300
},
{
"epoch": 22.75,
"learning_rate": 5.9714611872146115e-05,
"loss": 2.4702,
"step": 15400
},
{
"epoch": 22.89,
"learning_rate": 5.9600456621004556e-05,
"loss": 2.4631,
"step": 15500
},
{
"epoch": 22.89,
"eval_cer": 0.3059225055209797,
"eval_loss": 1.1381694078445435,
"eval_runtime": 114.6577,
"eval_samples_per_second": 17.626,
"eval_steps_per_second": 2.207,
"eval_wer": 0.9698169223156853,
"step": 15500
},
{
"epoch": 23.04,
"learning_rate": 5.948630136986301e-05,
"loss": 2.4725,
"step": 15600
},
{
"epoch": 23.19,
"learning_rate": 5.937328767123287e-05,
"loss": 2.4331,
"step": 15700
},
{
"epoch": 23.34,
"learning_rate": 5.9259132420091314e-05,
"loss": 2.4275,
"step": 15800
},
{
"epoch": 23.49,
"learning_rate": 5.914497716894977e-05,
"loss": 2.444,
"step": 15900
},
{
"epoch": 23.63,
"learning_rate": 5.903082191780821e-05,
"loss": 2.4414,
"step": 16000
},
{
"epoch": 23.63,
"eval_cer": 0.2972495482834772,
"eval_loss": 1.0892748832702637,
"eval_runtime": 114.5627,
"eval_samples_per_second": 17.641,
"eval_steps_per_second": 2.208,
"eval_wer": 0.9643740722414647,
"step": 16000
},
{
"epoch": 23.78,
"learning_rate": 5.8916666666666664e-05,
"loss": 2.3934,
"step": 16100
},
{
"epoch": 23.93,
"learning_rate": 5.8802511415525106e-05,
"loss": 2.4254,
"step": 16200
},
{
"epoch": 24.08,
"learning_rate": 5.8688356164383554e-05,
"loss": 2.4022,
"step": 16300
},
{
"epoch": 24.22,
"learning_rate": 5.8574200913242e-05,
"loss": 2.3613,
"step": 16400
},
{
"epoch": 24.37,
"learning_rate": 5.846004566210045e-05,
"loss": 2.3771,
"step": 16500
},
{
"epoch": 24.37,
"eval_cer": 0.2954025296125276,
"eval_loss": 1.0930148363113403,
"eval_runtime": 114.2056,
"eval_samples_per_second": 17.696,
"eval_steps_per_second": 2.215,
"eval_wer": 0.9505195447798119,
"step": 16500
},
{
"epoch": 24.52,
"learning_rate": 5.83458904109589e-05,
"loss": 2.3801,
"step": 16600
},
{
"epoch": 24.67,
"learning_rate": 5.8231735159817346e-05,
"loss": 2.3638,
"step": 16700
},
{
"epoch": 24.82,
"learning_rate": 5.8117579908675794e-05,
"loss": 2.3813,
"step": 16800
},
{
"epoch": 24.96,
"learning_rate": 5.800342465753424e-05,
"loss": 2.388,
"step": 16900
},
{
"epoch": 25.11,
"learning_rate": 5.788926940639268e-05,
"loss": 2.3658,
"step": 17000
},
{
"epoch": 25.11,
"eval_cer": 0.2925918490262999,
"eval_loss": 1.0755608081817627,
"eval_runtime": 112.4178,
"eval_samples_per_second": 17.978,
"eval_steps_per_second": 2.251,
"eval_wer": 0.9609104403760514,
"step": 17000
},
{
"epoch": 25.26,
"learning_rate": 5.777511415525114e-05,
"loss": 2.3624,
"step": 17100
},
{
"epoch": 25.41,
"learning_rate": 5.766095890410958e-05,
"loss": 2.376,
"step": 17200
},
{
"epoch": 25.55,
"learning_rate": 5.7546803652968034e-05,
"loss": 2.3337,
"step": 17300
},
{
"epoch": 25.7,
"learning_rate": 5.7432648401826475e-05,
"loss": 2.332,
"step": 17400
},
{
"epoch": 25.85,
"learning_rate": 5.731849315068493e-05,
"loss": 2.3215,
"step": 17500
},
{
"epoch": 25.85,
"eval_cer": 0.2889781168440072,
"eval_loss": 1.0512421131134033,
"eval_runtime": 113.4988,
"eval_samples_per_second": 17.806,
"eval_steps_per_second": 2.229,
"eval_wer": 0.9614052449282533,
"step": 17500
},
{
"epoch": 26.0,
"learning_rate": 5.720433789954337e-05,
"loss": 2.3507,
"step": 17600
},
{
"epoch": 26.14,
"learning_rate": 5.709246575342465e-05,
"loss": 2.3051,
"step": 17700
},
{
"epoch": 26.29,
"learning_rate": 5.69783105022831e-05,
"loss": 2.2839,
"step": 17800
},
{
"epoch": 26.44,
"learning_rate": 5.686415525114155e-05,
"loss": 2.3098,
"step": 17900
},
{
"epoch": 26.59,
"learning_rate": 5.675e-05,
"loss": 2.3327,
"step": 18000
},
{
"epoch": 26.59,
"eval_cer": 0.32816703473198156,
"eval_loss": 1.0626572370529175,
"eval_runtime": 113.1488,
"eval_samples_per_second": 17.861,
"eval_steps_per_second": 2.236,
"eval_wer": 1.198416625432954,
"step": 18000
},
{
"epoch": 26.74,
"learning_rate": 5.663584474885844e-05,
"loss": 2.2986,
"step": 18100
},
{
"epoch": 26.88,
"learning_rate": 5.652168949771689e-05,
"loss": 2.3408,
"step": 18200
},
{
"epoch": 27.03,
"learning_rate": 5.6407534246575334e-05,
"loss": 2.311,
"step": 18300
},
{
"epoch": 27.18,
"learning_rate": 5.629337899543379e-05,
"loss": 2.2481,
"step": 18400
},
{
"epoch": 27.33,
"learning_rate": 5.617922374429223e-05,
"loss": 2.3055,
"step": 18500
},
{
"epoch": 27.33,
"eval_cer": 0.2841196546878137,
"eval_loss": 1.0581693649291992,
"eval_runtime": 113.906,
"eval_samples_per_second": 17.743,
"eval_steps_per_second": 2.221,
"eval_wer": 0.9520039584364176,
"step": 18500
},
{
"epoch": 27.47,
"learning_rate": 5.6065068493150685e-05,
"loss": 2.3342,
"step": 18600
},
{
"epoch": 27.62,
"learning_rate": 5.5950913242009126e-05,
"loss": 2.3318,
"step": 18700
},
{
"epoch": 27.77,
"learning_rate": 5.583675799086758e-05,
"loss": 2.2844,
"step": 18800
},
{
"epoch": 27.92,
"learning_rate": 5.572260273972602e-05,
"loss": 2.3207,
"step": 18900
},
{
"epoch": 28.06,
"learning_rate": 5.560844748858447e-05,
"loss": 2.299,
"step": 19000
},
{
"epoch": 28.06,
"eval_cer": 0.2816703473198153,
"eval_loss": 1.0356189012527466,
"eval_runtime": 114.3143,
"eval_samples_per_second": 17.679,
"eval_steps_per_second": 2.213,
"eval_wer": 0.9480455220188025,
"step": 19000
},
{
"epoch": 28.21,
"learning_rate": 5.549429223744292e-05,
"loss": 2.269,
"step": 19100
},
{
"epoch": 28.36,
"learning_rate": 5.5380136986301366e-05,
"loss": 2.2875,
"step": 19200
},
{
"epoch": 28.51,
"learning_rate": 5.5265981735159814e-05,
"loss": 2.241,
"step": 19300
},
{
"epoch": 28.66,
"learning_rate": 5.515182648401826e-05,
"loss": 2.2714,
"step": 19400
},
{
"epoch": 28.8,
"learning_rate": 5.5037671232876703e-05,
"loss": 2.2673,
"step": 19500
},
{
"epoch": 28.8,
"eval_cer": 0.27709295322224453,
"eval_loss": 1.030503749847412,
"eval_runtime": 113.8786,
"eval_samples_per_second": 17.747,
"eval_steps_per_second": 2.222,
"eval_wer": 0.9366650173181593,
"step": 19500
},
{
"epoch": 28.95,
"learning_rate": 5.492351598173516e-05,
"loss": 2.2386,
"step": 19600
},
{
"epoch": 29.1,
"learning_rate": 5.48093607305936e-05,
"loss": 2.2634,
"step": 19700
},
{
"epoch": 29.25,
"learning_rate": 5.4695205479452054e-05,
"loss": 2.2135,
"step": 19800
},
{
"epoch": 29.39,
"learning_rate": 5.4581050228310495e-05,
"loss": 2.2101,
"step": 19900
},
{
"epoch": 29.54,
"learning_rate": 5.446689497716895e-05,
"loss": 2.2166,
"step": 20000
},
{
"epoch": 29.54,
"eval_cer": 0.27018670949608514,
"eval_loss": 1.0138665437698364,
"eval_runtime": 113.1869,
"eval_samples_per_second": 17.855,
"eval_steps_per_second": 2.235,
"eval_wer": 0.9223156853043047,
"step": 20000
},
{
"epoch": 29.69,
"learning_rate": 5.435273972602739e-05,
"loss": 2.2537,
"step": 20100
},
{
"epoch": 29.84,
"learning_rate": 5.4238584474885846e-05,
"loss": 2.2282,
"step": 20200
},
{
"epoch": 29.98,
"learning_rate": 5.412442922374429e-05,
"loss": 2.2253,
"step": 20300
},
{
"epoch": 30.13,
"learning_rate": 5.4010273972602735e-05,
"loss": 2.1831,
"step": 20400
},
{
"epoch": 30.28,
"learning_rate": 5.389611872146118e-05,
"loss": 2.2378,
"step": 20500
},
{
"epoch": 30.28,
"eval_cer": 0.27215418590644447,
"eval_loss": 1.009473204612732,
"eval_runtime": 113.8468,
"eval_samples_per_second": 17.752,
"eval_steps_per_second": 2.222,
"eval_wer": 0.9267689262741218,
"step": 20500
},
{
"epoch": 30.43,
"learning_rate": 5.378196347031963e-05,
"loss": 2.2226,
"step": 20600
},
{
"epoch": 30.58,
"learning_rate": 5.366780821917808e-05,
"loss": 2.212,
"step": 20700
},
{
"epoch": 30.72,
"learning_rate": 5.355365296803653e-05,
"loss": 2.2008,
"step": 20800
},
{
"epoch": 30.87,
"learning_rate": 5.343949771689497e-05,
"loss": 2.1976,
"step": 20900
},
{
"epoch": 31.02,
"learning_rate": 5.332534246575342e-05,
"loss": 2.2168,
"step": 21000
},
{
"epoch": 31.02,
"eval_cer": 0.26906243726159407,
"eval_loss": 1.000132441520691,
"eval_runtime": 113.357,
"eval_samples_per_second": 17.829,
"eval_steps_per_second": 2.232,
"eval_wer": 0.9084611578426521,
"step": 21000
},
{
"epoch": 31.17,
"learning_rate": 5.3211187214611865e-05,
"loss": 2.1397,
"step": 21100
},
{
"epoch": 31.31,
"learning_rate": 5.309703196347032e-05,
"loss": 2.1295,
"step": 21200
},
{
"epoch": 31.46,
"learning_rate": 5.298287671232876e-05,
"loss": 2.1799,
"step": 21300
},
{
"epoch": 31.61,
"learning_rate": 5.2868721461187215e-05,
"loss": 2.1911,
"step": 21400
},
{
"epoch": 31.76,
"learning_rate": 5.2754566210045657e-05,
"loss": 2.1766,
"step": 21500
},
{
"epoch": 31.76,
"eval_cer": 0.2640032122063843,
"eval_loss": 0.9883873462677002,
"eval_runtime": 112.449,
"eval_samples_per_second": 17.973,
"eval_steps_per_second": 2.25,
"eval_wer": 0.904997525977239,
"step": 21500
},
{
"epoch": 31.91,
"learning_rate": 5.264041095890411e-05,
"loss": 2.1739,
"step": 21600
},
{
"epoch": 32.05,
"learning_rate": 5.252625570776255e-05,
"loss": 2.1613,
"step": 21700
},
{
"epoch": 32.2,
"learning_rate": 5.2413242009132414e-05,
"loss": 2.1642,
"step": 21800
},
{
"epoch": 32.35,
"learning_rate": 5.229908675799087e-05,
"loss": 2.1227,
"step": 21900
},
{
"epoch": 32.5,
"learning_rate": 5.218493150684931e-05,
"loss": 2.1715,
"step": 22000
},
{
"epoch": 32.5,
"eval_cer": 0.271913270427625,
"eval_loss": 0.9729828834533691,
"eval_runtime": 113.2869,
"eval_samples_per_second": 17.84,
"eval_steps_per_second": 2.233,
"eval_wer": 0.9505195447798119,
"step": 22000
},
{
"epoch": 32.64,
"learning_rate": 5.207077625570776e-05,
"loss": 2.1648,
"step": 22100
},
{
"epoch": 32.79,
"learning_rate": 5.1956621004566206e-05,
"loss": 2.1391,
"step": 22200
},
{
"epoch": 32.94,
"learning_rate": 5.1842465753424654e-05,
"loss": 2.1289,
"step": 22300
},
{
"epoch": 33.09,
"learning_rate": 5.17283105022831e-05,
"loss": 2.1069,
"step": 22400
},
{
"epoch": 33.23,
"learning_rate": 5.161415525114155e-05,
"loss": 2.1104,
"step": 22500
},
{
"epoch": 33.23,
"eval_cer": 0.2655691628187111,
"eval_loss": 0.975226104259491,
"eval_runtime": 113.7072,
"eval_samples_per_second": 17.774,
"eval_steps_per_second": 2.225,
"eval_wer": 0.9361702127659575,
"step": 22500
},
{
"epoch": 33.38,
"learning_rate": 5.149999999999999e-05,
"loss": 2.104,
"step": 22600
},
{
"epoch": 33.53,
"learning_rate": 5.1385844748858446e-05,
"loss": 2.1359,
"step": 22700
},
{
"epoch": 33.68,
"learning_rate": 5.127168949771689e-05,
"loss": 2.1363,
"step": 22800
},
{
"epoch": 33.83,
"learning_rate": 5.115753424657534e-05,
"loss": 2.1217,
"step": 22900
},
{
"epoch": 33.97,
"learning_rate": 5.1043378995433783e-05,
"loss": 2.1158,
"step": 23000
},
{
"epoch": 33.97,
"eval_cer": 0.26239710901425417,
"eval_loss": 0.971994161605835,
"eval_runtime": 113.8291,
"eval_samples_per_second": 17.755,
"eval_steps_per_second": 2.223,
"eval_wer": 0.9262741217219198,
"step": 23000
},
{
"epoch": 34.12,
"learning_rate": 5.092922374429224e-05,
"loss": 2.1035,
"step": 23100
},
{
"epoch": 34.27,
"learning_rate": 5.081506849315068e-05,
"loss": 2.0811,
"step": 23200
},
{
"epoch": 34.42,
"learning_rate": 5.070091324200913e-05,
"loss": 2.0994,
"step": 23300
},
{
"epoch": 34.56,
"learning_rate": 5.0586757990867575e-05,
"loss": 2.1054,
"step": 23400
},
{
"epoch": 34.71,
"learning_rate": 5.047260273972602e-05,
"loss": 2.0718,
"step": 23500
},
{
"epoch": 34.71,
"eval_cer": 0.27588837582814696,
"eval_loss": 0.9573031663894653,
"eval_runtime": 113.0887,
"eval_samples_per_second": 17.871,
"eval_steps_per_second": 2.237,
"eval_wer": 1.000494804552202,
"step": 23500
},
{
"epoch": 34.86,
"learning_rate": 5.035844748858447e-05,
"loss": 2.1031,
"step": 23600
},
{
"epoch": 35.01,
"learning_rate": 5.024429223744292e-05,
"loss": 2.0799,
"step": 23700
},
{
"epoch": 35.16,
"learning_rate": 5.013127853881278e-05,
"loss": 2.0666,
"step": 23800
},
{
"epoch": 35.3,
"learning_rate": 5.001712328767123e-05,
"loss": 2.079,
"step": 23900
},
{
"epoch": 35.45,
"learning_rate": 4.990296803652968e-05,
"loss": 2.0824,
"step": 24000
},
{
"epoch": 35.45,
"eval_cer": 0.26428428026500705,
"eval_loss": 0.960873007774353,
"eval_runtime": 113.6706,
"eval_samples_per_second": 17.779,
"eval_steps_per_second": 2.226,
"eval_wer": 0.9524987629886195,
"step": 24000
},
{
"epoch": 35.6,
"learning_rate": 4.978881278538812e-05,
"loss": 2.0896,
"step": 24100
},
{
"epoch": 35.75,
"learning_rate": 4.967465753424657e-05,
"loss": 2.0978,
"step": 24200
},
{
"epoch": 35.89,
"learning_rate": 4.9560502283105014e-05,
"loss": 2.0796,
"step": 24300
},
{
"epoch": 36.04,
"learning_rate": 4.944634703196347e-05,
"loss": 2.047,
"step": 24400
},
{
"epoch": 36.19,
"learning_rate": 4.933219178082191e-05,
"loss": 2.0591,
"step": 24500
},
{
"epoch": 36.19,
"eval_cer": 0.26669343505320214,
"eval_loss": 0.9662116169929504,
"eval_runtime": 112.5392,
"eval_samples_per_second": 17.958,
"eval_steps_per_second": 2.248,
"eval_wer": 0.9569520039584364,
"step": 24500
},
{
"epoch": 36.34,
"learning_rate": 4.9218036529680365e-05,
"loss": 2.0458,
"step": 24600
},
{
"epoch": 36.48,
"learning_rate": 4.910502283105023e-05,
"loss": 2.0697,
"step": 24700
},
{
"epoch": 36.63,
"learning_rate": 4.899086757990867e-05,
"loss": 2.0633,
"step": 24800
},
{
"epoch": 36.78,
"learning_rate": 4.887671232876712e-05,
"loss": 2.0296,
"step": 24900
},
{
"epoch": 36.93,
"learning_rate": 4.8762557077625564e-05,
"loss": 2.0768,
"step": 25000
},
{
"epoch": 36.93,
"eval_cer": 0.26456534832362977,
"eval_loss": 0.9527919292449951,
"eval_runtime": 113.2105,
"eval_samples_per_second": 17.852,
"eval_steps_per_second": 2.235,
"eval_wer": 0.9574468085106383,
"step": 25000
},
{
"epoch": 37.08,
"learning_rate": 4.864840182648401e-05,
"loss": 2.0588,
"step": 25100
},
{
"epoch": 37.22,
"learning_rate": 4.853424657534246e-05,
"loss": 2.0251,
"step": 25200
},
{
"epoch": 37.37,
"learning_rate": 4.842009132420091e-05,
"loss": 2.0823,
"step": 25300
},
{
"epoch": 37.52,
"learning_rate": 4.8305936073059356e-05,
"loss": 2.0337,
"step": 25400
},
{
"epoch": 37.67,
"learning_rate": 4.8191780821917804e-05,
"loss": 2.0893,
"step": 25500
},
{
"epoch": 37.67,
"eval_cer": 0.2612326841999599,
"eval_loss": 0.9809953570365906,
"eval_runtime": 112.6858,
"eval_samples_per_second": 17.935,
"eval_steps_per_second": 2.245,
"eval_wer": 0.9168728352300841,
"step": 25500
},
{
"epoch": 37.81,
"learning_rate": 4.807762557077625e-05,
"loss": 2.0755,
"step": 25600
},
{
"epoch": 37.96,
"learning_rate": 4.79634703196347e-05,
"loss": 2.0494,
"step": 25700
},
{
"epoch": 38.11,
"learning_rate": 4.784931506849314e-05,
"loss": 2.0441,
"step": 25800
},
{
"epoch": 38.26,
"learning_rate": 4.7735159817351596e-05,
"loss": 2.022,
"step": 25900
},
{
"epoch": 38.4,
"learning_rate": 4.762100456621004e-05,
"loss": 2.0282,
"step": 26000
},
{
"epoch": 38.4,
"eval_cer": 0.2527604898614736,
"eval_loss": 0.9555507302284241,
"eval_runtime": 115.3715,
"eval_samples_per_second": 17.517,
"eval_steps_per_second": 2.193,
"eval_wer": 0.8876793666501732,
"step": 26000
},
{
"epoch": 38.55,
"learning_rate": 4.750684931506849e-05,
"loss": 2.0534,
"step": 26100
},
{
"epoch": 38.7,
"learning_rate": 4.739269406392693e-05,
"loss": 2.0246,
"step": 26200
},
{
"epoch": 38.85,
"learning_rate": 4.727853881278539e-05,
"loss": 2.027,
"step": 26300
},
{
"epoch": 39.0,
"learning_rate": 4.716438356164383e-05,
"loss": 2.0049,
"step": 26400
},
{
"epoch": 39.14,
"learning_rate": 4.705022831050228e-05,
"loss": 1.997,
"step": 26500
},
{
"epoch": 39.14,
"eval_cer": 0.2500702670146557,
"eval_loss": 0.9522635340690613,
"eval_runtime": 113.4036,
"eval_samples_per_second": 17.821,
"eval_steps_per_second": 2.231,
"eval_wer": 0.8723404255319149,
"step": 26500
},
{
"epoch": 39.29,
"learning_rate": 4.6936073059360725e-05,
"loss": 2.0177,
"step": 26600
},
{
"epoch": 39.44,
"learning_rate": 4.682191780821917e-05,
"loss": 2.0133,
"step": 26700
},
{
"epoch": 39.59,
"learning_rate": 4.670776255707762e-05,
"loss": 1.9869,
"step": 26800
},
{
"epoch": 39.73,
"learning_rate": 4.659360730593607e-05,
"loss": 2.0126,
"step": 26900
},
{
"epoch": 39.88,
"learning_rate": 4.647945205479452e-05,
"loss": 2.0209,
"step": 27000
},
{
"epoch": 39.88,
"eval_cer": 0.2503111824934752,
"eval_loss": 0.9542492032051086,
"eval_runtime": 112.4842,
"eval_samples_per_second": 17.967,
"eval_steps_per_second": 2.249,
"eval_wer": 0.8772884710539337,
"step": 27000
},
{
"epoch": 40.03,
"learning_rate": 4.6365296803652965e-05,
"loss": 2.0127,
"step": 27100
},
{
"epoch": 40.18,
"learning_rate": 4.6251141552511406e-05,
"loss": 1.9615,
"step": 27200
},
{
"epoch": 40.32,
"learning_rate": 4.613698630136986e-05,
"loss": 2.0066,
"step": 27300
},
{
"epoch": 40.47,
"learning_rate": 4.60228310502283e-05,
"loss": 1.9535,
"step": 27400
},
{
"epoch": 40.62,
"learning_rate": 4.590867579908676e-05,
"loss": 1.987,
"step": 27500
},
{
"epoch": 40.62,
"eval_cer": 0.25003011443485246,
"eval_loss": 0.9427167177200317,
"eval_runtime": 113.6661,
"eval_samples_per_second": 17.78,
"eval_steps_per_second": 2.226,
"eval_wer": 0.8866897575457694,
"step": 27500
},
{
"epoch": 40.77,
"learning_rate": 4.57945205479452e-05,
"loss": 2.0127,
"step": 27600
},
{
"epoch": 40.92,
"learning_rate": 4.568036529680365e-05,
"loss": 2.0376,
"step": 27700
},
{
"epoch": 41.06,
"learning_rate": 4.5566210045662094e-05,
"loss": 1.9884,
"step": 27800
},
{
"epoch": 41.21,
"learning_rate": 4.545205479452054e-05,
"loss": 1.9957,
"step": 27900
},
{
"epoch": 41.36,
"learning_rate": 4.533789954337899e-05,
"loss": 1.9663,
"step": 28000
},
{
"epoch": 41.36,
"eval_cer": 0.2546476611122265,
"eval_loss": 0.9546382427215576,
"eval_runtime": 113.2668,
"eval_samples_per_second": 17.843,
"eval_steps_per_second": 2.234,
"eval_wer": 0.9064819396338446,
"step": 28000
},
{
"epoch": 41.51,
"learning_rate": 4.522374429223744e-05,
"loss": 1.9957,
"step": 28100
},
{
"epoch": 41.65,
"learning_rate": 4.5109589041095886e-05,
"loss": 1.9788,
"step": 28200
},
{
"epoch": 41.8,
"learning_rate": 4.4995433789954334e-05,
"loss": 1.992,
"step": 28300
},
{
"epoch": 41.95,
"learning_rate": 4.4881278538812775e-05,
"loss": 1.9798,
"step": 28400
},
{
"epoch": 42.1,
"learning_rate": 4.476712328767123e-05,
"loss": 1.9945,
"step": 28500
},
{
"epoch": 42.1,
"eval_cer": 0.2536036940373419,
"eval_loss": 0.9430962204933167,
"eval_runtime": 113.3718,
"eval_samples_per_second": 17.826,
"eval_steps_per_second": 2.232,
"eval_wer": 0.9119247897080653,
"step": 28500
},
{
"epoch": 42.25,
"learning_rate": 4.465296803652967e-05,
"loss": 1.9457,
"step": 28600
},
{
"epoch": 42.39,
"learning_rate": 4.4538812785388126e-05,
"loss": 1.9808,
"step": 28700
},
{
"epoch": 42.54,
"learning_rate": 4.442465753424657e-05,
"loss": 1.9565,
"step": 28800
},
{
"epoch": 42.69,
"learning_rate": 4.431050228310502e-05,
"loss": 1.9395,
"step": 28900
},
{
"epoch": 42.84,
"learning_rate": 4.4196347031963463e-05,
"loss": 1.9604,
"step": 29000
},
{
"epoch": 42.84,
"eval_cer": 0.24898614735996788,
"eval_loss": 0.936680018901825,
"eval_runtime": 113.5751,
"eval_samples_per_second": 17.794,
"eval_steps_per_second": 2.228,
"eval_wer": 0.9030183077684315,
"step": 29000
},
{
"epoch": 42.98,
"learning_rate": 4.4083333333333325e-05,
"loss": 1.9569,
"step": 29100
},
{
"epoch": 43.13,
"learning_rate": 4.396917808219178e-05,
"loss": 1.9521,
"step": 29200
},
{
"epoch": 43.28,
"learning_rate": 4.385502283105022e-05,
"loss": 1.9383,
"step": 29300
},
{
"epoch": 43.43,
"learning_rate": 4.3740867579908676e-05,
"loss": 1.9199,
"step": 29400
},
{
"epoch": 43.57,
"learning_rate": 4.362671232876712e-05,
"loss": 1.933,
"step": 29500
},
{
"epoch": 43.57,
"eval_cer": 0.2431640232884963,
"eval_loss": 0.9071494936943054,
"eval_runtime": 113.901,
"eval_samples_per_second": 17.743,
"eval_steps_per_second": 2.221,
"eval_wer": 0.8916378030677882,
"step": 29500
},
{
"epoch": 43.72,
"learning_rate": 4.3512557077625565e-05,
"loss": 1.9212,
"step": 29600
},
{
"epoch": 43.87,
"learning_rate": 4.339840182648401e-05,
"loss": 1.9337,
"step": 29700
},
{
"epoch": 44.02,
"learning_rate": 4.328424657534246e-05,
"loss": 1.9216,
"step": 29800
},
{
"epoch": 44.17,
"learning_rate": 4.317009132420091e-05,
"loss": 1.8678,
"step": 29900
},
{
"epoch": 44.31,
"learning_rate": 4.305593607305936e-05,
"loss": 1.9227,
"step": 30000
},
{
"epoch": 44.31,
"eval_cer": 0.24284280265007027,
"eval_loss": 0.9047707319259644,
"eval_runtime": 114.4717,
"eval_samples_per_second": 17.655,
"eval_steps_per_second": 2.21,
"eval_wer": 0.8881741712023751,
"step": 30000
},
{
"epoch": 44.46,
"learning_rate": 4.29417808219178e-05,
"loss": 1.9218,
"step": 30100
},
{
"epoch": 44.61,
"learning_rate": 4.282762557077625e-05,
"loss": 1.8979,
"step": 30200
},
{
"epoch": 44.76,
"learning_rate": 4.2713470319634694e-05,
"loss": 1.8942,
"step": 30300
},
{
"epoch": 44.9,
"learning_rate": 4.259931506849315e-05,
"loss": 1.9312,
"step": 30400
},
{
"epoch": 45.05,
"learning_rate": 4.248515981735159e-05,
"loss": 1.8784,
"step": 30500
},
{
"epoch": 45.05,
"eval_cer": 0.24372615940574183,
"eval_loss": 0.9106321930885315,
"eval_runtime": 113.4695,
"eval_samples_per_second": 17.811,
"eval_steps_per_second": 2.23,
"eval_wer": 0.8990598713508164,
"step": 30500
},
{
"epoch": 45.2,
"learning_rate": 4.2371004566210045e-05,
"loss": 1.8804,
"step": 30600
},
{
"epoch": 45.35,
"learning_rate": 4.2256849315068486e-05,
"loss": 1.8806,
"step": 30700
},
{
"epoch": 45.49,
"learning_rate": 4.214269406392694e-05,
"loss": 1.8847,
"step": 30800
},
{
"epoch": 45.64,
"learning_rate": 4.20296803652968e-05,
"loss": 1.8782,
"step": 30900
},
{
"epoch": 45.79,
"learning_rate": 4.1915525114155244e-05,
"loss": 1.8844,
"step": 31000
},
{
"epoch": 45.79,
"eval_cer": 0.237863882754467,
"eval_loss": 0.8996090292930603,
"eval_runtime": 113.2035,
"eval_samples_per_second": 17.853,
"eval_steps_per_second": 2.235,
"eval_wer": 0.875804057397328,
"step": 31000
},
{
"epoch": 45.94,
"learning_rate": 4.180136986301369e-05,
"loss": 1.8547,
"step": 31100
},
{
"epoch": 46.09,
"learning_rate": 4.168721461187214e-05,
"loss": 1.8476,
"step": 31200
},
{
"epoch": 46.23,
"learning_rate": 4.157305936073059e-05,
"loss": 1.8317,
"step": 31300
},
{
"epoch": 46.38,
"learning_rate": 4.1458904109589036e-05,
"loss": 1.8754,
"step": 31400
},
{
"epoch": 46.53,
"learning_rate": 4.1344748858447484e-05,
"loss": 1.8776,
"step": 31500
},
{
"epoch": 46.53,
"eval_cer": 0.23946998594659707,
"eval_loss": 0.9027520418167114,
"eval_runtime": 112.8193,
"eval_samples_per_second": 17.914,
"eval_steps_per_second": 2.243,
"eval_wer": 0.8797624938149431,
"step": 31500
},
{
"epoch": 46.68,
"learning_rate": 4.1230593607305925e-05,
"loss": 1.8392,
"step": 31600
},
{
"epoch": 46.82,
"learning_rate": 4.111643835616438e-05,
"loss": 1.8412,
"step": 31700
},
{
"epoch": 46.97,
"learning_rate": 4.100228310502282e-05,
"loss": 1.8716,
"step": 31800
},
{
"epoch": 47.12,
"learning_rate": 4.0888127853881276e-05,
"loss": 1.83,
"step": 31900
},
{
"epoch": 47.27,
"learning_rate": 4.077397260273972e-05,
"loss": 1.8372,
"step": 32000
},
{
"epoch": 47.27,
"eval_cer": 0.23790403533427024,
"eval_loss": 0.9047237634658813,
"eval_runtime": 113.7608,
"eval_samples_per_second": 17.765,
"eval_steps_per_second": 2.224,
"eval_wer": 0.8777832756061356,
"step": 32000
},
{
"epoch": 47.41,
"learning_rate": 4.065981735159817e-05,
"loss": 1.8219,
"step": 32100
},
{
"epoch": 47.56,
"learning_rate": 4.054566210045661e-05,
"loss": 1.8591,
"step": 32200
},
{
"epoch": 47.71,
"learning_rate": 4.043150684931507e-05,
"loss": 1.8271,
"step": 32300
},
{
"epoch": 47.86,
"learning_rate": 4.031735159817351e-05,
"loss": 1.8388,
"step": 32400
},
{
"epoch": 48.01,
"learning_rate": 4.020319634703196e-05,
"loss": 1.832,
"step": 32500
},
{
"epoch": 48.01,
"eval_cer": 0.2392692230475808,
"eval_loss": 0.9015888571739197,
"eval_runtime": 113.7725,
"eval_samples_per_second": 17.764,
"eval_steps_per_second": 2.224,
"eval_wer": 0.8941118258287977,
"step": 32500
},
{
"epoch": 48.15,
"learning_rate": 4.0089041095890405e-05,
"loss": 1.8286,
"step": 32600
},
{
"epoch": 48.3,
"learning_rate": 3.997488584474885e-05,
"loss": 1.8156,
"step": 32700
},
{
"epoch": 48.45,
"learning_rate": 3.98607305936073e-05,
"loss": 1.8137,
"step": 32800
},
{
"epoch": 48.6,
"learning_rate": 3.974657534246575e-05,
"loss": 1.816,
"step": 32900
},
{
"epoch": 48.74,
"learning_rate": 3.963242009132419e-05,
"loss": 1.8154,
"step": 33000
},
{
"epoch": 48.74,
"eval_cer": 0.23722144147761492,
"eval_loss": 0.8914681077003479,
"eval_runtime": 114.1832,
"eval_samples_per_second": 17.7,
"eval_steps_per_second": 2.216,
"eval_wer": 0.8916378030677882,
"step": 33000
},
{
"epoch": 48.89,
"learning_rate": 3.9518264840182645e-05,
"loss": 1.8166,
"step": 33100
},
{
"epoch": 49.04,
"learning_rate": 3.9404109589041086e-05,
"loss": 1.7795,
"step": 33200
},
{
"epoch": 49.19,
"learning_rate": 3.928995433789954e-05,
"loss": 1.7661,
"step": 33300
},
{
"epoch": 49.34,
"learning_rate": 3.917579908675798e-05,
"loss": 1.8,
"step": 33400
},
{
"epoch": 49.48,
"learning_rate": 3.906164383561644e-05,
"loss": 1.8072,
"step": 33500
},
{
"epoch": 49.48,
"eval_cer": 0.23653884762095964,
"eval_loss": 0.8781279921531677,
"eval_runtime": 113.0385,
"eval_samples_per_second": 17.879,
"eval_steps_per_second": 2.238,
"eval_wer": 0.8871845620979713,
"step": 33500
},
{
"epoch": 49.63,
"learning_rate": 3.89486301369863e-05,
"loss": 1.7845,
"step": 33600
},
{
"epoch": 49.78,
"learning_rate": 3.883447488584475e-05,
"loss": 1.785,
"step": 33700
},
{
"epoch": 49.93,
"learning_rate": 3.8720319634703195e-05,
"loss": 1.784,
"step": 33800
},
{
"epoch": 50.07,
"learning_rate": 3.860616438356164e-05,
"loss": 1.7633,
"step": 33900
},
{
"epoch": 50.22,
"learning_rate": 3.8492009132420084e-05,
"loss": 1.7489,
"step": 34000
},
{
"epoch": 50.22,
"eval_cer": 0.234049387673158,
"eval_loss": 0.8738340139389038,
"eval_runtime": 114.2979,
"eval_samples_per_second": 17.682,
"eval_steps_per_second": 2.214,
"eval_wer": 0.8955962394854032,
"step": 34000
},
{
"epoch": 50.37,
"learning_rate": 3.837785388127854e-05,
"loss": 1.7925,
"step": 34100
},
{
"epoch": 50.52,
"learning_rate": 3.826369863013698e-05,
"loss": 1.7551,
"step": 34200
},
{
"epoch": 50.66,
"learning_rate": 3.8149543378995435e-05,
"loss": 1.7946,
"step": 34300
},
{
"epoch": 50.81,
"learning_rate": 3.8035388127853876e-05,
"loss": 1.7948,
"step": 34400
},
{
"epoch": 50.96,
"learning_rate": 3.792123287671233e-05,
"loss": 1.7928,
"step": 34500
},
{
"epoch": 50.96,
"eval_cer": 0.2322826741618149,
"eval_loss": 0.8683820962905884,
"eval_runtime": 113.3816,
"eval_samples_per_second": 17.825,
"eval_steps_per_second": 2.231,
"eval_wer": 0.8871845620979713,
"step": 34500
},
{
"epoch": 51.11,
"learning_rate": 3.780707762557077e-05,
"loss": 1.8077,
"step": 34600
},
{
"epoch": 51.26,
"learning_rate": 3.769292237442923e-05,
"loss": 1.7541,
"step": 34700
},
{
"epoch": 51.4,
"learning_rate": 3.757876712328767e-05,
"loss": 1.7685,
"step": 34800
},
{
"epoch": 51.55,
"learning_rate": 3.7464611872146116e-05,
"loss": 1.7638,
"step": 34900
},
{
"epoch": 51.7,
"learning_rate": 3.7350456621004564e-05,
"loss": 1.7748,
"step": 35000
},
{
"epoch": 51.7,
"eval_cer": 0.23208191126279865,
"eval_loss": 0.8722881078720093,
"eval_runtime": 114.2085,
"eval_samples_per_second": 17.696,
"eval_steps_per_second": 2.215,
"eval_wer": 0.871845620979713,
"step": 35000
},
{
"epoch": 51.85,
"learning_rate": 3.723630136986301e-05,
"loss": 1.7681,
"step": 35100
},
{
"epoch": 51.99,
"learning_rate": 3.712214611872146e-05,
"loss": 1.7296,
"step": 35200
},
{
"epoch": 52.14,
"learning_rate": 3.700799086757991e-05,
"loss": 1.7553,
"step": 35300
},
{
"epoch": 52.29,
"learning_rate": 3.689383561643835e-05,
"loss": 1.7645,
"step": 35400
},
{
"epoch": 52.44,
"learning_rate": 3.67796803652968e-05,
"loss": 1.7355,
"step": 35500
},
{
"epoch": 52.44,
"eval_cer": 0.2331258783376832,
"eval_loss": 0.8760409951210022,
"eval_runtime": 113.1141,
"eval_samples_per_second": 17.867,
"eval_steps_per_second": 2.237,
"eval_wer": 0.88421573478476,
"step": 35500
},
{
"epoch": 52.58,
"learning_rate": 3.6665525114155245e-05,
"loss": 1.7223,
"step": 35600
},
{
"epoch": 52.73,
"learning_rate": 3.655136986301369e-05,
"loss": 1.7647,
"step": 35700
},
{
"epoch": 52.88,
"learning_rate": 3.643721461187214e-05,
"loss": 1.7258,
"step": 35800
},
{
"epoch": 53.03,
"learning_rate": 3.632305936073059e-05,
"loss": 1.7425,
"step": 35900
},
{
"epoch": 53.18,
"learning_rate": 3.620890410958904e-05,
"loss": 1.7167,
"step": 36000
},
{
"epoch": 53.18,
"eval_cer": 0.23236297932142141,
"eval_loss": 0.8746222853660583,
"eval_runtime": 112.5705,
"eval_samples_per_second": 17.953,
"eval_steps_per_second": 2.247,
"eval_wer": 0.8817417120237506,
"step": 36000
},
{
"epoch": 53.32,
"learning_rate": 3.6094748858447485e-05,
"loss": 1.7699,
"step": 36100
},
{
"epoch": 53.47,
"learning_rate": 3.598059360730593e-05,
"loss": 1.7263,
"step": 36200
},
{
"epoch": 53.62,
"learning_rate": 3.586643835616438e-05,
"loss": 1.74,
"step": 36300
},
{
"epoch": 53.77,
"learning_rate": 3.575228310502283e-05,
"loss": 1.7331,
"step": 36400
},
{
"epoch": 53.91,
"learning_rate": 3.563812785388128e-05,
"loss": 1.7479,
"step": 36500
},
{
"epoch": 53.91,
"eval_cer": 0.22810680586227666,
"eval_loss": 0.8762161731719971,
"eval_runtime": 112.6782,
"eval_samples_per_second": 17.936,
"eval_steps_per_second": 2.245,
"eval_wer": 0.8753092528451262,
"step": 36500
},
{
"epoch": 54.06,
"learning_rate": 3.5523972602739725e-05,
"loss": 1.745,
"step": 36600
},
{
"epoch": 54.21,
"learning_rate": 3.540981735159817e-05,
"loss": 1.7267,
"step": 36700
},
{
"epoch": 54.36,
"learning_rate": 3.5295662100456614e-05,
"loss": 1.7239,
"step": 36800
},
{
"epoch": 54.5,
"learning_rate": 3.518150684931506e-05,
"loss": 1.7326,
"step": 36900
},
{
"epoch": 54.65,
"learning_rate": 3.506735159817351e-05,
"loss": 1.7428,
"step": 37000
},
{
"epoch": 54.65,
"eval_cer": 0.22766512748444087,
"eval_loss": 0.8732947707176208,
"eval_runtime": 114.6142,
"eval_samples_per_second": 17.633,
"eval_steps_per_second": 2.207,
"eval_wer": 0.8698664027709055,
"step": 37000
},
{
"epoch": 54.8,
"learning_rate": 3.495319634703196e-05,
"loss": 1.7414,
"step": 37100
},
{
"epoch": 54.95,
"learning_rate": 3.4839041095890406e-05,
"loss": 1.7484,
"step": 37200
},
{
"epoch": 55.1,
"learning_rate": 3.4724885844748854e-05,
"loss": 1.6943,
"step": 37300
},
{
"epoch": 55.24,
"learning_rate": 3.46107305936073e-05,
"loss": 1.7224,
"step": 37400
},
{
"epoch": 55.39,
"learning_rate": 3.449657534246575e-05,
"loss": 1.7058,
"step": 37500
},
{
"epoch": 55.39,
"eval_cer": 0.22625978719132706,
"eval_loss": 0.8816365003585815,
"eval_runtime": 114.0721,
"eval_samples_per_second": 17.717,
"eval_steps_per_second": 2.218,
"eval_wer": 0.8649183572488867,
"step": 37500
},
{
"epoch": 55.54,
"learning_rate": 3.43824200913242e-05,
"loss": 1.7052,
"step": 37600
},
{
"epoch": 55.69,
"learning_rate": 3.4268264840182646e-05,
"loss": 1.711,
"step": 37700
},
{
"epoch": 55.83,
"learning_rate": 3.415525114155251e-05,
"loss": 1.7245,
"step": 37800
},
{
"epoch": 55.98,
"learning_rate": 3.4041095890410956e-05,
"loss": 1.7193,
"step": 37900
},
{
"epoch": 56.13,
"learning_rate": 3.3926940639269404e-05,
"loss": 1.7045,
"step": 38000
},
{
"epoch": 56.13,
"eval_cer": 0.2296727564746035,
"eval_loss": 0.8732736110687256,
"eval_runtime": 115.1044,
"eval_samples_per_second": 17.558,
"eval_steps_per_second": 2.198,
"eval_wer": 0.8688767936665017,
"step": 38000
},
{
"epoch": 56.28,
"learning_rate": 3.381278538812785e-05,
"loss": 1.7185,
"step": 38100
},
{
"epoch": 56.43,
"learning_rate": 3.36986301369863e-05,
"loss": 1.6965,
"step": 38200
},
{
"epoch": 56.57,
"learning_rate": 3.358447488584475e-05,
"loss": 1.6843,
"step": 38300
},
{
"epoch": 56.72,
"learning_rate": 3.347031963470319e-05,
"loss": 1.7138,
"step": 38400
},
{
"epoch": 56.87,
"learning_rate": 3.335616438356164e-05,
"loss": 1.709,
"step": 38500
},
{
"epoch": 56.87,
"eval_cer": 0.22320819112627988,
"eval_loss": 0.8648238182067871,
"eval_runtime": 113.8724,
"eval_samples_per_second": 17.748,
"eval_steps_per_second": 2.222,
"eval_wer": 0.8654131618010885,
"step": 38500
},
{
"epoch": 57.02,
"learning_rate": 3.3242009132420085e-05,
"loss": 1.6913,
"step": 38600
},
{
"epoch": 57.16,
"learning_rate": 3.312785388127853e-05,
"loss": 1.6798,
"step": 38700
},
{
"epoch": 57.31,
"learning_rate": 3.301369863013698e-05,
"loss": 1.6548,
"step": 38800
},
{
"epoch": 57.46,
"learning_rate": 3.289954337899543e-05,
"loss": 1.6862,
"step": 38900
},
{
"epoch": 57.61,
"learning_rate": 3.278538812785388e-05,
"loss": 1.6799,
"step": 39000
},
{
"epoch": 57.61,
"eval_cer": 0.22441276852037745,
"eval_loss": 0.8717127442359924,
"eval_runtime": 113.7564,
"eval_samples_per_second": 17.766,
"eval_steps_per_second": 2.224,
"eval_wer": 0.8579910935180604,
"step": 39000
},
{
"epoch": 57.75,
"learning_rate": 3.2671232876712325e-05,
"loss": 1.6937,
"step": 39100
},
{
"epoch": 57.9,
"learning_rate": 3.255707762557077e-05,
"loss": 1.6659,
"step": 39200
},
{
"epoch": 58.05,
"learning_rate": 3.244292237442922e-05,
"loss": 1.7202,
"step": 39300
},
{
"epoch": 58.2,
"learning_rate": 3.232876712328767e-05,
"loss": 1.6737,
"step": 39400
},
{
"epoch": 58.35,
"learning_rate": 3.221461187214612e-05,
"loss": 1.664,
"step": 39500
},
{
"epoch": 58.35,
"eval_cer": 0.225938566552901,
"eval_loss": 0.8653290867805481,
"eval_runtime": 114.0905,
"eval_samples_per_second": 17.714,
"eval_steps_per_second": 2.218,
"eval_wer": 0.8723404255319149,
"step": 39500
},
{
"epoch": 58.49,
"learning_rate": 3.2100456621004565e-05,
"loss": 1.6909,
"step": 39600
},
{
"epoch": 58.64,
"learning_rate": 3.198630136986301e-05,
"loss": 1.6565,
"step": 39700
},
{
"epoch": 58.79,
"learning_rate": 3.1872146118721454e-05,
"loss": 1.6563,
"step": 39800
},
{
"epoch": 58.94,
"learning_rate": 3.17579908675799e-05,
"loss": 1.658,
"step": 39900
},
{
"epoch": 59.08,
"learning_rate": 3.164383561643835e-05,
"loss": 1.6488,
"step": 40000
},
{
"epoch": 59.08,
"eval_cer": 0.22710299136719533,
"eval_loss": 0.8637419939041138,
"eval_runtime": 114.7268,
"eval_samples_per_second": 17.616,
"eval_steps_per_second": 2.205,
"eval_wer": 0.880257298367145,
"step": 40000
},
{
"epoch": 59.23,
"learning_rate": 3.15296803652968e-05,
"loss": 1.6174,
"step": 40100
},
{
"epoch": 59.38,
"learning_rate": 3.1415525114155246e-05,
"loss": 1.6634,
"step": 40200
},
{
"epoch": 59.53,
"learning_rate": 3.1301369863013694e-05,
"loss": 1.649,
"step": 40300
},
{
"epoch": 59.67,
"learning_rate": 3.118721461187214e-05,
"loss": 1.645,
"step": 40400
},
{
"epoch": 59.82,
"learning_rate": 3.107305936073059e-05,
"loss": 1.6298,
"step": 40500
},
{
"epoch": 59.82,
"eval_cer": 0.22533627785585225,
"eval_loss": 0.8553184866905212,
"eval_runtime": 113.9415,
"eval_samples_per_second": 17.737,
"eval_steps_per_second": 2.22,
"eval_wer": 0.8767936665017318,
"step": 40500
},
{
"epoch": 59.97,
"learning_rate": 3.096004566210045e-05,
"loss": 1.6439,
"step": 40600
},
{
"epoch": 60.12,
"learning_rate": 3.08458904109589e-05,
"loss": 1.645,
"step": 40700
},
{
"epoch": 60.27,
"learning_rate": 3.073173515981735e-05,
"loss": 1.6105,
"step": 40800
},
{
"epoch": 60.41,
"learning_rate": 3.0617579908675796e-05,
"loss": 1.6258,
"step": 40900
},
{
"epoch": 60.56,
"learning_rate": 3.050342465753424e-05,
"loss": 1.6185,
"step": 41000
},
{
"epoch": 60.56,
"eval_cer": 0.2240112427223449,
"eval_loss": 0.8511665463447571,
"eval_runtime": 113.6325,
"eval_samples_per_second": 17.785,
"eval_steps_per_second": 2.226,
"eval_wer": 0.871845620979713,
"step": 41000
},
{
"epoch": 60.71,
"learning_rate": 3.038926940639269e-05,
"loss": 1.6054,
"step": 41100
},
{
"epoch": 60.86,
"learning_rate": 3.0275114155251137e-05,
"loss": 1.6495,
"step": 41200
},
{
"epoch": 61.0,
"learning_rate": 3.0160958904109585e-05,
"loss": 1.6341,
"step": 41300
},
{
"epoch": 61.15,
"learning_rate": 3.0046803652968033e-05,
"loss": 1.6092,
"step": 41400
},
{
"epoch": 61.3,
"learning_rate": 2.993264840182648e-05,
"loss": 1.574,
"step": 41500
},
{
"epoch": 61.3,
"eval_cer": 0.22509536237703273,
"eval_loss": 0.8579218983650208,
"eval_runtime": 114.0127,
"eval_samples_per_second": 17.726,
"eval_steps_per_second": 2.219,
"eval_wer": 0.8772884710539337,
"step": 41500
},
{
"epoch": 61.45,
"learning_rate": 2.981849315068493e-05,
"loss": 1.604,
"step": 41600
},
{
"epoch": 61.6,
"learning_rate": 2.9704337899543373e-05,
"loss": 1.6208,
"step": 41700
},
{
"epoch": 61.74,
"learning_rate": 2.959018264840182e-05,
"loss": 1.5976,
"step": 41800
},
{
"epoch": 61.89,
"learning_rate": 2.947602739726027e-05,
"loss": 1.6118,
"step": 41900
},
{
"epoch": 62.04,
"learning_rate": 2.9361872146118717e-05,
"loss": 1.6192,
"step": 42000
},
{
"epoch": 62.04,
"eval_cer": 0.22421200562136118,
"eval_loss": 0.8499256372451782,
"eval_runtime": 115.1721,
"eval_samples_per_second": 17.548,
"eval_steps_per_second": 2.197,
"eval_wer": 0.8743196437407225,
"step": 42000
},
{
"epoch": 62.19,
"learning_rate": 2.9247716894977165e-05,
"loss": 1.5818,
"step": 42100
},
{
"epoch": 62.33,
"learning_rate": 2.9133561643835613e-05,
"loss": 1.5852,
"step": 42200
},
{
"epoch": 62.48,
"learning_rate": 2.901940639269406e-05,
"loss": 1.6057,
"step": 42300
},
{
"epoch": 62.63,
"learning_rate": 2.8905251141552506e-05,
"loss": 1.5922,
"step": 42400
},
{
"epoch": 62.78,
"learning_rate": 2.8791095890410954e-05,
"loss": 1.6275,
"step": 42500
},
{
"epoch": 62.78,
"eval_cer": 0.22160208793414976,
"eval_loss": 0.8418570756912231,
"eval_runtime": 114.0321,
"eval_samples_per_second": 17.723,
"eval_steps_per_second": 2.219,
"eval_wer": 0.875804057397328,
"step": 42500
},
{
"epoch": 62.92,
"learning_rate": 2.8676940639269402e-05,
"loss": 1.5781,
"step": 42600
},
{
"epoch": 63.07,
"learning_rate": 2.856278538812785e-05,
"loss": 1.5754,
"step": 42700
},
{
"epoch": 63.22,
"learning_rate": 2.8449771689497715e-05,
"loss": 1.5775,
"step": 42800
},
{
"epoch": 63.37,
"learning_rate": 2.8335616438356163e-05,
"loss": 1.568,
"step": 42900
},
{
"epoch": 63.52,
"learning_rate": 2.822146118721461e-05,
"loss": 1.5697,
"step": 43000
},
{
"epoch": 63.52,
"eval_cer": 0.2221642240513953,
"eval_loss": 0.8445881009101868,
"eval_runtime": 114.2892,
"eval_samples_per_second": 17.683,
"eval_steps_per_second": 2.214,
"eval_wer": 0.8698664027709055,
"step": 43000
},
{
"epoch": 63.66,
"learning_rate": 2.810730593607306e-05,
"loss": 1.6005,
"step": 43100
},
{
"epoch": 63.81,
"learning_rate": 2.7993150684931507e-05,
"loss": 1.5897,
"step": 43200
},
{
"epoch": 63.96,
"learning_rate": 2.7878995433789955e-05,
"loss": 1.5433,
"step": 43300
},
{
"epoch": 64.11,
"learning_rate": 2.7764840182648403e-05,
"loss": 1.5925,
"step": 43400
},
{
"epoch": 64.25,
"learning_rate": 2.7650684931506847e-05,
"loss": 1.5384,
"step": 43500
},
{
"epoch": 64.25,
"eval_cer": 0.21995583216221642,
"eval_loss": 0.8461813926696777,
"eval_runtime": 113.6821,
"eval_samples_per_second": 17.778,
"eval_steps_per_second": 2.226,
"eval_wer": 0.8579910935180604,
"step": 43500
},
{
"epoch": 64.4,
"learning_rate": 2.7536529680365295e-05,
"loss": 1.5826,
"step": 43600
},
{
"epoch": 64.55,
"learning_rate": 2.7422374429223743e-05,
"loss": 1.5888,
"step": 43700
},
{
"epoch": 64.7,
"learning_rate": 2.730821917808219e-05,
"loss": 1.5746,
"step": 43800
},
{
"epoch": 64.84,
"learning_rate": 2.719406392694064e-05,
"loss": 1.5332,
"step": 43900
},
{
"epoch": 64.99,
"learning_rate": 2.7079908675799087e-05,
"loss": 1.5115,
"step": 44000
},
{
"epoch": 64.99,
"eval_cer": 0.22140132503513352,
"eval_loss": 0.8466500043869019,
"eval_runtime": 113.7712,
"eval_samples_per_second": 17.764,
"eval_steps_per_second": 2.224,
"eval_wer": 0.867392380009896,
"step": 44000
},
{
"epoch": 65.14,
"learning_rate": 2.6965753424657535e-05,
"loss": 1.5704,
"step": 44100
},
{
"epoch": 65.29,
"learning_rate": 2.685159817351598e-05,
"loss": 1.5518,
"step": 44200
},
{
"epoch": 65.44,
"learning_rate": 2.6737442922374428e-05,
"loss": 1.5502,
"step": 44300
},
{
"epoch": 65.58,
"learning_rate": 2.6623287671232876e-05,
"loss": 1.5401,
"step": 44400
},
{
"epoch": 65.73,
"learning_rate": 2.6509132420091324e-05,
"loss": 1.5547,
"step": 44500
},
{
"epoch": 65.73,
"eval_cer": 0.22043766311985544,
"eval_loss": 0.8505166172981262,
"eval_runtime": 114.0059,
"eval_samples_per_second": 17.727,
"eval_steps_per_second": 2.219,
"eval_wer": 0.8668975754576942,
"step": 44500
},
{
"epoch": 65.88,
"learning_rate": 2.6394977168949772e-05,
"loss": 1.5391,
"step": 44600
},
{
"epoch": 66.03,
"learning_rate": 2.628082191780822e-05,
"loss": 1.5263,
"step": 44700
},
{
"epoch": 66.17,
"learning_rate": 2.6166666666666668e-05,
"loss": 1.5159,
"step": 44800
},
{
"epoch": 66.32,
"learning_rate": 2.6052511415525113e-05,
"loss": 1.5416,
"step": 44900
},
{
"epoch": 66.47,
"learning_rate": 2.593835616438356e-05,
"loss": 1.5597,
"step": 45000
},
{
"epoch": 66.47,
"eval_cer": 0.2192330857257579,
"eval_loss": 0.8420690298080444,
"eval_runtime": 114.4813,
"eval_samples_per_second": 17.654,
"eval_steps_per_second": 2.21,
"eval_wer": 0.8683819891142999,
"step": 45000
},
{
"epoch": 66.62,
"learning_rate": 2.582420091324201e-05,
"loss": 1.5107,
"step": 45100
},
{
"epoch": 66.76,
"learning_rate": 2.5710045662100457e-05,
"loss": 1.5373,
"step": 45200
},
{
"epoch": 66.91,
"learning_rate": 2.5595890410958905e-05,
"loss": 1.503,
"step": 45300
},
{
"epoch": 67.06,
"learning_rate": 2.5482876712328766e-05,
"loss": 1.5408,
"step": 45400
},
{
"epoch": 67.21,
"learning_rate": 2.5368721461187214e-05,
"loss": 1.505,
"step": 45500
},
{
"epoch": 67.21,
"eval_cer": 0.21867094960851235,
"eval_loss": 0.8485424518585205,
"eval_runtime": 113.1044,
"eval_samples_per_second": 17.868,
"eval_steps_per_second": 2.237,
"eval_wer": 0.8619495299356754,
"step": 45500
},
{
"epoch": 67.36,
"learning_rate": 2.5254566210045662e-05,
"loss": 1.5071,
"step": 45600
},
{
"epoch": 67.5,
"learning_rate": 2.514041095890411e-05,
"loss": 1.5392,
"step": 45700
},
{
"epoch": 67.65,
"learning_rate": 2.5026255707762555e-05,
"loss": 1.5284,
"step": 45800
},
{
"epoch": 67.8,
"learning_rate": 2.4912100456621003e-05,
"loss": 1.5282,
"step": 45900
},
{
"epoch": 67.95,
"learning_rate": 2.479794520547945e-05,
"loss": 1.5101,
"step": 46000
},
{
"epoch": 67.95,
"eval_cer": 0.22035735796024894,
"eval_loss": 0.8489089012145996,
"eval_runtime": 114.6545,
"eval_samples_per_second": 17.627,
"eval_steps_per_second": 2.207,
"eval_wer": 0.8649183572488867,
"step": 46000
},
{
"epoch": 68.09,
"learning_rate": 2.46837899543379e-05,
"loss": 1.503,
"step": 46100
},
{
"epoch": 68.24,
"learning_rate": 2.4569634703196347e-05,
"loss": 1.5194,
"step": 46200
},
{
"epoch": 68.39,
"learning_rate": 2.4455479452054795e-05,
"loss": 1.493,
"step": 46300
},
{
"epoch": 68.54,
"learning_rate": 2.434132420091324e-05,
"loss": 1.5327,
"step": 46400
},
{
"epoch": 68.69,
"learning_rate": 2.4227168949771687e-05,
"loss": 1.5199,
"step": 46500
},
{
"epoch": 68.69,
"eval_cer": 0.21802850833166032,
"eval_loss": 0.8407037258148193,
"eval_runtime": 114.1903,
"eval_samples_per_second": 17.699,
"eval_steps_per_second": 2.216,
"eval_wer": 0.8619495299356754,
"step": 46500
},
{
"epoch": 68.83,
"learning_rate": 2.4113013698630135e-05,
"loss": 1.489,
"step": 46600
},
{
"epoch": 68.98,
"learning_rate": 2.3998858447488583e-05,
"loss": 1.4968,
"step": 46700
},
{
"epoch": 69.13,
"learning_rate": 2.388470319634703e-05,
"loss": 1.4959,
"step": 46800
},
{
"epoch": 69.28,
"learning_rate": 2.377054794520548e-05,
"loss": 1.4913,
"step": 46900
},
{
"epoch": 69.42,
"learning_rate": 2.3656392694063927e-05,
"loss": 1.5207,
"step": 47000
},
{
"epoch": 69.42,
"eval_cer": 0.2162617948203172,
"eval_loss": 0.8378761410713196,
"eval_runtime": 113.9918,
"eval_samples_per_second": 17.729,
"eval_steps_per_second": 2.219,
"eval_wer": 0.8495794161306284,
"step": 47000
},
{
"epoch": 69.57,
"learning_rate": 2.3542237442922372e-05,
"loss": 1.4881,
"step": 47100
},
{
"epoch": 69.72,
"learning_rate": 2.342808219178082e-05,
"loss": 1.4951,
"step": 47200
},
{
"epoch": 69.87,
"learning_rate": 2.3313926940639268e-05,
"loss": 1.5063,
"step": 47300
},
{
"epoch": 70.01,
"learning_rate": 2.320091324200913e-05,
"loss": 1.4925,
"step": 47400
},
{
"epoch": 70.16,
"learning_rate": 2.3086757990867578e-05,
"loss": 1.478,
"step": 47500
},
{
"epoch": 70.16,
"eval_cer": 0.2163420999799237,
"eval_loss": 0.835663914680481,
"eval_runtime": 115.4983,
"eval_samples_per_second": 17.498,
"eval_steps_per_second": 2.191,
"eval_wer": 0.859475507174666,
"step": 47500
},
{
"epoch": 70.31,
"learning_rate": 2.2972602739726026e-05,
"loss": 1.4823,
"step": 47600
},
{
"epoch": 70.46,
"learning_rate": 2.2858447488584474e-05,
"loss": 1.5068,
"step": 47700
},
{
"epoch": 70.61,
"learning_rate": 2.2744292237442922e-05,
"loss": 1.5096,
"step": 47800
},
{
"epoch": 70.75,
"learning_rate": 2.263013698630137e-05,
"loss": 1.4897,
"step": 47900
},
{
"epoch": 70.9,
"learning_rate": 2.2515981735159814e-05,
"loss": 1.4817,
"step": 48000
},
{
"epoch": 70.9,
"eval_cer": 0.21513752258582614,
"eval_loss": 0.8346221446990967,
"eval_runtime": 113.9435,
"eval_samples_per_second": 17.737,
"eval_steps_per_second": 2.22,
"eval_wer": 0.8495794161306284,
"step": 48000
},
{
"epoch": 71.05,
"learning_rate": 2.2401826484018262e-05,
"loss": 1.5342,
"step": 48100
},
{
"epoch": 71.2,
"learning_rate": 2.228767123287671e-05,
"loss": 1.4723,
"step": 48200
},
{
"epoch": 71.34,
"learning_rate": 2.217351598173516e-05,
"loss": 1.4929,
"step": 48300
},
{
"epoch": 71.49,
"learning_rate": 2.2059360730593606e-05,
"loss": 1.4785,
"step": 48400
},
{
"epoch": 71.64,
"learning_rate": 2.1945205479452054e-05,
"loss": 1.4827,
"step": 48500
},
{
"epoch": 71.64,
"eval_cer": 0.216864083517366,
"eval_loss": 0.8362293243408203,
"eval_runtime": 114.6857,
"eval_samples_per_second": 17.622,
"eval_steps_per_second": 2.206,
"eval_wer": 0.8624443344878773,
"step": 48500
},
{
"epoch": 71.79,
"learning_rate": 2.1831050228310502e-05,
"loss": 1.4732,
"step": 48600
},
{
"epoch": 71.93,
"learning_rate": 2.1716894977168947e-05,
"loss": 1.4611,
"step": 48700
},
{
"epoch": 72.08,
"learning_rate": 2.1602739726027395e-05,
"loss": 1.4621,
"step": 48800
},
{
"epoch": 72.23,
"learning_rate": 2.1488584474885843e-05,
"loss": 1.4636,
"step": 48900
},
{
"epoch": 72.38,
"learning_rate": 2.137442922374429e-05,
"loss": 1.4513,
"step": 49000
},
{
"epoch": 72.38,
"eval_cer": 0.21369202971290904,
"eval_loss": 0.835486888885498,
"eval_runtime": 113.6809,
"eval_samples_per_second": 17.778,
"eval_steps_per_second": 2.226,
"eval_wer": 0.8451261751608115,
"step": 49000
},
{
"epoch": 72.53,
"learning_rate": 2.126027397260274e-05,
"loss": 1.4469,
"step": 49100
},
{
"epoch": 72.67,
"learning_rate": 2.1146118721461187e-05,
"loss": 1.4521,
"step": 49200
},
{
"epoch": 72.82,
"learning_rate": 2.1031963470319635e-05,
"loss": 1.4285,
"step": 49300
},
{
"epoch": 72.97,
"learning_rate": 2.091780821917808e-05,
"loss": 1.4663,
"step": 49400
},
{
"epoch": 73.12,
"learning_rate": 2.0803652968036527e-05,
"loss": 1.4988,
"step": 49500
},
{
"epoch": 73.12,
"eval_cer": 0.21606103192130094,
"eval_loss": 0.8324964642524719,
"eval_runtime": 114.8092,
"eval_samples_per_second": 17.603,
"eval_steps_per_second": 2.204,
"eval_wer": 0.8624443344878773,
"step": 49500
},
{
"epoch": 73.26,
"learning_rate": 2.0689497716894975e-05,
"loss": 1.4531,
"step": 49600
},
{
"epoch": 73.41,
"learning_rate": 2.0576484018264837e-05,
"loss": 1.4415,
"step": 49700
},
{
"epoch": 73.56,
"learning_rate": 2.0462328767123285e-05,
"loss": 1.4415,
"step": 49800
},
{
"epoch": 73.71,
"learning_rate": 2.0348173515981733e-05,
"loss": 1.4495,
"step": 49900
},
{
"epoch": 73.85,
"learning_rate": 2.023401826484018e-05,
"loss": 1.4267,
"step": 50000
},
{
"epoch": 73.85,
"eval_cer": 0.21565950612326842,
"eval_loss": 0.8395733833312988,
"eval_runtime": 113.3592,
"eval_samples_per_second": 17.828,
"eval_steps_per_second": 2.232,
"eval_wer": 0.8480950024740228,
"step": 50000
},
{
"epoch": 74.0,
"learning_rate": 2.011986301369863e-05,
"loss": 1.4187,
"step": 50100
},
{
"epoch": 74.15,
"learning_rate": 2.0005707762557077e-05,
"loss": 1.4261,
"step": 50200
},
{
"epoch": 74.3,
"learning_rate": 1.9891552511415522e-05,
"loss": 1.3826,
"step": 50300
},
{
"epoch": 74.45,
"learning_rate": 1.977739726027397e-05,
"loss": 1.4491,
"step": 50400
},
{
"epoch": 74.59,
"learning_rate": 1.9663242009132418e-05,
"loss": 1.4421,
"step": 50500
},
{
"epoch": 74.59,
"eval_cer": 0.21216623168038545,
"eval_loss": 0.8354990482330322,
"eval_runtime": 114.0851,
"eval_samples_per_second": 17.715,
"eval_steps_per_second": 2.218,
"eval_wer": 0.8490846115784265,
"step": 50500
},
{
"epoch": 74.74,
"learning_rate": 1.9549086757990866e-05,
"loss": 1.4689,
"step": 50600
},
{
"epoch": 74.89,
"learning_rate": 1.9434931506849314e-05,
"loss": 1.4471,
"step": 50700
},
{
"epoch": 75.04,
"learning_rate": 1.9320776255707762e-05,
"loss": 1.4333,
"step": 50800
},
{
"epoch": 75.18,
"learning_rate": 1.920662100456621e-05,
"loss": 1.4211,
"step": 50900
},
{
"epoch": 75.33,
"learning_rate": 1.9092465753424654e-05,
"loss": 1.4311,
"step": 51000
},
{
"epoch": 75.33,
"eval_cer": 0.2118048584621562,
"eval_loss": 0.8357799649238586,
"eval_runtime": 112.9085,
"eval_samples_per_second": 17.899,
"eval_steps_per_second": 2.241,
"eval_wer": 0.8476001979218208,
"step": 51000
},
{
"epoch": 75.48,
"learning_rate": 1.8978310502283102e-05,
"loss": 1.4136,
"step": 51100
},
{
"epoch": 75.63,
"learning_rate": 1.886415525114155e-05,
"loss": 1.4144,
"step": 51200
},
{
"epoch": 75.78,
"learning_rate": 1.875e-05,
"loss": 1.4479,
"step": 51300
},
{
"epoch": 75.92,
"learning_rate": 1.8635844748858446e-05,
"loss": 1.4218,
"step": 51400
},
{
"epoch": 76.07,
"learning_rate": 1.8521689497716894e-05,
"loss": 1.4174,
"step": 51500
},
{
"epoch": 76.07,
"eval_cer": 0.21007829753061635,
"eval_loss": 0.8288608193397522,
"eval_runtime": 114.429,
"eval_samples_per_second": 17.662,
"eval_steps_per_second": 2.211,
"eval_wer": 0.8451261751608115,
"step": 51500
},
{
"epoch": 76.22,
"learning_rate": 1.8407534246575342e-05,
"loss": 1.4225,
"step": 51600
},
{
"epoch": 76.37,
"learning_rate": 1.8294520547945204e-05,
"loss": 1.4181,
"step": 51700
},
{
"epoch": 76.51,
"learning_rate": 1.8180365296803652e-05,
"loss": 1.3998,
"step": 51800
},
{
"epoch": 76.66,
"learning_rate": 1.8066210045662097e-05,
"loss": 1.4383,
"step": 51900
},
{
"epoch": 76.81,
"learning_rate": 1.7952054794520545e-05,
"loss": 1.4349,
"step": 52000
},
{
"epoch": 76.81,
"eval_cer": 0.21401325035133506,
"eval_loss": 0.8371652960777283,
"eval_runtime": 113.9028,
"eval_samples_per_second": 17.743,
"eval_steps_per_second": 2.221,
"eval_wer": 0.8579910935180604,
"step": 52000
},
{
"epoch": 76.96,
"learning_rate": 1.7837899543378993e-05,
"loss": 1.4007,
"step": 52100
},
{
"epoch": 77.1,
"learning_rate": 1.772374429223744e-05,
"loss": 1.4512,
"step": 52200
},
{
"epoch": 77.25,
"learning_rate": 1.760958904109589e-05,
"loss": 1.3999,
"step": 52300
},
{
"epoch": 77.4,
"learning_rate": 1.7495433789954337e-05,
"loss": 1.4224,
"step": 52400
},
{
"epoch": 77.55,
"learning_rate": 1.7381278538812785e-05,
"loss": 1.3959,
"step": 52500
},
{
"epoch": 77.55,
"eval_cer": 0.21156394298333667,
"eval_loss": 0.8324997425079346,
"eval_runtime": 112.9164,
"eval_samples_per_second": 17.898,
"eval_steps_per_second": 2.241,
"eval_wer": 0.8436417615042059,
"step": 52500
},
{
"epoch": 77.7,
"learning_rate": 1.726712328767123e-05,
"loss": 1.4086,
"step": 52600
},
{
"epoch": 77.84,
"learning_rate": 1.7152968036529677e-05,
"loss": 1.4345,
"step": 52700
},
{
"epoch": 77.99,
"learning_rate": 1.7038812785388125e-05,
"loss": 1.3828,
"step": 52800
},
{
"epoch": 78.14,
"learning_rate": 1.6924657534246573e-05,
"loss": 1.4159,
"step": 52900
},
{
"epoch": 78.29,
"learning_rate": 1.681050228310502e-05,
"loss": 1.4087,
"step": 53000
},
{
"epoch": 78.29,
"eval_cer": 0.21051997590845212,
"eval_loss": 0.8351333141326904,
"eval_runtime": 114.5275,
"eval_samples_per_second": 17.646,
"eval_steps_per_second": 2.209,
"eval_wer": 0.8446313706086096,
"step": 53000
},
{
"epoch": 78.43,
"learning_rate": 1.669634703196347e-05,
"loss": 1.4303,
"step": 53100
},
{
"epoch": 78.58,
"learning_rate": 1.6582191780821917e-05,
"loss": 1.4233,
"step": 53200
},
{
"epoch": 78.73,
"learning_rate": 1.6468036529680362e-05,
"loss": 1.3758,
"step": 53300
},
{
"epoch": 78.88,
"learning_rate": 1.635388127853881e-05,
"loss": 1.3703,
"step": 53400
},
{
"epoch": 79.03,
"learning_rate": 1.6239726027397258e-05,
"loss": 1.415,
"step": 53500
},
{
"epoch": 79.03,
"eval_cer": 0.21228668941979523,
"eval_loss": 0.8363248109817505,
"eval_runtime": 115.4621,
"eval_samples_per_second": 17.504,
"eval_steps_per_second": 2.191,
"eval_wer": 0.8476001979218208,
"step": 53500
},
{
"epoch": 79.17,
"learning_rate": 1.6125570776255706e-05,
"loss": 1.3768,
"step": 53600
},
{
"epoch": 79.32,
"learning_rate": 1.6011415525114154e-05,
"loss": 1.399,
"step": 53700
},
{
"epoch": 79.47,
"learning_rate": 1.5897260273972602e-05,
"loss": 1.4076,
"step": 53800
},
{
"epoch": 79.62,
"learning_rate": 1.5784246575342464e-05,
"loss": 1.3912,
"step": 53900
},
{
"epoch": 79.76,
"learning_rate": 1.567009132420091e-05,
"loss": 1.4122,
"step": 54000
},
{
"epoch": 79.76,
"eval_cer": 0.21116241718530415,
"eval_loss": 0.8309991359710693,
"eval_runtime": 113.1017,
"eval_samples_per_second": 17.869,
"eval_steps_per_second": 2.237,
"eval_wer": 0.8480950024740228,
"step": 54000
},
{
"epoch": 79.91,
"learning_rate": 1.5557077625570773e-05,
"loss": 1.3916,
"step": 54100
},
{
"epoch": 80.06,
"learning_rate": 1.544292237442922e-05,
"loss": 1.4167,
"step": 54200
},
{
"epoch": 80.21,
"learning_rate": 1.532876712328767e-05,
"loss": 1.4019,
"step": 54300
},
{
"epoch": 80.35,
"learning_rate": 1.5214611872146117e-05,
"loss": 1.3909,
"step": 54400
},
{
"epoch": 80.5,
"learning_rate": 1.5100456621004565e-05,
"loss": 1.3969,
"step": 54500
},
{
"epoch": 80.5,
"eval_cer": 0.20951616141337082,
"eval_loss": 0.8239215612411499,
"eval_runtime": 113.6855,
"eval_samples_per_second": 17.777,
"eval_steps_per_second": 2.225,
"eval_wer": 0.8446313706086096,
"step": 54500
},
{
"epoch": 80.65,
"learning_rate": 1.4986301369863012e-05,
"loss": 1.3952,
"step": 54600
},
{
"epoch": 80.8,
"learning_rate": 1.487214611872146e-05,
"loss": 1.3998,
"step": 54700
},
{
"epoch": 80.94,
"learning_rate": 1.4757990867579908e-05,
"loss": 1.3902,
"step": 54800
},
{
"epoch": 81.09,
"learning_rate": 1.4643835616438356e-05,
"loss": 1.3526,
"step": 54900
},
{
"epoch": 81.24,
"learning_rate": 1.4529680365296802e-05,
"loss": 1.361,
"step": 55000
},
{
"epoch": 81.24,
"eval_cer": 0.20907448303553502,
"eval_loss": 0.8281779289245605,
"eval_runtime": 112.7357,
"eval_samples_per_second": 17.927,
"eval_steps_per_second": 2.244,
"eval_wer": 0.8426521523998021,
"step": 55000
},
{
"epoch": 81.39,
"learning_rate": 1.441552511415525e-05,
"loss": 1.4054,
"step": 55100
},
{
"epoch": 81.54,
"learning_rate": 1.4302511415525112e-05,
"loss": 1.4048,
"step": 55200
},
{
"epoch": 81.68,
"learning_rate": 1.418835616438356e-05,
"loss": 1.401,
"step": 55300
},
{
"epoch": 81.83,
"learning_rate": 1.4074200913242008e-05,
"loss": 1.3824,
"step": 55400
},
{
"epoch": 81.98,
"learning_rate": 1.3960045662100454e-05,
"loss": 1.3611,
"step": 55500
},
{
"epoch": 81.98,
"eval_cer": 0.20923509335474805,
"eval_loss": 0.8281756043434143,
"eval_runtime": 114.1698,
"eval_samples_per_second": 17.702,
"eval_steps_per_second": 2.216,
"eval_wer": 0.8406729341909945,
"step": 55500
},
{
"epoch": 82.13,
"learning_rate": 1.3845890410958902e-05,
"loss": 1.4021,
"step": 55600
},
{
"epoch": 82.27,
"learning_rate": 1.373173515981735e-05,
"loss": 1.3655,
"step": 55700
},
{
"epoch": 82.42,
"learning_rate": 1.3617579908675798e-05,
"loss": 1.368,
"step": 55800
},
{
"epoch": 82.57,
"learning_rate": 1.3503424657534244e-05,
"loss": 1.355,
"step": 55900
},
{
"epoch": 82.72,
"learning_rate": 1.3389269406392692e-05,
"loss": 1.3677,
"step": 56000
},
{
"epoch": 82.72,
"eval_cer": 0.2083517365990765,
"eval_loss": 0.8234991431236267,
"eval_runtime": 113.0903,
"eval_samples_per_second": 17.871,
"eval_steps_per_second": 2.237,
"eval_wer": 0.8436417615042059,
"step": 56000
},
{
"epoch": 82.87,
"learning_rate": 1.327511415525114e-05,
"loss": 1.3752,
"step": 56100
},
{
"epoch": 83.01,
"learning_rate": 1.3160958904109586e-05,
"loss": 1.3599,
"step": 56200
},
{
"epoch": 83.16,
"learning_rate": 1.3046803652968034e-05,
"loss": 1.331,
"step": 56300
},
{
"epoch": 83.31,
"learning_rate": 1.2932648401826482e-05,
"loss": 1.3881,
"step": 56400
},
{
"epoch": 83.46,
"learning_rate": 1.281849315068493e-05,
"loss": 1.3361,
"step": 56500
},
{
"epoch": 83.46,
"eval_cer": 0.20686609114635615,
"eval_loss": 0.8230801224708557,
"eval_runtime": 113.4808,
"eval_samples_per_second": 17.809,
"eval_steps_per_second": 2.229,
"eval_wer": 0.8377041068777833,
"step": 56500
},
{
"epoch": 83.6,
"learning_rate": 1.2704337899543377e-05,
"loss": 1.3507,
"step": 56600
},
{
"epoch": 83.75,
"learning_rate": 1.2590182648401825e-05,
"loss": 1.3529,
"step": 56700
},
{
"epoch": 83.9,
"learning_rate": 1.2476027397260273e-05,
"loss": 1.3656,
"step": 56800
},
{
"epoch": 84.05,
"learning_rate": 1.2361872146118719e-05,
"loss": 1.3621,
"step": 56900
},
{
"epoch": 84.19,
"learning_rate": 1.2247716894977167e-05,
"loss": 1.3779,
"step": 57000
},
{
"epoch": 84.19,
"eval_cer": 0.2069865488857659,
"eval_loss": 0.8206142783164978,
"eval_runtime": 112.7557,
"eval_samples_per_second": 17.924,
"eval_steps_per_second": 2.244,
"eval_wer": 0.8436417615042059,
"step": 57000
},
{
"epoch": 84.34,
"learning_rate": 1.2133561643835615e-05,
"loss": 1.3326,
"step": 57100
},
{
"epoch": 84.49,
"learning_rate": 1.2019406392694063e-05,
"loss": 1.3411,
"step": 57200
},
{
"epoch": 84.64,
"learning_rate": 1.190525114155251e-05,
"loss": 1.3424,
"step": 57300
},
{
"epoch": 84.79,
"learning_rate": 1.1791095890410957e-05,
"loss": 1.342,
"step": 57400
},
{
"epoch": 84.93,
"learning_rate": 1.1676940639269405e-05,
"loss": 1.3727,
"step": 57500
},
{
"epoch": 84.93,
"eval_cer": 0.20646456534832364,
"eval_loss": 0.8204257488250732,
"eval_runtime": 112.5887,
"eval_samples_per_second": 17.95,
"eval_steps_per_second": 2.247,
"eval_wer": 0.839188520534389,
"step": 57500
},
{
"epoch": 85.08,
"learning_rate": 1.1562785388127852e-05,
"loss": 1.3352,
"step": 57600
},
{
"epoch": 85.23,
"learning_rate": 1.14486301369863e-05,
"loss": 1.3232,
"step": 57700
},
{
"epoch": 85.38,
"learning_rate": 1.1334474885844748e-05,
"loss": 1.3534,
"step": 57800
},
{
"epoch": 85.52,
"learning_rate": 1.1220319634703194e-05,
"loss": 1.3834,
"step": 57900
},
{
"epoch": 85.67,
"learning_rate": 1.1106164383561642e-05,
"loss": 1.3317,
"step": 58000
},
{
"epoch": 85.67,
"eval_cer": 0.20654487050793013,
"eval_loss": 0.8206654787063599,
"eval_runtime": 113.345,
"eval_samples_per_second": 17.831,
"eval_steps_per_second": 2.232,
"eval_wer": 0.8436417615042059,
"step": 58000
},
{
"epoch": 85.82,
"learning_rate": 1.099200913242009e-05,
"loss": 1.3349,
"step": 58100
},
{
"epoch": 85.97,
"learning_rate": 1.0877853881278538e-05,
"loss": 1.326,
"step": 58200
},
{
"epoch": 86.12,
"learning_rate": 1.0763698630136984e-05,
"loss": 1.3541,
"step": 58300
},
{
"epoch": 86.26,
"learning_rate": 1.0649543378995432e-05,
"loss": 1.3306,
"step": 58400
},
{
"epoch": 86.41,
"learning_rate": 1.053538812785388e-05,
"loss": 1.3332,
"step": 58500
},
{
"epoch": 86.41,
"eval_cer": 0.20554105601284883,
"eval_loss": 0.818649172782898,
"eval_runtime": 113.2293,
"eval_samples_per_second": 17.849,
"eval_steps_per_second": 2.234,
"eval_wer": 0.8357248886689758,
"step": 58500
},
{
"epoch": 86.56,
"learning_rate": 1.0421232876712326e-05,
"loss": 1.3258,
"step": 58600
},
{
"epoch": 86.71,
"learning_rate": 1.0307077625570774e-05,
"loss": 1.3269,
"step": 58700
},
{
"epoch": 86.85,
"learning_rate": 1.0192922374429222e-05,
"loss": 1.3411,
"step": 58800
},
{
"epoch": 87.0,
"learning_rate": 1.007876712328767e-05,
"loss": 1.3136,
"step": 58900
},
{
"epoch": 87.15,
"learning_rate": 9.964611872146117e-06,
"loss": 1.3299,
"step": 59000
},
{
"epoch": 87.15,
"eval_cer": 0.20754868500301143,
"eval_loss": 0.8192667961120605,
"eval_runtime": 113.1322,
"eval_samples_per_second": 17.864,
"eval_steps_per_second": 2.236,
"eval_wer": 0.8416625432953984,
"step": 59000
},
{
"epoch": 87.3,
"learning_rate": 9.850456621004565e-06,
"loss": 1.3134,
"step": 59100
},
{
"epoch": 87.44,
"learning_rate": 9.736301369863013e-06,
"loss": 1.3108,
"step": 59200
},
{
"epoch": 87.59,
"learning_rate": 9.622146118721459e-06,
"loss": 1.3347,
"step": 59300
},
{
"epoch": 87.74,
"learning_rate": 9.507990867579907e-06,
"loss": 1.314,
"step": 59400
},
{
"epoch": 87.89,
"learning_rate": 9.393835616438355e-06,
"loss": 1.3129,
"step": 59500
},
{
"epoch": 87.89,
"eval_cer": 0.20650471792812689,
"eval_loss": 0.8182885050773621,
"eval_runtime": 112.6479,
"eval_samples_per_second": 17.941,
"eval_steps_per_second": 2.246,
"eval_wer": 0.8431469569520039,
"step": 59500
},
{
"epoch": 88.04,
"learning_rate": 9.279680365296803e-06,
"loss": 1.3839,
"step": 59600
},
{
"epoch": 88.18,
"learning_rate": 9.166666666666665e-06,
"loss": 1.3179,
"step": 59700
},
{
"epoch": 88.33,
"learning_rate": 9.052511415525113e-06,
"loss": 1.3065,
"step": 59800
},
{
"epoch": 88.48,
"learning_rate": 8.93835616438356e-06,
"loss": 1.3093,
"step": 59900
},
{
"epoch": 88.63,
"learning_rate": 8.824200913242009e-06,
"loss": 1.3352,
"step": 60000
},
{
"epoch": 88.63,
"eval_cer": 0.20622364986950412,
"eval_loss": 0.8150643110275269,
"eval_runtime": 112.8416,
"eval_samples_per_second": 17.91,
"eval_steps_per_second": 2.242,
"eval_wer": 0.847105393369619,
"step": 60000
},
{
"epoch": 88.77,
"learning_rate": 8.710045662100455e-06,
"loss": 1.3146,
"step": 60100
},
{
"epoch": 88.92,
"learning_rate": 8.595890410958903e-06,
"loss": 1.3185,
"step": 60200
},
{
"epoch": 89.07,
"learning_rate": 8.481735159817351e-06,
"loss": 1.291,
"step": 60300
},
{
"epoch": 89.22,
"learning_rate": 8.367579908675797e-06,
"loss": 1.2985,
"step": 60400
},
{
"epoch": 89.36,
"learning_rate": 8.253424657534245e-06,
"loss": 1.3026,
"step": 60500
},
{
"epoch": 89.36,
"eval_cer": 0.20666532824733988,
"eval_loss": 0.8124769330024719,
"eval_runtime": 113.2992,
"eval_samples_per_second": 17.838,
"eval_steps_per_second": 2.233,
"eval_wer": 0.8485898070262247,
"step": 60500
},
{
"epoch": 89.51,
"learning_rate": 8.139269406392693e-06,
"loss": 1.3266,
"step": 60600
},
{
"epoch": 89.66,
"learning_rate": 8.025114155251141e-06,
"loss": 1.2908,
"step": 60700
},
{
"epoch": 89.81,
"learning_rate": 7.910958904109588e-06,
"loss": 1.3219,
"step": 60800
},
{
"epoch": 89.96,
"learning_rate": 7.796803652968036e-06,
"loss": 1.3354,
"step": 60900
},
{
"epoch": 90.1,
"learning_rate": 7.682648401826484e-06,
"loss": 1.3468,
"step": 61000
},
{
"epoch": 90.1,
"eval_cer": 0.2058221240714716,
"eval_loss": 0.8124193549156189,
"eval_runtime": 113.1466,
"eval_samples_per_second": 17.862,
"eval_steps_per_second": 2.236,
"eval_wer": 0.8406729341909945,
"step": 61000
},
{
"epoch": 90.25,
"learning_rate": 7.568493150684931e-06,
"loss": 1.2959,
"step": 61100
},
{
"epoch": 90.4,
"learning_rate": 7.454337899543378e-06,
"loss": 1.3095,
"step": 61200
},
{
"epoch": 90.55,
"learning_rate": 7.340182648401826e-06,
"loss": 1.3018,
"step": 61300
},
{
"epoch": 90.69,
"learning_rate": 7.226027397260273e-06,
"loss": 1.3182,
"step": 61400
},
{
"epoch": 90.84,
"learning_rate": 7.111872146118721e-06,
"loss": 1.3028,
"step": 61500
},
{
"epoch": 90.84,
"eval_cer": 0.20509937763501304,
"eval_loss": 0.8122348189353943,
"eval_runtime": 113.8373,
"eval_samples_per_second": 17.753,
"eval_steps_per_second": 2.222,
"eval_wer": 0.8461157842652153,
"step": 61500
},
{
"epoch": 90.99,
"learning_rate": 6.997716894977168e-06,
"loss": 1.2779,
"step": 61600
},
{
"epoch": 91.14,
"learning_rate": 6.883561643835615e-06,
"loss": 1.3199,
"step": 61700
},
{
"epoch": 91.28,
"learning_rate": 6.769406392694063e-06,
"loss": 1.282,
"step": 61800
},
{
"epoch": 91.43,
"learning_rate": 6.6552511415525104e-06,
"loss": 1.3319,
"step": 61900
},
{
"epoch": 91.58,
"learning_rate": 6.5410958904109584e-06,
"loss": 1.2884,
"step": 62000
},
{
"epoch": 91.58,
"eval_cer": 0.20477815699658702,
"eval_loss": 0.8086355328559875,
"eval_runtime": 114.5869,
"eval_samples_per_second": 17.637,
"eval_steps_per_second": 2.208,
"eval_wer": 0.8426521523998021,
"step": 62000
},
{
"epoch": 91.73,
"learning_rate": 6.4269406392694056e-06,
"loss": 1.3206,
"step": 62100
},
{
"epoch": 91.88,
"learning_rate": 6.3127853881278536e-06,
"loss": 1.3219,
"step": 62200
},
{
"epoch": 92.02,
"learning_rate": 6.198630136986301e-06,
"loss": 1.2887,
"step": 62300
},
{
"epoch": 92.17,
"learning_rate": 6.084474885844748e-06,
"loss": 1.3125,
"step": 62400
},
{
"epoch": 92.32,
"learning_rate": 5.970319634703196e-06,
"loss": 1.3005,
"step": 62500
},
{
"epoch": 92.32,
"eval_cer": 0.2054607508532423,
"eval_loss": 0.8109722137451172,
"eval_runtime": 114.6224,
"eval_samples_per_second": 17.632,
"eval_steps_per_second": 2.207,
"eval_wer": 0.838693715982187,
"step": 62500
},
{
"epoch": 92.47,
"learning_rate": 5.856164383561643e-06,
"loss": 1.3115,
"step": 62600
},
{
"epoch": 92.61,
"learning_rate": 5.7431506849315064e-06,
"loss": 1.3024,
"step": 62700
},
{
"epoch": 92.76,
"learning_rate": 5.628995433789954e-06,
"loss": 1.2729,
"step": 62800
},
{
"epoch": 92.91,
"learning_rate": 5.514840182648402e-06,
"loss": 1.2953,
"step": 62900
},
{
"epoch": 93.06,
"learning_rate": 5.400684931506849e-06,
"loss": 1.2996,
"step": 63000
},
{
"epoch": 93.06,
"eval_cer": 0.20570166633206183,
"eval_loss": 0.8125805854797363,
"eval_runtime": 113.0806,
"eval_samples_per_second": 17.872,
"eval_steps_per_second": 2.237,
"eval_wer": 0.8327560613557645,
"step": 63000
},
{
"epoch": 93.21,
"learning_rate": 5.286529680365297e-06,
"loss": 1.3043,
"step": 63100
},
{
"epoch": 93.35,
"learning_rate": 5.172374429223744e-06,
"loss": 1.2749,
"step": 63200
},
{
"epoch": 93.5,
"learning_rate": 5.058219178082192e-06,
"loss": 1.2701,
"step": 63300
},
{
"epoch": 93.65,
"learning_rate": 4.944063926940639e-06,
"loss": 1.3151,
"step": 63400
},
{
"epoch": 93.8,
"learning_rate": 4.829908675799086e-06,
"loss": 1.2707,
"step": 63500
},
{
"epoch": 93.8,
"eval_cer": 0.20465769925717728,
"eval_loss": 0.8097530603408813,
"eval_runtime": 113.7446,
"eval_samples_per_second": 17.768,
"eval_steps_per_second": 2.224,
"eval_wer": 0.8401781296387927,
"step": 63500
},
{
"epoch": 93.94,
"learning_rate": 4.715753424657534e-06,
"loss": 1.2936,
"step": 63600
},
{
"epoch": 94.09,
"learning_rate": 4.601598173515981e-06,
"loss": 1.2972,
"step": 63700
},
{
"epoch": 94.24,
"learning_rate": 4.487442922374429e-06,
"loss": 1.2465,
"step": 63800
},
{
"epoch": 94.39,
"learning_rate": 4.3732876712328764e-06,
"loss": 1.3015,
"step": 63900
},
{
"epoch": 94.53,
"learning_rate": 4.2591324200913244e-06,
"loss": 1.3026,
"step": 64000
},
{
"epoch": 94.53,
"eval_cer": 0.20501907247540654,
"eval_loss": 0.8096847534179688,
"eval_runtime": 113.8078,
"eval_samples_per_second": 17.758,
"eval_steps_per_second": 2.223,
"eval_wer": 0.8401781296387927,
"step": 64000
},
{
"epoch": 94.68,
"learning_rate": 4.144977168949772e-06,
"loss": 1.3007,
"step": 64100
},
{
"epoch": 94.83,
"learning_rate": 4.030821917808219e-06,
"loss": 1.2671,
"step": 64200
},
{
"epoch": 94.98,
"learning_rate": 3.916666666666667e-06,
"loss": 1.2834,
"step": 64300
},
{
"epoch": 95.13,
"learning_rate": 3.802511415525114e-06,
"loss": 1.3017,
"step": 64400
},
{
"epoch": 95.27,
"learning_rate": 3.689497716894977e-06,
"loss": 1.2546,
"step": 64500
},
{
"epoch": 95.27,
"eval_cer": 0.2054607508532423,
"eval_loss": 0.8111132383346558,
"eval_runtime": 114.1208,
"eval_samples_per_second": 17.709,
"eval_steps_per_second": 2.217,
"eval_wer": 0.8401781296387927,
"step": 64500
},
{
"epoch": 95.42,
"learning_rate": 3.5753424657534245e-06,
"loss": 1.3115,
"step": 64600
},
{
"epoch": 95.57,
"learning_rate": 3.461187214611872e-06,
"loss": 1.2918,
"step": 64700
},
{
"epoch": 95.72,
"learning_rate": 3.347031963470319e-06,
"loss": 1.2863,
"step": 64800
},
{
"epoch": 95.86,
"learning_rate": 3.2328767123287667e-06,
"loss": 1.3075,
"step": 64900
},
{
"epoch": 96.01,
"learning_rate": 3.1187214611872143e-06,
"loss": 1.2426,
"step": 65000
},
{
"epoch": 96.01,
"eval_cer": 0.20594258181088135,
"eval_loss": 0.8087843656539917,
"eval_runtime": 113.7192,
"eval_samples_per_second": 17.772,
"eval_steps_per_second": 2.225,
"eval_wer": 0.8372093023255814,
"step": 65000
},
{
"epoch": 96.16,
"learning_rate": 3.004566210045662e-06,
"loss": 1.2996,
"step": 65100
},
{
"epoch": 96.31,
"learning_rate": 2.8904109589041095e-06,
"loss": 1.3113,
"step": 65200
},
{
"epoch": 96.45,
"learning_rate": 2.776255707762557e-06,
"loss": 1.287,
"step": 65300
},
{
"epoch": 96.6,
"learning_rate": 2.662100456621004e-06,
"loss": 1.2838,
"step": 65400
},
{
"epoch": 96.75,
"learning_rate": 2.5479452054794517e-06,
"loss": 1.2869,
"step": 65500
},
{
"epoch": 96.75,
"eval_cer": 0.20481830957639027,
"eval_loss": 0.8092992305755615,
"eval_runtime": 113.4179,
"eval_samples_per_second": 17.819,
"eval_steps_per_second": 2.231,
"eval_wer": 0.8396833250865908,
"step": 65500
},
{
"epoch": 96.9,
"learning_rate": 2.4337899543378993e-06,
"loss": 1.2994,
"step": 65600
},
{
"epoch": 97.05,
"learning_rate": 2.319634703196347e-06,
"loss": 1.2983,
"step": 65700
},
{
"epoch": 97.19,
"learning_rate": 2.2054794520547945e-06,
"loss": 1.2737,
"step": 65800
},
{
"epoch": 97.34,
"learning_rate": 2.091324200913242e-06,
"loss": 1.2965,
"step": 65900
},
{
"epoch": 97.49,
"learning_rate": 1.9771689497716896e-06,
"loss": 1.2782,
"step": 66000
},
{
"epoch": 97.49,
"eval_cer": 0.2048986147359968,
"eval_loss": 0.8099350929260254,
"eval_runtime": 113.4967,
"eval_samples_per_second": 17.807,
"eval_steps_per_second": 2.229,
"eval_wer": 0.8411677387431964,
"step": 66000
},
{
"epoch": 97.64,
"learning_rate": 1.863013698630137e-06,
"loss": 1.2485,
"step": 66100
},
{
"epoch": 97.78,
"learning_rate": 1.7488584474885843e-06,
"loss": 1.281,
"step": 66200
},
{
"epoch": 97.93,
"learning_rate": 1.6347031963470319e-06,
"loss": 1.2679,
"step": 66300
},
{
"epoch": 98.08,
"learning_rate": 1.5205479452054794e-06,
"loss": 1.2255,
"step": 66400
},
{
"epoch": 98.23,
"learning_rate": 1.406392694063927e-06,
"loss": 1.2457,
"step": 66500
},
{
"epoch": 98.23,
"eval_cer": 0.20618349728970087,
"eval_loss": 0.8133619427680969,
"eval_runtime": 113.8096,
"eval_samples_per_second": 17.758,
"eval_steps_per_second": 2.223,
"eval_wer": 0.8411677387431964,
"step": 66500
},
{
"epoch": 98.38,
"learning_rate": 1.2922374429223744e-06,
"loss": 1.2885,
"step": 66600
},
{
"epoch": 98.52,
"learning_rate": 1.178082191780822e-06,
"loss": 1.2787,
"step": 66700
},
{
"epoch": 98.67,
"learning_rate": 1.0639269406392693e-06,
"loss": 1.271,
"step": 66800
},
{
"epoch": 98.82,
"learning_rate": 9.497716894977168e-07,
"loss": 1.2858,
"step": 66900
},
{
"epoch": 98.97,
"learning_rate": 8.356164383561643e-07,
"loss": 1.2967,
"step": 67000
},
{
"epoch": 98.97,
"eval_cer": 0.20554105601284883,
"eval_loss": 0.8114518523216248,
"eval_runtime": 113.394,
"eval_samples_per_second": 17.823,
"eval_steps_per_second": 2.231,
"eval_wer": 0.8381989114299851,
"step": 67000
},
{
"epoch": 99.11,
"learning_rate": 7.214611872146118e-07,
"loss": 1.3312,
"step": 67100
},
{
"epoch": 99.26,
"learning_rate": 6.073059360730594e-07,
"loss": 1.2486,
"step": 67200
},
{
"epoch": 99.41,
"learning_rate": 4.931506849315068e-07,
"loss": 1.2672,
"step": 67300
},
{
"epoch": 99.56,
"learning_rate": 3.7899543378995425e-07,
"loss": 1.2776,
"step": 67400
},
{
"epoch": 99.7,
"learning_rate": 2.648401826484018e-07,
"loss": 1.2817,
"step": 67500
},
{
"epoch": 99.7,
"eval_cer": 0.20626380244930737,
"eval_loss": 0.8127681612968445,
"eval_runtime": 113.1151,
"eval_samples_per_second": 17.867,
"eval_steps_per_second": 2.237,
"eval_wer": 0.839188520534389,
"step": 67500
},
{
"epoch": 99.85,
"learning_rate": 1.5068493150684929e-07,
"loss": 1.2743,
"step": 67600
},
{
"epoch": 100.0,
"learning_rate": 3.6529680365296796e-08,
"loss": 1.2394,
"step": 67700
},
{
"epoch": 100.0,
"step": 67700,
"total_flos": 3.080356462743465e+20,
"train_loss": 3.0068138397532342,
"train_runtime": 143778.5903,
"train_samples_per_second": 15.073,
"train_steps_per_second": 0.471
}
],
"max_steps": 67700,
"num_train_epochs": 100,
"total_flos": 3.080356462743465e+20,
"trial_name": null,
"trial_params": null
}