whisper-tiny-eu-cv16_1 / trainer_state.json
zuazo's picture
End of training
ff57fe6 verified
raw
history blame
No virus
205 kB
{
"best_metric": 19.094888228857275,
"best_model_checkpoint": "./checkpoint-19000",
"epoch": 400.0,
"eval_steps": 1000,
"global_step": 40000,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.25,
"learning_rate": 1.6499999999999997e-06,
"loss": 2.4538,
"step": 25
},
{
"epoch": 0.5,
"learning_rate": 3.5249999999999997e-06,
"loss": 1.87,
"step": 50
},
{
"epoch": 0.75,
"learning_rate": 5.399999999999999e-06,
"loss": 1.3171,
"step": 75
},
{
"epoch": 1.0,
"learning_rate": 7.275e-06,
"loss": 1.016,
"step": 100
},
{
"epoch": 1.25,
"learning_rate": 9.149999999999999e-06,
"loss": 0.834,
"step": 125
},
{
"epoch": 1.5,
"learning_rate": 1.1024999999999999e-05,
"loss": 0.7356,
"step": 150
},
{
"epoch": 1.75,
"learning_rate": 1.2899999999999998e-05,
"loss": 0.6513,
"step": 175
},
{
"epoch": 2.0,
"learning_rate": 1.4775e-05,
"loss": 0.5926,
"step": 200
},
{
"epoch": 2.25,
"learning_rate": 1.6649999999999998e-05,
"loss": 0.5086,
"step": 225
},
{
"epoch": 2.5,
"learning_rate": 1.8525e-05,
"loss": 0.4757,
"step": 250
},
{
"epoch": 2.75,
"learning_rate": 2.04e-05,
"loss": 0.4501,
"step": 275
},
{
"epoch": 3.0,
"learning_rate": 2.2274999999999996e-05,
"loss": 0.4266,
"step": 300
},
{
"epoch": 3.25,
"learning_rate": 2.4149999999999997e-05,
"loss": 0.357,
"step": 325
},
{
"epoch": 3.5,
"learning_rate": 2.6024999999999996e-05,
"loss": 0.3415,
"step": 350
},
{
"epoch": 3.75,
"learning_rate": 2.7899999999999997e-05,
"loss": 0.3319,
"step": 375
},
{
"epoch": 4.0,
"learning_rate": 2.9775e-05,
"loss": 0.3189,
"step": 400
},
{
"epoch": 4.25,
"learning_rate": 3.165e-05,
"loss": 0.253,
"step": 425
},
{
"epoch": 4.5,
"learning_rate": 3.3524999999999995e-05,
"loss": 0.2526,
"step": 450
},
{
"epoch": 4.75,
"learning_rate": 3.539999999999999e-05,
"loss": 0.2463,
"step": 475
},
{
"epoch": 5.0,
"learning_rate": 3.7275e-05,
"loss": 0.2471,
"step": 500
},
{
"epoch": 5.25,
"learning_rate": 3.747911392405063e-05,
"loss": 0.184,
"step": 525
},
{
"epoch": 5.5,
"learning_rate": 3.7455379746835444e-05,
"loss": 0.1809,
"step": 550
},
{
"epoch": 5.75,
"learning_rate": 3.743164556962025e-05,
"loss": 0.1773,
"step": 575
},
{
"epoch": 6.0,
"learning_rate": 3.7407911392405063e-05,
"loss": 0.1852,
"step": 600
},
{
"epoch": 6.25,
"learning_rate": 3.738417721518987e-05,
"loss": 0.1259,
"step": 625
},
{
"epoch": 6.5,
"learning_rate": 3.736044303797468e-05,
"loss": 0.1287,
"step": 650
},
{
"epoch": 6.75,
"learning_rate": 3.733670886075949e-05,
"loss": 0.1289,
"step": 675
},
{
"epoch": 7.0,
"learning_rate": 3.73129746835443e-05,
"loss": 0.1312,
"step": 700
},
{
"epoch": 7.25,
"learning_rate": 3.7289240506329114e-05,
"loss": 0.0865,
"step": 725
},
{
"epoch": 7.5,
"learning_rate": 3.726550632911392e-05,
"loss": 0.0904,
"step": 750
},
{
"epoch": 7.75,
"learning_rate": 3.724177215189873e-05,
"loss": 0.0907,
"step": 775
},
{
"epoch": 8.0,
"learning_rate": 3.721803797468354e-05,
"loss": 0.0926,
"step": 800
},
{
"epoch": 8.25,
"learning_rate": 3.719430379746835e-05,
"loss": 0.0587,
"step": 825
},
{
"epoch": 8.5,
"learning_rate": 3.717056962025316e-05,
"loss": 0.061,
"step": 850
},
{
"epoch": 8.75,
"learning_rate": 3.714683544303797e-05,
"loss": 0.0625,
"step": 875
},
{
"epoch": 9.0,
"learning_rate": 3.7123101265822784e-05,
"loss": 0.0624,
"step": 900
},
{
"epoch": 9.25,
"learning_rate": 3.709936708860759e-05,
"loss": 0.0386,
"step": 925
},
{
"epoch": 9.5,
"learning_rate": 3.70756329113924e-05,
"loss": 0.0405,
"step": 950
},
{
"epoch": 9.75,
"learning_rate": 3.705189873417721e-05,
"loss": 0.0415,
"step": 975
},
{
"epoch": 10.0,
"learning_rate": 3.702816455696202e-05,
"loss": 0.0426,
"step": 1000
},
{
"epoch": 10.0,
"eval_loss": 0.34511512517929077,
"eval_runtime": 91.8649,
"eval_samples_per_second": 138.704,
"eval_steps_per_second": 1.089,
"eval_wer": 23.200328278880725,
"step": 1000
},
{
"epoch": 10.25,
"learning_rate": 3.700443037974683e-05,
"loss": 0.0259,
"step": 1025
},
{
"epoch": 10.5,
"learning_rate": 3.698069620253164e-05,
"loss": 0.0259,
"step": 1050
},
{
"epoch": 10.75,
"learning_rate": 3.6956962025316454e-05,
"loss": 0.0277,
"step": 1075
},
{
"epoch": 11.0,
"learning_rate": 3.693322784810126e-05,
"loss": 0.0279,
"step": 1100
},
{
"epoch": 11.25,
"learning_rate": 3.690949367088607e-05,
"loss": 0.0177,
"step": 1125
},
{
"epoch": 11.5,
"learning_rate": 3.688575949367088e-05,
"loss": 0.0184,
"step": 1150
},
{
"epoch": 11.75,
"learning_rate": 3.686202531645569e-05,
"loss": 0.018,
"step": 1175
},
{
"epoch": 12.0,
"learning_rate": 3.68382911392405e-05,
"loss": 0.019,
"step": 1200
},
{
"epoch": 12.25,
"learning_rate": 3.681455696202531e-05,
"loss": 0.0122,
"step": 1225
},
{
"epoch": 12.5,
"learning_rate": 3.6790822784810124e-05,
"loss": 0.0136,
"step": 1250
},
{
"epoch": 12.75,
"learning_rate": 3.676708860759493e-05,
"loss": 0.0136,
"step": 1275
},
{
"epoch": 13.0,
"learning_rate": 3.674335443037974e-05,
"loss": 0.014,
"step": 1300
},
{
"epoch": 13.25,
"learning_rate": 3.6719620253164556e-05,
"loss": 0.0097,
"step": 1325
},
{
"epoch": 13.5,
"learning_rate": 3.669588607594937e-05,
"loss": 0.0096,
"step": 1350
},
{
"epoch": 13.75,
"learning_rate": 3.6672151898734175e-05,
"loss": 0.0087,
"step": 1375
},
{
"epoch": 14.0,
"learning_rate": 3.664841772151899e-05,
"loss": 0.0088,
"step": 1400
},
{
"epoch": 14.25,
"learning_rate": 3.6624683544303794e-05,
"loss": 0.0064,
"step": 1425
},
{
"epoch": 14.5,
"learning_rate": 3.660094936708861e-05,
"loss": 0.0064,
"step": 1450
},
{
"epoch": 14.75,
"learning_rate": 3.657721518987341e-05,
"loss": 0.0063,
"step": 1475
},
{
"epoch": 15.0,
"learning_rate": 3.6553481012658226e-05,
"loss": 0.0063,
"step": 1500
},
{
"epoch": 15.25,
"learning_rate": 3.652974683544304e-05,
"loss": 0.0052,
"step": 1525
},
{
"epoch": 15.5,
"learning_rate": 3.6506012658227845e-05,
"loss": 0.0057,
"step": 1550
},
{
"epoch": 15.75,
"learning_rate": 3.648227848101266e-05,
"loss": 0.0059,
"step": 1575
},
{
"epoch": 16.0,
"learning_rate": 3.6458544303797464e-05,
"loss": 0.0057,
"step": 1600
},
{
"epoch": 16.25,
"learning_rate": 3.643481012658228e-05,
"loss": 0.0044,
"step": 1625
},
{
"epoch": 16.5,
"learning_rate": 3.641107594936708e-05,
"loss": 0.0044,
"step": 1650
},
{
"epoch": 16.75,
"learning_rate": 3.6387341772151896e-05,
"loss": 0.0047,
"step": 1675
},
{
"epoch": 17.0,
"learning_rate": 3.636360759493671e-05,
"loss": 0.0051,
"step": 1700
},
{
"epoch": 17.25,
"learning_rate": 3.6339873417721515e-05,
"loss": 0.0047,
"step": 1725
},
{
"epoch": 17.5,
"learning_rate": 3.631613924050633e-05,
"loss": 0.0052,
"step": 1750
},
{
"epoch": 17.75,
"learning_rate": 3.6292405063291134e-05,
"loss": 0.006,
"step": 1775
},
{
"epoch": 18.0,
"learning_rate": 3.626867088607595e-05,
"loss": 0.0079,
"step": 1800
},
{
"epoch": 18.25,
"learning_rate": 3.624493670886075e-05,
"loss": 0.0061,
"step": 1825
},
{
"epoch": 18.5,
"learning_rate": 3.6221202531645566e-05,
"loss": 0.0067,
"step": 1850
},
{
"epoch": 18.75,
"learning_rate": 3.619746835443038e-05,
"loss": 0.007,
"step": 1875
},
{
"epoch": 19.0,
"learning_rate": 3.6173734177215185e-05,
"loss": 0.0083,
"step": 1900
},
{
"epoch": 19.25,
"learning_rate": 3.615e-05,
"loss": 0.0072,
"step": 1925
},
{
"epoch": 19.5,
"learning_rate": 3.6126265822784804e-05,
"loss": 0.0079,
"step": 1950
},
{
"epoch": 19.75,
"learning_rate": 3.610253164556962e-05,
"loss": 0.0078,
"step": 1975
},
{
"epoch": 20.0,
"learning_rate": 3.607879746835442e-05,
"loss": 0.0077,
"step": 2000
},
{
"epoch": 20.0,
"eval_loss": 0.41232848167419434,
"eval_runtime": 81.6367,
"eval_samples_per_second": 156.082,
"eval_steps_per_second": 1.225,
"eval_wer": 22.605322807566047,
"step": 2000
},
{
"epoch": 20.25,
"learning_rate": 3.6055063291139236e-05,
"loss": 0.0059,
"step": 2025
},
{
"epoch": 20.5,
"learning_rate": 3.603132911392405e-05,
"loss": 0.0063,
"step": 2050
},
{
"epoch": 20.75,
"learning_rate": 3.6007594936708855e-05,
"loss": 0.0078,
"step": 2075
},
{
"epoch": 21.0,
"learning_rate": 3.598386075949367e-05,
"loss": 0.0081,
"step": 2100
},
{
"epoch": 21.25,
"learning_rate": 3.596012658227848e-05,
"loss": 0.0065,
"step": 2125
},
{
"epoch": 21.5,
"learning_rate": 3.593639240506329e-05,
"loss": 0.0078,
"step": 2150
},
{
"epoch": 21.75,
"learning_rate": 3.59126582278481e-05,
"loss": 0.008,
"step": 2175
},
{
"epoch": 22.0,
"learning_rate": 3.588892405063291e-05,
"loss": 0.0081,
"step": 2200
},
{
"epoch": 22.25,
"learning_rate": 3.586518987341772e-05,
"loss": 0.0071,
"step": 2225
},
{
"epoch": 22.5,
"learning_rate": 3.584145569620253e-05,
"loss": 0.007,
"step": 2250
},
{
"epoch": 22.75,
"learning_rate": 3.581772151898734e-05,
"loss": 0.0068,
"step": 2275
},
{
"epoch": 23.0,
"learning_rate": 3.579398734177215e-05,
"loss": 0.0073,
"step": 2300
},
{
"epoch": 23.25,
"learning_rate": 3.577025316455696e-05,
"loss": 0.0052,
"step": 2325
},
{
"epoch": 23.5,
"learning_rate": 3.574651898734177e-05,
"loss": 0.0051,
"step": 2350
},
{
"epoch": 23.75,
"learning_rate": 3.572278481012658e-05,
"loss": 0.0054,
"step": 2375
},
{
"epoch": 24.0,
"learning_rate": 3.569905063291139e-05,
"loss": 0.0053,
"step": 2400
},
{
"epoch": 24.25,
"learning_rate": 3.56753164556962e-05,
"loss": 0.0045,
"step": 2425
},
{
"epoch": 24.5,
"learning_rate": 3.565158227848101e-05,
"loss": 0.0044,
"step": 2450
},
{
"epoch": 24.75,
"learning_rate": 3.562784810126582e-05,
"loss": 0.004,
"step": 2475
},
{
"epoch": 25.0,
"learning_rate": 3.5604113924050627e-05,
"loss": 0.0044,
"step": 2500
},
{
"epoch": 25.25,
"learning_rate": 3.558037974683544e-05,
"loss": 0.0033,
"step": 2525
},
{
"epoch": 25.5,
"learning_rate": 3.555664556962025e-05,
"loss": 0.0029,
"step": 2550
},
{
"epoch": 25.75,
"learning_rate": 3.553291139240506e-05,
"loss": 0.0028,
"step": 2575
},
{
"epoch": 26.0,
"learning_rate": 3.550917721518987e-05,
"loss": 0.0033,
"step": 2600
},
{
"epoch": 26.25,
"learning_rate": 3.548544303797468e-05,
"loss": 0.0031,
"step": 2625
},
{
"epoch": 26.5,
"learning_rate": 3.546170886075949e-05,
"loss": 0.0028,
"step": 2650
},
{
"epoch": 26.75,
"learning_rate": 3.5437974683544297e-05,
"loss": 0.0028,
"step": 2675
},
{
"epoch": 27.0,
"learning_rate": 3.541424050632911e-05,
"loss": 0.0027,
"step": 2700
},
{
"epoch": 27.25,
"learning_rate": 3.539050632911392e-05,
"loss": 0.0025,
"step": 2725
},
{
"epoch": 27.5,
"learning_rate": 3.536677215189873e-05,
"loss": 0.0028,
"step": 2750
},
{
"epoch": 27.75,
"learning_rate": 3.534303797468354e-05,
"loss": 0.0025,
"step": 2775
},
{
"epoch": 28.0,
"learning_rate": 3.531930379746835e-05,
"loss": 0.0024,
"step": 2800
},
{
"epoch": 28.25,
"learning_rate": 3.529556962025316e-05,
"loss": 0.002,
"step": 2825
},
{
"epoch": 28.5,
"learning_rate": 3.527183544303797e-05,
"loss": 0.0021,
"step": 2850
},
{
"epoch": 28.75,
"learning_rate": 3.524810126582278e-05,
"loss": 0.0019,
"step": 2875
},
{
"epoch": 29.0,
"learning_rate": 3.522436708860759e-05,
"loss": 0.002,
"step": 2900
},
{
"epoch": 29.25,
"learning_rate": 3.5200632911392405e-05,
"loss": 0.0015,
"step": 2925
},
{
"epoch": 29.5,
"learning_rate": 3.517689873417721e-05,
"loss": 0.0014,
"step": 2950
},
{
"epoch": 29.75,
"learning_rate": 3.5153164556962024e-05,
"loss": 0.0015,
"step": 2975
},
{
"epoch": 30.0,
"learning_rate": 3.512943037974684e-05,
"loss": 0.0013,
"step": 3000
},
{
"epoch": 30.0,
"eval_loss": 0.4287857711315155,
"eval_runtime": 80.2692,
"eval_samples_per_second": 158.741,
"eval_steps_per_second": 1.246,
"eval_wer": 21.19645927778646,
"step": 3000
},
{
"epoch": 30.25,
"learning_rate": 3.510569620253164e-05,
"loss": 0.001,
"step": 3025
},
{
"epoch": 30.5,
"learning_rate": 3.5081962025316456e-05,
"loss": 0.0009,
"step": 3050
},
{
"epoch": 30.75,
"learning_rate": 3.505822784810126e-05,
"loss": 0.0009,
"step": 3075
},
{
"epoch": 31.0,
"learning_rate": 3.5034493670886075e-05,
"loss": 0.0009,
"step": 3100
},
{
"epoch": 31.25,
"learning_rate": 3.501075949367088e-05,
"loss": 0.0008,
"step": 3125
},
{
"epoch": 31.5,
"learning_rate": 3.4987025316455694e-05,
"loss": 0.0008,
"step": 3150
},
{
"epoch": 31.75,
"learning_rate": 3.496329113924051e-05,
"loss": 0.0008,
"step": 3175
},
{
"epoch": 32.0,
"learning_rate": 3.493955696202531e-05,
"loss": 0.0008,
"step": 3200
},
{
"epoch": 32.25,
"learning_rate": 3.4915822784810126e-05,
"loss": 0.0007,
"step": 3225
},
{
"epoch": 32.5,
"learning_rate": 3.489208860759493e-05,
"loss": 0.0007,
"step": 3250
},
{
"epoch": 32.75,
"learning_rate": 3.4868354430379745e-05,
"loss": 0.0007,
"step": 3275
},
{
"epoch": 33.0,
"learning_rate": 3.484462025316455e-05,
"loss": 0.0007,
"step": 3300
},
{
"epoch": 33.25,
"learning_rate": 3.4820886075949364e-05,
"loss": 0.0006,
"step": 3325
},
{
"epoch": 33.5,
"learning_rate": 3.479715189873418e-05,
"loss": 0.0006,
"step": 3350
},
{
"epoch": 33.75,
"learning_rate": 3.477341772151898e-05,
"loss": 0.0006,
"step": 3375
},
{
"epoch": 34.0,
"learning_rate": 3.4749683544303796e-05,
"loss": 0.0006,
"step": 3400
},
{
"epoch": 34.25,
"learning_rate": 3.47259493670886e-05,
"loss": 0.0006,
"step": 3425
},
{
"epoch": 34.5,
"learning_rate": 3.4702215189873415e-05,
"loss": 0.0006,
"step": 3450
},
{
"epoch": 34.75,
"learning_rate": 3.467848101265822e-05,
"loss": 0.0006,
"step": 3475
},
{
"epoch": 35.0,
"learning_rate": 3.4654746835443034e-05,
"loss": 0.0006,
"step": 3500
},
{
"epoch": 35.25,
"learning_rate": 3.463101265822785e-05,
"loss": 0.0005,
"step": 3525
},
{
"epoch": 35.5,
"learning_rate": 3.460727848101265e-05,
"loss": 0.0005,
"step": 3550
},
{
"epoch": 35.75,
"learning_rate": 3.4583544303797466e-05,
"loss": 0.0005,
"step": 3575
},
{
"epoch": 36.0,
"learning_rate": 3.455981012658227e-05,
"loss": 0.0005,
"step": 3600
},
{
"epoch": 36.25,
"learning_rate": 3.4536075949367085e-05,
"loss": 0.0005,
"step": 3625
},
{
"epoch": 36.5,
"learning_rate": 3.451234177215189e-05,
"loss": 0.0005,
"step": 3650
},
{
"epoch": 36.75,
"learning_rate": 3.4488607594936704e-05,
"loss": 0.0005,
"step": 3675
},
{
"epoch": 37.0,
"learning_rate": 3.446487341772152e-05,
"loss": 0.0005,
"step": 3700
},
{
"epoch": 37.25,
"learning_rate": 3.444113924050632e-05,
"loss": 0.0005,
"step": 3725
},
{
"epoch": 37.5,
"learning_rate": 3.4417405063291136e-05,
"loss": 0.0005,
"step": 3750
},
{
"epoch": 37.75,
"learning_rate": 3.439367088607595e-05,
"loss": 0.0005,
"step": 3775
},
{
"epoch": 38.0,
"learning_rate": 3.436993670886076e-05,
"loss": 0.0005,
"step": 3800
},
{
"epoch": 38.25,
"learning_rate": 3.434620253164557e-05,
"loss": 0.0004,
"step": 3825
},
{
"epoch": 38.5,
"learning_rate": 3.432246835443038e-05,
"loss": 0.0004,
"step": 3850
},
{
"epoch": 38.75,
"learning_rate": 3.429873417721519e-05,
"loss": 0.0004,
"step": 3875
},
{
"epoch": 39.0,
"learning_rate": 3.4275e-05,
"loss": 0.0004,
"step": 3900
},
{
"epoch": 39.25,
"learning_rate": 3.4251265822784806e-05,
"loss": 0.0004,
"step": 3925
},
{
"epoch": 39.5,
"learning_rate": 3.422753164556962e-05,
"loss": 0.0004,
"step": 3950
},
{
"epoch": 39.75,
"learning_rate": 3.420379746835443e-05,
"loss": 0.0004,
"step": 3975
},
{
"epoch": 40.0,
"learning_rate": 3.418006329113924e-05,
"loss": 0.0004,
"step": 4000
},
{
"epoch": 40.0,
"eval_loss": 0.45376476645469666,
"eval_runtime": 81.5739,
"eval_samples_per_second": 156.202,
"eval_steps_per_second": 1.226,
"eval_wer": 21.192551195873065,
"step": 4000
},
{
"epoch": 40.25,
"learning_rate": 3.415632911392405e-05,
"loss": 0.0004,
"step": 4025
},
{
"epoch": 40.5,
"learning_rate": 3.413259493670886e-05,
"loss": 0.0004,
"step": 4050
},
{
"epoch": 40.75,
"learning_rate": 3.410886075949367e-05,
"loss": 0.0004,
"step": 4075
},
{
"epoch": 41.0,
"learning_rate": 3.4085126582278476e-05,
"loss": 0.0004,
"step": 4100
},
{
"epoch": 41.25,
"learning_rate": 3.406139240506329e-05,
"loss": 0.0004,
"step": 4125
},
{
"epoch": 41.5,
"learning_rate": 3.40376582278481e-05,
"loss": 0.0004,
"step": 4150
},
{
"epoch": 41.75,
"learning_rate": 3.401392405063291e-05,
"loss": 0.0004,
"step": 4175
},
{
"epoch": 42.0,
"learning_rate": 3.399018987341772e-05,
"loss": 0.0004,
"step": 4200
},
{
"epoch": 42.25,
"learning_rate": 3.396645569620253e-05,
"loss": 0.0003,
"step": 4225
},
{
"epoch": 42.5,
"learning_rate": 3.394272151898734e-05,
"loss": 0.0003,
"step": 4250
},
{
"epoch": 42.75,
"learning_rate": 3.3918987341772146e-05,
"loss": 0.0004,
"step": 4275
},
{
"epoch": 43.0,
"learning_rate": 3.389525316455696e-05,
"loss": 0.0004,
"step": 4300
},
{
"epoch": 43.25,
"learning_rate": 3.387151898734177e-05,
"loss": 0.0003,
"step": 4325
},
{
"epoch": 43.5,
"learning_rate": 3.384778481012658e-05,
"loss": 0.0003,
"step": 4350
},
{
"epoch": 43.75,
"learning_rate": 3.382405063291139e-05,
"loss": 0.0003,
"step": 4375
},
{
"epoch": 44.0,
"learning_rate": 3.3800316455696197e-05,
"loss": 0.0003,
"step": 4400
},
{
"epoch": 44.25,
"learning_rate": 3.377658227848101e-05,
"loss": 0.0003,
"step": 4425
},
{
"epoch": 44.5,
"learning_rate": 3.3752848101265816e-05,
"loss": 0.0003,
"step": 4450
},
{
"epoch": 44.75,
"learning_rate": 3.372911392405063e-05,
"loss": 0.0003,
"step": 4475
},
{
"epoch": 45.0,
"learning_rate": 3.370537974683544e-05,
"loss": 0.0003,
"step": 4500
},
{
"epoch": 45.25,
"learning_rate": 3.368164556962025e-05,
"loss": 0.0003,
"step": 4525
},
{
"epoch": 45.5,
"learning_rate": 3.365791139240506e-05,
"loss": 0.0003,
"step": 4550
},
{
"epoch": 45.75,
"learning_rate": 3.363417721518987e-05,
"loss": 0.0003,
"step": 4575
},
{
"epoch": 46.0,
"learning_rate": 3.361044303797468e-05,
"loss": 0.0003,
"step": 4600
},
{
"epoch": 46.25,
"learning_rate": 3.358670886075949e-05,
"loss": 0.0003,
"step": 4625
},
{
"epoch": 46.5,
"learning_rate": 3.3562974683544305e-05,
"loss": 0.0003,
"step": 4650
},
{
"epoch": 46.75,
"learning_rate": 3.353924050632911e-05,
"loss": 0.0003,
"step": 4675
},
{
"epoch": 47.0,
"learning_rate": 3.3515506329113924e-05,
"loss": 0.0003,
"step": 4700
},
{
"epoch": 47.25,
"learning_rate": 3.349177215189873e-05,
"loss": 0.0003,
"step": 4725
},
{
"epoch": 47.5,
"learning_rate": 3.346803797468354e-05,
"loss": 0.0003,
"step": 4750
},
{
"epoch": 47.75,
"learning_rate": 3.344430379746835e-05,
"loss": 0.0003,
"step": 4775
},
{
"epoch": 48.0,
"learning_rate": 3.342056962025316e-05,
"loss": 0.0003,
"step": 4800
},
{
"epoch": 48.25,
"learning_rate": 3.3396835443037975e-05,
"loss": 0.0002,
"step": 4825
},
{
"epoch": 48.5,
"learning_rate": 3.337310126582278e-05,
"loss": 0.0002,
"step": 4850
},
{
"epoch": 48.75,
"learning_rate": 3.3349367088607594e-05,
"loss": 0.0002,
"step": 4875
},
{
"epoch": 49.0,
"learning_rate": 3.33256329113924e-05,
"loss": 0.0003,
"step": 4900
},
{
"epoch": 49.25,
"learning_rate": 3.330189873417721e-05,
"loss": 0.0002,
"step": 4925
},
{
"epoch": 49.5,
"learning_rate": 3.327816455696202e-05,
"loss": 0.0002,
"step": 4950
},
{
"epoch": 49.75,
"learning_rate": 3.325443037974683e-05,
"loss": 0.0002,
"step": 4975
},
{
"epoch": 50.0,
"learning_rate": 3.3230696202531645e-05,
"loss": 0.0003,
"step": 5000
},
{
"epoch": 50.0,
"eval_loss": 0.475699245929718,
"eval_runtime": 80.4553,
"eval_samples_per_second": 158.374,
"eval_steps_per_second": 1.243,
"eval_wer": 21.180826950132875,
"step": 5000
},
{
"epoch": 50.25,
"learning_rate": 3.320696202531645e-05,
"loss": 0.0002,
"step": 5025
},
{
"epoch": 50.5,
"learning_rate": 3.3183227848101264e-05,
"loss": 0.0002,
"step": 5050
},
{
"epoch": 50.75,
"learning_rate": 3.315949367088607e-05,
"loss": 0.0002,
"step": 5075
},
{
"epoch": 51.0,
"learning_rate": 3.313575949367088e-05,
"loss": 0.0002,
"step": 5100
},
{
"epoch": 51.25,
"learning_rate": 3.311202531645569e-05,
"loss": 0.0002,
"step": 5125
},
{
"epoch": 51.5,
"learning_rate": 3.30882911392405e-05,
"loss": 0.0002,
"step": 5150
},
{
"epoch": 51.75,
"learning_rate": 3.3064556962025315e-05,
"loss": 0.0002,
"step": 5175
},
{
"epoch": 52.0,
"learning_rate": 3.304082278481012e-05,
"loss": 0.0002,
"step": 5200
},
{
"epoch": 52.25,
"learning_rate": 3.3017088607594934e-05,
"loss": 0.0002,
"step": 5225
},
{
"epoch": 52.5,
"learning_rate": 3.299335443037974e-05,
"loss": 0.0002,
"step": 5250
},
{
"epoch": 52.75,
"learning_rate": 3.296962025316455e-05,
"loss": 0.0002,
"step": 5275
},
{
"epoch": 53.0,
"learning_rate": 3.2945886075949366e-05,
"loss": 0.0002,
"step": 5300
},
{
"epoch": 53.25,
"learning_rate": 3.292215189873417e-05,
"loss": 0.0002,
"step": 5325
},
{
"epoch": 53.5,
"learning_rate": 3.2898417721518985e-05,
"loss": 0.0002,
"step": 5350
},
{
"epoch": 53.75,
"learning_rate": 3.287468354430379e-05,
"loss": 0.0002,
"step": 5375
},
{
"epoch": 54.0,
"learning_rate": 3.2850949367088604e-05,
"loss": 0.0002,
"step": 5400
},
{
"epoch": 54.25,
"learning_rate": 3.282721518987342e-05,
"loss": 0.0002,
"step": 5425
},
{
"epoch": 54.5,
"learning_rate": 3.280348101265823e-05,
"loss": 0.0002,
"step": 5450
},
{
"epoch": 54.75,
"learning_rate": 3.2779746835443036e-05,
"loss": 0.0002,
"step": 5475
},
{
"epoch": 55.0,
"learning_rate": 3.275601265822785e-05,
"loss": 0.0002,
"step": 5500
},
{
"epoch": 55.25,
"learning_rate": 3.2732278481012655e-05,
"loss": 0.0002,
"step": 5525
},
{
"epoch": 55.5,
"learning_rate": 3.270854430379747e-05,
"loss": 0.0002,
"step": 5550
},
{
"epoch": 55.75,
"learning_rate": 3.2684810126582274e-05,
"loss": 0.0002,
"step": 5575
},
{
"epoch": 56.0,
"learning_rate": 3.266107594936709e-05,
"loss": 0.0002,
"step": 5600
},
{
"epoch": 56.25,
"learning_rate": 3.26373417721519e-05,
"loss": 0.0002,
"step": 5625
},
{
"epoch": 56.5,
"learning_rate": 3.2613607594936706e-05,
"loss": 0.0002,
"step": 5650
},
{
"epoch": 56.75,
"learning_rate": 3.258987341772152e-05,
"loss": 0.0002,
"step": 5675
},
{
"epoch": 57.0,
"learning_rate": 3.2566139240506325e-05,
"loss": 0.0002,
"step": 5700
},
{
"epoch": 57.25,
"learning_rate": 3.254240506329114e-05,
"loss": 0.0002,
"step": 5725
},
{
"epoch": 57.5,
"learning_rate": 3.2518670886075944e-05,
"loss": 0.0002,
"step": 5750
},
{
"epoch": 57.75,
"learning_rate": 3.249493670886076e-05,
"loss": 0.0002,
"step": 5775
},
{
"epoch": 58.0,
"learning_rate": 3.247120253164557e-05,
"loss": 0.0054,
"step": 5800
},
{
"epoch": 58.25,
"learning_rate": 3.2447468354430376e-05,
"loss": 0.0387,
"step": 5825
},
{
"epoch": 58.5,
"learning_rate": 3.242373417721519e-05,
"loss": 0.0443,
"step": 5850
},
{
"epoch": 58.75,
"learning_rate": 3.2399999999999995e-05,
"loss": 0.0406,
"step": 5875
},
{
"epoch": 59.0,
"learning_rate": 3.237626582278481e-05,
"loss": 0.0352,
"step": 5900
},
{
"epoch": 59.25,
"learning_rate": 3.2352531645569614e-05,
"loss": 0.0224,
"step": 5925
},
{
"epoch": 59.5,
"learning_rate": 3.232879746835443e-05,
"loss": 0.0213,
"step": 5950
},
{
"epoch": 59.75,
"learning_rate": 3.230506329113924e-05,
"loss": 0.0218,
"step": 5975
},
{
"epoch": 60.0,
"learning_rate": 3.2281329113924046e-05,
"loss": 0.0206,
"step": 6000
},
{
"epoch": 60.0,
"eval_loss": 0.41719070076942444,
"eval_runtime": 86.1367,
"eval_samples_per_second": 147.928,
"eval_steps_per_second": 1.161,
"eval_wer": 22.275089885884007,
"step": 6000
},
{
"epoch": 60.25,
"learning_rate": 3.225759493670886e-05,
"loss": 0.0123,
"step": 6025
},
{
"epoch": 60.5,
"learning_rate": 3.2233860759493665e-05,
"loss": 0.0125,
"step": 6050
},
{
"epoch": 60.75,
"learning_rate": 3.221012658227848e-05,
"loss": 0.0126,
"step": 6075
},
{
"epoch": 61.0,
"learning_rate": 3.2186392405063284e-05,
"loss": 0.0126,
"step": 6100
},
{
"epoch": 61.25,
"learning_rate": 3.2162658227848097e-05,
"loss": 0.0078,
"step": 6125
},
{
"epoch": 61.5,
"learning_rate": 3.213892405063291e-05,
"loss": 0.0072,
"step": 6150
},
{
"epoch": 61.75,
"learning_rate": 3.2115189873417716e-05,
"loss": 0.0068,
"step": 6175
},
{
"epoch": 62.0,
"learning_rate": 3.209145569620253e-05,
"loss": 0.0073,
"step": 6200
},
{
"epoch": 62.25,
"learning_rate": 3.206772151898734e-05,
"loss": 0.0041,
"step": 6225
},
{
"epoch": 62.5,
"learning_rate": 3.2043987341772154e-05,
"loss": 0.004,
"step": 6250
},
{
"epoch": 62.75,
"learning_rate": 3.202025316455696e-05,
"loss": 0.0039,
"step": 6275
},
{
"epoch": 63.0,
"learning_rate": 3.199651898734177e-05,
"loss": 0.0036,
"step": 6300
},
{
"epoch": 63.25,
"learning_rate": 3.197278481012658e-05,
"loss": 0.0022,
"step": 6325
},
{
"epoch": 63.5,
"learning_rate": 3.194905063291139e-05,
"loss": 0.0016,
"step": 6350
},
{
"epoch": 63.75,
"learning_rate": 3.19253164556962e-05,
"loss": 0.0019,
"step": 6375
},
{
"epoch": 64.0,
"learning_rate": 3.190158227848101e-05,
"loss": 0.0017,
"step": 6400
},
{
"epoch": 64.25,
"learning_rate": 3.1877848101265824e-05,
"loss": 0.001,
"step": 6425
},
{
"epoch": 64.5,
"learning_rate": 3.185411392405063e-05,
"loss": 0.0015,
"step": 6450
},
{
"epoch": 64.75,
"learning_rate": 3.183037974683544e-05,
"loss": 0.001,
"step": 6475
},
{
"epoch": 65.0,
"learning_rate": 3.180664556962025e-05,
"loss": 0.0013,
"step": 6500
},
{
"epoch": 65.25,
"learning_rate": 3.178291139240506e-05,
"loss": 0.0008,
"step": 6525
},
{
"epoch": 65.5,
"learning_rate": 3.175917721518987e-05,
"loss": 0.0008,
"step": 6550
},
{
"epoch": 65.75,
"learning_rate": 3.173544303797468e-05,
"loss": 0.001,
"step": 6575
},
{
"epoch": 66.0,
"learning_rate": 3.1711708860759494e-05,
"loss": 0.0008,
"step": 6600
},
{
"epoch": 66.25,
"learning_rate": 3.16879746835443e-05,
"loss": 0.0005,
"step": 6625
},
{
"epoch": 66.5,
"learning_rate": 3.166424050632911e-05,
"loss": 0.0007,
"step": 6650
},
{
"epoch": 66.75,
"learning_rate": 3.164050632911392e-05,
"loss": 0.0007,
"step": 6675
},
{
"epoch": 67.0,
"learning_rate": 3.161677215189873e-05,
"loss": 0.0006,
"step": 6700
},
{
"epoch": 67.25,
"learning_rate": 3.159303797468354e-05,
"loss": 0.0004,
"step": 6725
},
{
"epoch": 67.5,
"learning_rate": 3.156930379746835e-05,
"loss": 0.0004,
"step": 6750
},
{
"epoch": 67.75,
"learning_rate": 3.1545569620253164e-05,
"loss": 0.0004,
"step": 6775
},
{
"epoch": 68.0,
"learning_rate": 3.152183544303797e-05,
"loss": 0.0004,
"step": 6800
},
{
"epoch": 68.25,
"learning_rate": 3.149810126582278e-05,
"loss": 0.0003,
"step": 6825
},
{
"epoch": 68.5,
"learning_rate": 3.147436708860759e-05,
"loss": 0.0003,
"step": 6850
},
{
"epoch": 68.75,
"learning_rate": 3.14506329113924e-05,
"loss": 0.0003,
"step": 6875
},
{
"epoch": 69.0,
"learning_rate": 3.142689873417721e-05,
"loss": 0.0003,
"step": 6900
},
{
"epoch": 69.25,
"learning_rate": 3.140316455696202e-05,
"loss": 0.0003,
"step": 6925
},
{
"epoch": 69.5,
"learning_rate": 3.1379430379746834e-05,
"loss": 0.0003,
"step": 6950
},
{
"epoch": 69.75,
"learning_rate": 3.135569620253164e-05,
"loss": 0.0003,
"step": 6975
},
{
"epoch": 70.0,
"learning_rate": 3.133196202531645e-05,
"loss": 0.0003,
"step": 7000
},
{
"epoch": 70.0,
"eval_loss": 0.43740585446357727,
"eval_runtime": 80.2604,
"eval_samples_per_second": 158.758,
"eval_steps_per_second": 1.246,
"eval_wer": 19.513052993590748,
"step": 7000
},
{
"epoch": 70.25,
"learning_rate": 3.130822784810126e-05,
"loss": 0.0003,
"step": 7025
},
{
"epoch": 70.5,
"learning_rate": 3.128449367088607e-05,
"loss": 0.0003,
"step": 7050
},
{
"epoch": 70.75,
"learning_rate": 3.1260759493670885e-05,
"loss": 0.0003,
"step": 7075
},
{
"epoch": 71.0,
"learning_rate": 3.12370253164557e-05,
"loss": 0.0003,
"step": 7100
},
{
"epoch": 71.25,
"learning_rate": 3.1213291139240504e-05,
"loss": 0.0002,
"step": 7125
},
{
"epoch": 71.5,
"learning_rate": 3.118955696202532e-05,
"loss": 0.0002,
"step": 7150
},
{
"epoch": 71.75,
"learning_rate": 3.116582278481012e-05,
"loss": 0.0003,
"step": 7175
},
{
"epoch": 72.0,
"learning_rate": 3.1142088607594936e-05,
"loss": 0.0002,
"step": 7200
},
{
"epoch": 72.25,
"learning_rate": 3.111835443037974e-05,
"loss": 0.0002,
"step": 7225
},
{
"epoch": 72.5,
"learning_rate": 3.1094620253164555e-05,
"loss": 0.0002,
"step": 7250
},
{
"epoch": 72.75,
"learning_rate": 3.107088607594937e-05,
"loss": 0.0002,
"step": 7275
},
{
"epoch": 73.0,
"learning_rate": 3.1047151898734174e-05,
"loss": 0.0002,
"step": 7300
},
{
"epoch": 73.25,
"learning_rate": 3.102341772151899e-05,
"loss": 0.0002,
"step": 7325
},
{
"epoch": 73.5,
"learning_rate": 3.099968354430379e-05,
"loss": 0.0002,
"step": 7350
},
{
"epoch": 73.75,
"learning_rate": 3.0975949367088606e-05,
"loss": 0.0002,
"step": 7375
},
{
"epoch": 74.0,
"learning_rate": 3.095221518987341e-05,
"loss": 0.0002,
"step": 7400
},
{
"epoch": 74.25,
"learning_rate": 3.0928481012658225e-05,
"loss": 0.0002,
"step": 7425
},
{
"epoch": 74.5,
"learning_rate": 3.090474683544304e-05,
"loss": 0.0002,
"step": 7450
},
{
"epoch": 74.75,
"learning_rate": 3.0881012658227844e-05,
"loss": 0.0002,
"step": 7475
},
{
"epoch": 75.0,
"learning_rate": 3.085727848101266e-05,
"loss": 0.0002,
"step": 7500
},
{
"epoch": 75.25,
"learning_rate": 3.083354430379746e-05,
"loss": 0.0002,
"step": 7525
},
{
"epoch": 75.5,
"learning_rate": 3.0809810126582276e-05,
"loss": 0.0002,
"step": 7550
},
{
"epoch": 75.75,
"learning_rate": 3.078607594936709e-05,
"loss": 0.0002,
"step": 7575
},
{
"epoch": 76.0,
"learning_rate": 3.0762341772151895e-05,
"loss": 0.0002,
"step": 7600
},
{
"epoch": 76.25,
"learning_rate": 3.073860759493671e-05,
"loss": 0.0002,
"step": 7625
},
{
"epoch": 76.5,
"learning_rate": 3.0714873417721514e-05,
"loss": 0.0002,
"step": 7650
},
{
"epoch": 76.75,
"learning_rate": 3.069113924050633e-05,
"loss": 0.0002,
"step": 7675
},
{
"epoch": 77.0,
"learning_rate": 3.066740506329113e-05,
"loss": 0.0002,
"step": 7700
},
{
"epoch": 77.25,
"learning_rate": 3.0643670886075946e-05,
"loss": 0.0002,
"step": 7725
},
{
"epoch": 77.5,
"learning_rate": 3.061993670886076e-05,
"loss": 0.0002,
"step": 7750
},
{
"epoch": 77.75,
"learning_rate": 3.0596202531645565e-05,
"loss": 0.0002,
"step": 7775
},
{
"epoch": 78.0,
"learning_rate": 3.057246835443038e-05,
"loss": 0.0002,
"step": 7800
},
{
"epoch": 78.25,
"learning_rate": 3.0548734177215184e-05,
"loss": 0.0002,
"step": 7825
},
{
"epoch": 78.5,
"learning_rate": 3.0524999999999997e-05,
"loss": 0.0002,
"step": 7850
},
{
"epoch": 78.75,
"learning_rate": 3.050126582278481e-05,
"loss": 0.0002,
"step": 7875
},
{
"epoch": 79.0,
"learning_rate": 3.047753164556962e-05,
"loss": 0.0002,
"step": 7900
},
{
"epoch": 79.25,
"learning_rate": 3.045379746835443e-05,
"loss": 0.0001,
"step": 7925
},
{
"epoch": 79.5,
"learning_rate": 3.0430063291139238e-05,
"loss": 0.0001,
"step": 7950
},
{
"epoch": 79.75,
"learning_rate": 3.040632911392405e-05,
"loss": 0.0001,
"step": 7975
},
{
"epoch": 80.0,
"learning_rate": 3.038259493670886e-05,
"loss": 0.0002,
"step": 8000
},
{
"epoch": 80.0,
"eval_loss": 0.4546888768672943,
"eval_runtime": 80.4032,
"eval_samples_per_second": 158.476,
"eval_steps_per_second": 1.244,
"eval_wer": 19.50914491167735,
"step": 8000
},
{
"epoch": 80.25,
"learning_rate": 3.035886075949367e-05,
"loss": 0.0001,
"step": 8025
},
{
"epoch": 80.5,
"learning_rate": 3.033512658227848e-05,
"loss": 0.0001,
"step": 8050
},
{
"epoch": 80.75,
"learning_rate": 3.031139240506329e-05,
"loss": 0.0001,
"step": 8075
},
{
"epoch": 81.0,
"learning_rate": 3.02876582278481e-05,
"loss": 0.0001,
"step": 8100
},
{
"epoch": 81.25,
"learning_rate": 3.0263924050632908e-05,
"loss": 0.0001,
"step": 8125
},
{
"epoch": 81.5,
"learning_rate": 3.024018987341772e-05,
"loss": 0.0001,
"step": 8150
},
{
"epoch": 81.75,
"learning_rate": 3.021645569620253e-05,
"loss": 0.0001,
"step": 8175
},
{
"epoch": 82.0,
"learning_rate": 3.019272151898734e-05,
"loss": 0.0001,
"step": 8200
},
{
"epoch": 82.25,
"learning_rate": 3.016898734177215e-05,
"loss": 0.0001,
"step": 8225
},
{
"epoch": 82.5,
"learning_rate": 3.014525316455696e-05,
"loss": 0.0001,
"step": 8250
},
{
"epoch": 82.75,
"learning_rate": 3.012151898734177e-05,
"loss": 0.0001,
"step": 8275
},
{
"epoch": 83.0,
"learning_rate": 3.0097784810126578e-05,
"loss": 0.0001,
"step": 8300
},
{
"epoch": 83.25,
"learning_rate": 3.007405063291139e-05,
"loss": 0.0001,
"step": 8325
},
{
"epoch": 83.5,
"learning_rate": 3.00503164556962e-05,
"loss": 0.0001,
"step": 8350
},
{
"epoch": 83.75,
"learning_rate": 3.002658227848101e-05,
"loss": 0.0001,
"step": 8375
},
{
"epoch": 84.0,
"learning_rate": 3.000284810126582e-05,
"loss": 0.0001,
"step": 8400
},
{
"epoch": 84.25,
"learning_rate": 2.997911392405063e-05,
"loss": 0.0001,
"step": 8425
},
{
"epoch": 84.5,
"learning_rate": 2.9955379746835438e-05,
"loss": 0.0001,
"step": 8450
},
{
"epoch": 84.75,
"learning_rate": 2.993164556962025e-05,
"loss": 0.0001,
"step": 8475
},
{
"epoch": 85.0,
"learning_rate": 2.990791139240506e-05,
"loss": 0.0001,
"step": 8500
},
{
"epoch": 85.25,
"learning_rate": 2.988417721518987e-05,
"loss": 0.0001,
"step": 8525
},
{
"epoch": 85.5,
"learning_rate": 2.986044303797468e-05,
"loss": 0.0001,
"step": 8550
},
{
"epoch": 85.75,
"learning_rate": 2.983670886075949e-05,
"loss": 0.0001,
"step": 8575
},
{
"epoch": 86.0,
"learning_rate": 2.98129746835443e-05,
"loss": 0.0001,
"step": 8600
},
{
"epoch": 86.25,
"learning_rate": 2.9789240506329108e-05,
"loss": 0.0001,
"step": 8625
},
{
"epoch": 86.5,
"learning_rate": 2.976550632911392e-05,
"loss": 0.0001,
"step": 8650
},
{
"epoch": 86.75,
"learning_rate": 2.974177215189873e-05,
"loss": 0.0001,
"step": 8675
},
{
"epoch": 87.0,
"learning_rate": 2.9718037974683544e-05,
"loss": 0.0001,
"step": 8700
},
{
"epoch": 87.25,
"learning_rate": 2.9694303797468353e-05,
"loss": 0.0001,
"step": 8725
},
{
"epoch": 87.5,
"learning_rate": 2.9670569620253163e-05,
"loss": 0.0001,
"step": 8750
},
{
"epoch": 87.75,
"learning_rate": 2.9646835443037972e-05,
"loss": 0.0001,
"step": 8775
},
{
"epoch": 88.0,
"learning_rate": 2.9623101265822785e-05,
"loss": 0.0001,
"step": 8800
},
{
"epoch": 88.25,
"learning_rate": 2.9599367088607594e-05,
"loss": 0.0001,
"step": 8825
},
{
"epoch": 88.5,
"learning_rate": 2.9575632911392404e-05,
"loss": 0.0001,
"step": 8850
},
{
"epoch": 88.75,
"learning_rate": 2.9551898734177213e-05,
"loss": 0.0001,
"step": 8875
},
{
"epoch": 89.0,
"learning_rate": 2.9528164556962023e-05,
"loss": 0.0001,
"step": 8900
},
{
"epoch": 89.25,
"learning_rate": 2.9504430379746832e-05,
"loss": 0.0001,
"step": 8925
},
{
"epoch": 89.5,
"learning_rate": 2.9480696202531645e-05,
"loss": 0.0001,
"step": 8950
},
{
"epoch": 89.75,
"learning_rate": 2.9456962025316455e-05,
"loss": 0.0001,
"step": 8975
},
{
"epoch": 90.0,
"learning_rate": 2.9433227848101264e-05,
"loss": 0.0001,
"step": 9000
},
{
"epoch": 90.0,
"eval_loss": 0.4697396755218506,
"eval_runtime": 80.422,
"eval_samples_per_second": 158.439,
"eval_steps_per_second": 1.243,
"eval_wer": 19.5062138502423,
"step": 9000
},
{
"epoch": 90.25,
"learning_rate": 2.9409493670886074e-05,
"loss": 0.0001,
"step": 9025
},
{
"epoch": 90.5,
"learning_rate": 2.9385759493670883e-05,
"loss": 0.0001,
"step": 9050
},
{
"epoch": 90.75,
"learning_rate": 2.9362025316455693e-05,
"loss": 0.0001,
"step": 9075
},
{
"epoch": 91.0,
"learning_rate": 2.9338291139240502e-05,
"loss": 0.0001,
"step": 9100
},
{
"epoch": 91.25,
"learning_rate": 2.9314556962025315e-05,
"loss": 0.0001,
"step": 9125
},
{
"epoch": 91.5,
"learning_rate": 2.9290822784810125e-05,
"loss": 0.0001,
"step": 9150
},
{
"epoch": 91.75,
"learning_rate": 2.9267088607594934e-05,
"loss": 0.0001,
"step": 9175
},
{
"epoch": 92.0,
"learning_rate": 2.9243354430379744e-05,
"loss": 0.0001,
"step": 9200
},
{
"epoch": 92.25,
"learning_rate": 2.9219620253164553e-05,
"loss": 0.0001,
"step": 9225
},
{
"epoch": 92.5,
"learning_rate": 2.9195886075949363e-05,
"loss": 0.0001,
"step": 9250
},
{
"epoch": 92.75,
"learning_rate": 2.9172151898734172e-05,
"loss": 0.0001,
"step": 9275
},
{
"epoch": 93.0,
"learning_rate": 2.9148417721518985e-05,
"loss": 0.0001,
"step": 9300
},
{
"epoch": 93.25,
"learning_rate": 2.9124683544303795e-05,
"loss": 0.0001,
"step": 9325
},
{
"epoch": 93.5,
"learning_rate": 2.9100949367088604e-05,
"loss": 0.0001,
"step": 9350
},
{
"epoch": 93.75,
"learning_rate": 2.9077215189873414e-05,
"loss": 0.0001,
"step": 9375
},
{
"epoch": 94.0,
"learning_rate": 2.9053481012658223e-05,
"loss": 0.0001,
"step": 9400
},
{
"epoch": 94.25,
"learning_rate": 2.9029746835443033e-05,
"loss": 0.0001,
"step": 9425
},
{
"epoch": 94.5,
"learning_rate": 2.9006012658227842e-05,
"loss": 0.0001,
"step": 9450
},
{
"epoch": 94.75,
"learning_rate": 2.8982278481012655e-05,
"loss": 0.0001,
"step": 9475
},
{
"epoch": 95.0,
"learning_rate": 2.8958544303797465e-05,
"loss": 0.0001,
"step": 9500
},
{
"epoch": 95.25,
"learning_rate": 2.8934810126582278e-05,
"loss": 0.0001,
"step": 9525
},
{
"epoch": 95.5,
"learning_rate": 2.8911075949367087e-05,
"loss": 0.0001,
"step": 9550
},
{
"epoch": 95.75,
"learning_rate": 2.8887341772151897e-05,
"loss": 0.0001,
"step": 9575
},
{
"epoch": 96.0,
"learning_rate": 2.886360759493671e-05,
"loss": 0.0001,
"step": 9600
},
{
"epoch": 96.25,
"learning_rate": 2.883987341772152e-05,
"loss": 0.0001,
"step": 9625
},
{
"epoch": 96.5,
"learning_rate": 2.881613924050633e-05,
"loss": 0.0001,
"step": 9650
},
{
"epoch": 96.75,
"learning_rate": 2.8792405063291138e-05,
"loss": 0.0001,
"step": 9675
},
{
"epoch": 97.0,
"learning_rate": 2.8768670886075948e-05,
"loss": 0.0001,
"step": 9700
},
{
"epoch": 97.25,
"learning_rate": 2.8744936708860757e-05,
"loss": 0.0001,
"step": 9725
},
{
"epoch": 97.5,
"learning_rate": 2.8721202531645567e-05,
"loss": 0.0001,
"step": 9750
},
{
"epoch": 97.75,
"learning_rate": 2.869746835443038e-05,
"loss": 0.0001,
"step": 9775
},
{
"epoch": 98.0,
"learning_rate": 2.867373417721519e-05,
"loss": 0.0001,
"step": 9800
},
{
"epoch": 98.25,
"learning_rate": 2.865e-05,
"loss": 0.0001,
"step": 9825
},
{
"epoch": 98.5,
"learning_rate": 2.8626265822784808e-05,
"loss": 0.0001,
"step": 9850
},
{
"epoch": 98.75,
"learning_rate": 2.8602531645569617e-05,
"loss": 0.0001,
"step": 9875
},
{
"epoch": 99.0,
"learning_rate": 2.8578797468354427e-05,
"loss": 0.0001,
"step": 9900
},
{
"epoch": 99.25,
"learning_rate": 2.8555063291139236e-05,
"loss": 0.0001,
"step": 9925
},
{
"epoch": 99.5,
"learning_rate": 2.853132911392405e-05,
"loss": 0.0001,
"step": 9950
},
{
"epoch": 99.75,
"learning_rate": 2.850759493670886e-05,
"loss": 0.0001,
"step": 9975
},
{
"epoch": 100.0,
"learning_rate": 2.848386075949367e-05,
"loss": 0.0001,
"step": 10000
},
{
"epoch": 100.0,
"eval_loss": 0.48529908061027527,
"eval_runtime": 80.5352,
"eval_samples_per_second": 158.217,
"eval_steps_per_second": 1.242,
"eval_wer": 19.51989213693919,
"step": 10000
},
{
"epoch": 100.25,
"learning_rate": 2.8460126582278478e-05,
"loss": 0.0001,
"step": 10025
},
{
"epoch": 100.5,
"learning_rate": 2.8436392405063287e-05,
"loss": 0.0001,
"step": 10050
},
{
"epoch": 100.75,
"learning_rate": 2.8412658227848097e-05,
"loss": 0.0001,
"step": 10075
},
{
"epoch": 101.0,
"learning_rate": 2.8388924050632906e-05,
"loss": 0.0001,
"step": 10100
},
{
"epoch": 101.25,
"learning_rate": 2.836518987341772e-05,
"loss": 0.0001,
"step": 10125
},
{
"epoch": 101.5,
"learning_rate": 2.834145569620253e-05,
"loss": 0.0001,
"step": 10150
},
{
"epoch": 101.75,
"learning_rate": 2.831772151898734e-05,
"loss": 0.0001,
"step": 10175
},
{
"epoch": 102.0,
"learning_rate": 2.8293987341772148e-05,
"loss": 0.0001,
"step": 10200
},
{
"epoch": 102.25,
"learning_rate": 2.8270253164556957e-05,
"loss": 0.0001,
"step": 10225
},
{
"epoch": 102.5,
"learning_rate": 2.8246518987341767e-05,
"loss": 0.0001,
"step": 10250
},
{
"epoch": 102.75,
"learning_rate": 2.8222784810126576e-05,
"loss": 0.0001,
"step": 10275
},
{
"epoch": 103.0,
"learning_rate": 2.819905063291139e-05,
"loss": 0.0001,
"step": 10300
},
{
"epoch": 103.25,
"learning_rate": 2.81753164556962e-05,
"loss": 0.0001,
"step": 10325
},
{
"epoch": 103.5,
"learning_rate": 2.815158227848101e-05,
"loss": 0.0001,
"step": 10350
},
{
"epoch": 103.75,
"learning_rate": 2.812784810126582e-05,
"loss": 0.0001,
"step": 10375
},
{
"epoch": 104.0,
"learning_rate": 2.810411392405063e-05,
"loss": 0.0,
"step": 10400
},
{
"epoch": 104.25,
"learning_rate": 2.8080379746835444e-05,
"loss": 0.0,
"step": 10425
},
{
"epoch": 104.5,
"learning_rate": 2.8056645569620253e-05,
"loss": 0.0,
"step": 10450
},
{
"epoch": 104.75,
"learning_rate": 2.8032911392405063e-05,
"loss": 0.0,
"step": 10475
},
{
"epoch": 105.0,
"learning_rate": 2.8009177215189872e-05,
"loss": 0.0001,
"step": 10500
},
{
"epoch": 105.25,
"learning_rate": 2.798544303797468e-05,
"loss": 0.0,
"step": 10525
},
{
"epoch": 105.5,
"learning_rate": 2.796170886075949e-05,
"loss": 0.0,
"step": 10550
},
{
"epoch": 105.75,
"learning_rate": 2.79379746835443e-05,
"loss": 0.0001,
"step": 10575
},
{
"epoch": 106.0,
"learning_rate": 2.7914240506329113e-05,
"loss": 0.0001,
"step": 10600
},
{
"epoch": 106.25,
"learning_rate": 2.7890506329113923e-05,
"loss": 0.0,
"step": 10625
},
{
"epoch": 106.5,
"learning_rate": 2.7866772151898732e-05,
"loss": 0.0,
"step": 10650
},
{
"epoch": 106.75,
"learning_rate": 2.7843037974683542e-05,
"loss": 0.0001,
"step": 10675
},
{
"epoch": 107.0,
"learning_rate": 2.781930379746835e-05,
"loss": 0.0,
"step": 10700
},
{
"epoch": 107.25,
"learning_rate": 2.779556962025316e-05,
"loss": 0.0,
"step": 10725
},
{
"epoch": 107.5,
"learning_rate": 2.777183544303797e-05,
"loss": 0.0,
"step": 10750
},
{
"epoch": 107.75,
"learning_rate": 2.7748101265822783e-05,
"loss": 0.0001,
"step": 10775
},
{
"epoch": 108.0,
"learning_rate": 2.7724367088607593e-05,
"loss": 0.0001,
"step": 10800
},
{
"epoch": 108.25,
"learning_rate": 2.7700632911392402e-05,
"loss": 0.0001,
"step": 10825
},
{
"epoch": 108.5,
"learning_rate": 2.7676898734177212e-05,
"loss": 0.0,
"step": 10850
},
{
"epoch": 108.75,
"learning_rate": 2.765316455696202e-05,
"loss": 0.0001,
"step": 10875
},
{
"epoch": 109.0,
"learning_rate": 2.762943037974683e-05,
"loss": 0.0,
"step": 10900
},
{
"epoch": 109.25,
"learning_rate": 2.7605696202531644e-05,
"loss": 0.0,
"step": 10925
},
{
"epoch": 109.5,
"learning_rate": 2.7581962025316453e-05,
"loss": 0.0,
"step": 10950
},
{
"epoch": 109.75,
"learning_rate": 2.7558227848101263e-05,
"loss": 0.0,
"step": 10975
},
{
"epoch": 110.0,
"learning_rate": 2.7534493670886072e-05,
"loss": 0.0001,
"step": 11000
},
{
"epoch": 110.0,
"eval_loss": 0.5008699297904968,
"eval_runtime": 80.5626,
"eval_samples_per_second": 158.163,
"eval_steps_per_second": 1.241,
"eval_wer": 19.568743160856652,
"step": 11000
},
{
"epoch": 110.25,
"learning_rate": 2.7510759493670882e-05,
"loss": 0.0,
"step": 11025
},
{
"epoch": 110.5,
"learning_rate": 2.748702531645569e-05,
"loss": 0.0,
"step": 11050
},
{
"epoch": 110.75,
"learning_rate": 2.74632911392405e-05,
"loss": 0.0,
"step": 11075
},
{
"epoch": 111.0,
"learning_rate": 2.7439556962025314e-05,
"loss": 0.0,
"step": 11100
},
{
"epoch": 111.25,
"learning_rate": 2.7415822784810123e-05,
"loss": 0.0,
"step": 11125
},
{
"epoch": 111.5,
"learning_rate": 2.7392088607594933e-05,
"loss": 0.0,
"step": 11150
},
{
"epoch": 111.75,
"learning_rate": 2.7368354430379746e-05,
"loss": 0.0,
"step": 11175
},
{
"epoch": 112.0,
"learning_rate": 2.7344620253164555e-05,
"loss": 0.0,
"step": 11200
},
{
"epoch": 112.25,
"learning_rate": 2.7320886075949368e-05,
"loss": 0.0,
"step": 11225
},
{
"epoch": 112.5,
"learning_rate": 2.7297151898734178e-05,
"loss": 0.0,
"step": 11250
},
{
"epoch": 112.75,
"learning_rate": 2.7273417721518987e-05,
"loss": 0.0,
"step": 11275
},
{
"epoch": 113.0,
"learning_rate": 2.7249683544303797e-05,
"loss": 0.0,
"step": 11300
},
{
"epoch": 113.25,
"learning_rate": 2.7225949367088606e-05,
"loss": 0.0,
"step": 11325
},
{
"epoch": 113.5,
"learning_rate": 2.7202215189873416e-05,
"loss": 0.0,
"step": 11350
},
{
"epoch": 113.75,
"learning_rate": 2.7178481012658225e-05,
"loss": 0.0,
"step": 11375
},
{
"epoch": 114.0,
"learning_rate": 2.7154746835443038e-05,
"loss": 0.0,
"step": 11400
},
{
"epoch": 114.25,
"learning_rate": 2.7131012658227848e-05,
"loss": 0.0,
"step": 11425
},
{
"epoch": 114.5,
"learning_rate": 2.7107278481012657e-05,
"loss": 0.0,
"step": 11450
},
{
"epoch": 114.75,
"learning_rate": 2.7083544303797467e-05,
"loss": 0.0,
"step": 11475
},
{
"epoch": 115.0,
"learning_rate": 2.7059810126582276e-05,
"loss": 0.0001,
"step": 11500
},
{
"epoch": 115.25,
"learning_rate": 2.7036075949367086e-05,
"loss": 0.0,
"step": 11525
},
{
"epoch": 115.5,
"learning_rate": 2.7012341772151895e-05,
"loss": 0.0001,
"step": 11550
},
{
"epoch": 115.75,
"learning_rate": 2.6988607594936708e-05,
"loss": 0.0,
"step": 11575
},
{
"epoch": 116.0,
"learning_rate": 2.6964873417721517e-05,
"loss": 0.0,
"step": 11600
},
{
"epoch": 116.25,
"learning_rate": 2.6941139240506327e-05,
"loss": 0.0,
"step": 11625
},
{
"epoch": 116.5,
"learning_rate": 2.6917405063291136e-05,
"loss": 0.0,
"step": 11650
},
{
"epoch": 116.75,
"learning_rate": 2.6893670886075946e-05,
"loss": 0.0,
"step": 11675
},
{
"epoch": 117.0,
"learning_rate": 2.6869936708860755e-05,
"loss": 0.0,
"step": 11700
},
{
"epoch": 117.25,
"learning_rate": 2.6846202531645565e-05,
"loss": 0.0,
"step": 11725
},
{
"epoch": 117.5,
"learning_rate": 2.6822468354430378e-05,
"loss": 0.0,
"step": 11750
},
{
"epoch": 117.75,
"learning_rate": 2.6798734177215187e-05,
"loss": 0.0,
"step": 11775
},
{
"epoch": 118.0,
"learning_rate": 2.6774999999999997e-05,
"loss": 0.0,
"step": 11800
},
{
"epoch": 118.25,
"learning_rate": 2.6751265822784806e-05,
"loss": 0.0,
"step": 11825
},
{
"epoch": 118.5,
"learning_rate": 2.6727531645569616e-05,
"loss": 0.0,
"step": 11850
},
{
"epoch": 118.75,
"learning_rate": 2.6703797468354425e-05,
"loss": 0.0,
"step": 11875
},
{
"epoch": 119.0,
"learning_rate": 2.6680063291139235e-05,
"loss": 0.0,
"step": 11900
},
{
"epoch": 119.25,
"learning_rate": 2.6656329113924048e-05,
"loss": 0.0,
"step": 11925
},
{
"epoch": 119.5,
"learning_rate": 2.6632594936708857e-05,
"loss": 0.0,
"step": 11950
},
{
"epoch": 119.75,
"learning_rate": 2.660886075949367e-05,
"loss": 0.0,
"step": 11975
},
{
"epoch": 120.0,
"learning_rate": 2.658512658227848e-05,
"loss": 0.0,
"step": 12000
},
{
"epoch": 120.0,
"eval_loss": 0.5174862146377563,
"eval_runtime": 80.4061,
"eval_samples_per_second": 158.471,
"eval_steps_per_second": 1.244,
"eval_wer": 19.65862904486478,
"step": 12000
},
{
"epoch": 120.25,
"learning_rate": 2.656139240506329e-05,
"loss": 0.0,
"step": 12025
},
{
"epoch": 120.5,
"learning_rate": 2.6537658227848102e-05,
"loss": 0.0,
"step": 12050
},
{
"epoch": 120.75,
"learning_rate": 2.651392405063291e-05,
"loss": 0.0,
"step": 12075
},
{
"epoch": 121.0,
"learning_rate": 2.649018987341772e-05,
"loss": 0.0,
"step": 12100
},
{
"epoch": 121.25,
"learning_rate": 2.646645569620253e-05,
"loss": 0.0,
"step": 12125
},
{
"epoch": 121.5,
"learning_rate": 2.644272151898734e-05,
"loss": 0.0,
"step": 12150
},
{
"epoch": 121.75,
"learning_rate": 2.641898734177215e-05,
"loss": 0.0,
"step": 12175
},
{
"epoch": 122.0,
"learning_rate": 2.639525316455696e-05,
"loss": 0.0,
"step": 12200
},
{
"epoch": 122.25,
"learning_rate": 2.6371518987341772e-05,
"loss": 0.0,
"step": 12225
},
{
"epoch": 122.5,
"learning_rate": 2.634778481012658e-05,
"loss": 0.0,
"step": 12250
},
{
"epoch": 122.75,
"learning_rate": 2.632405063291139e-05,
"loss": 0.0,
"step": 12275
},
{
"epoch": 123.0,
"learning_rate": 2.63003164556962e-05,
"loss": 0.0,
"step": 12300
},
{
"epoch": 123.25,
"learning_rate": 2.627658227848101e-05,
"loss": 0.0,
"step": 12325
},
{
"epoch": 123.5,
"learning_rate": 2.625284810126582e-05,
"loss": 0.0,
"step": 12350
},
{
"epoch": 123.75,
"learning_rate": 2.622911392405063e-05,
"loss": 0.0,
"step": 12375
},
{
"epoch": 124.0,
"learning_rate": 2.6205379746835442e-05,
"loss": 0.0,
"step": 12400
},
{
"epoch": 124.25,
"learning_rate": 2.618164556962025e-05,
"loss": 0.0,
"step": 12425
},
{
"epoch": 124.5,
"learning_rate": 2.615791139240506e-05,
"loss": 0.0,
"step": 12450
},
{
"epoch": 124.75,
"learning_rate": 2.613417721518987e-05,
"loss": 0.0,
"step": 12475
},
{
"epoch": 125.0,
"learning_rate": 2.611044303797468e-05,
"loss": 0.0,
"step": 12500
},
{
"epoch": 125.25,
"learning_rate": 2.608670886075949e-05,
"loss": 0.0,
"step": 12525
},
{
"epoch": 125.5,
"learning_rate": 2.60629746835443e-05,
"loss": 0.0,
"step": 12550
},
{
"epoch": 125.75,
"learning_rate": 2.6039240506329112e-05,
"loss": 0.0,
"step": 12575
},
{
"epoch": 126.0,
"learning_rate": 2.601550632911392e-05,
"loss": 0.0,
"step": 12600
},
{
"epoch": 126.25,
"learning_rate": 2.599177215189873e-05,
"loss": 0.0,
"step": 12625
},
{
"epoch": 126.5,
"learning_rate": 2.596803797468354e-05,
"loss": 0.0,
"step": 12650
},
{
"epoch": 126.75,
"learning_rate": 2.594430379746835e-05,
"loss": 0.0,
"step": 12675
},
{
"epoch": 127.0,
"learning_rate": 2.592056962025316e-05,
"loss": 0.0,
"step": 12700
},
{
"epoch": 127.25,
"learning_rate": 2.5896835443037972e-05,
"loss": 0.0,
"step": 12725
},
{
"epoch": 127.5,
"learning_rate": 2.5873101265822782e-05,
"loss": 0.0,
"step": 12750
},
{
"epoch": 127.75,
"learning_rate": 2.584936708860759e-05,
"loss": 0.0,
"step": 12775
},
{
"epoch": 128.0,
"learning_rate": 2.5825632911392404e-05,
"loss": 0.0,
"step": 12800
},
{
"epoch": 128.25,
"learning_rate": 2.5801898734177214e-05,
"loss": 0.0,
"step": 12825
},
{
"epoch": 128.5,
"learning_rate": 2.5778164556962023e-05,
"loss": 0.0,
"step": 12850
},
{
"epoch": 128.75,
"learning_rate": 2.5754430379746836e-05,
"loss": 0.0,
"step": 12875
},
{
"epoch": 129.0,
"learning_rate": 2.5730696202531646e-05,
"loss": 0.0,
"step": 12900
},
{
"epoch": 129.25,
"learning_rate": 2.5706962025316455e-05,
"loss": 0.0,
"step": 12925
},
{
"epoch": 129.5,
"learning_rate": 2.5683227848101265e-05,
"loss": 0.0,
"step": 12950
},
{
"epoch": 129.75,
"learning_rate": 2.5659493670886074e-05,
"loss": 0.0,
"step": 12975
},
{
"epoch": 130.0,
"learning_rate": 2.5635759493670884e-05,
"loss": 0.0,
"step": 13000
},
{
"epoch": 130.0,
"eval_loss": 0.5348048806190491,
"eval_runtime": 80.5003,
"eval_samples_per_second": 158.285,
"eval_steps_per_second": 1.242,
"eval_wer": 19.77294044083164,
"step": 13000
},
{
"epoch": 130.25,
"learning_rate": 2.5612025316455693e-05,
"loss": 0.0,
"step": 13025
},
{
"epoch": 130.5,
"learning_rate": 2.5588291139240506e-05,
"loss": 0.0,
"step": 13050
},
{
"epoch": 130.75,
"learning_rate": 2.5564556962025316e-05,
"loss": 0.0,
"step": 13075
},
{
"epoch": 131.0,
"learning_rate": 2.5540822784810125e-05,
"loss": 0.0,
"step": 13100
},
{
"epoch": 131.25,
"learning_rate": 2.5517088607594935e-05,
"loss": 0.0,
"step": 13125
},
{
"epoch": 131.5,
"learning_rate": 2.5493354430379744e-05,
"loss": 0.0,
"step": 13150
},
{
"epoch": 131.75,
"learning_rate": 2.5469620253164554e-05,
"loss": 0.0,
"step": 13175
},
{
"epoch": 132.0,
"learning_rate": 2.5445886075949367e-05,
"loss": 0.0,
"step": 13200
},
{
"epoch": 132.25,
"learning_rate": 2.5422151898734176e-05,
"loss": 0.0,
"step": 13225
},
{
"epoch": 132.5,
"learning_rate": 2.5398417721518986e-05,
"loss": 0.0,
"step": 13250
},
{
"epoch": 132.75,
"learning_rate": 2.5374683544303795e-05,
"loss": 0.0,
"step": 13275
},
{
"epoch": 133.0,
"learning_rate": 2.5350949367088605e-05,
"loss": 0.0,
"step": 13300
},
{
"epoch": 133.25,
"learning_rate": 2.5327215189873414e-05,
"loss": 0.0,
"step": 13325
},
{
"epoch": 133.5,
"learning_rate": 2.5303481012658224e-05,
"loss": 0.0,
"step": 13350
},
{
"epoch": 133.75,
"learning_rate": 2.5279746835443036e-05,
"loss": 0.0,
"step": 13375
},
{
"epoch": 134.0,
"learning_rate": 2.5256012658227846e-05,
"loss": 0.0,
"step": 13400
},
{
"epoch": 134.25,
"learning_rate": 2.5232278481012656e-05,
"loss": 0.0,
"step": 13425
},
{
"epoch": 134.5,
"learning_rate": 2.5208544303797465e-05,
"loss": 0.0,
"step": 13450
},
{
"epoch": 134.75,
"learning_rate": 2.5184810126582275e-05,
"loss": 0.0,
"step": 13475
},
{
"epoch": 135.0,
"learning_rate": 2.5161075949367084e-05,
"loss": 0.0,
"step": 13500
},
{
"epoch": 135.25,
"learning_rate": 2.5137341772151894e-05,
"loss": 0.0,
"step": 13525
},
{
"epoch": 135.5,
"learning_rate": 2.5113607594936706e-05,
"loss": 0.0,
"step": 13550
},
{
"epoch": 135.75,
"learning_rate": 2.5089873417721516e-05,
"loss": 0.0,
"step": 13575
},
{
"epoch": 136.0,
"learning_rate": 2.5066139240506325e-05,
"loss": 0.0,
"step": 13600
},
{
"epoch": 136.25,
"learning_rate": 2.504240506329114e-05,
"loss": 0.0,
"step": 13625
},
{
"epoch": 136.5,
"learning_rate": 2.5018670886075948e-05,
"loss": 0.0,
"step": 13650
},
{
"epoch": 136.75,
"learning_rate": 2.499493670886076e-05,
"loss": 0.0,
"step": 13675
},
{
"epoch": 137.0,
"learning_rate": 2.497120253164557e-05,
"loss": 0.0,
"step": 13700
},
{
"epoch": 137.25,
"learning_rate": 2.494746835443038e-05,
"loss": 0.0,
"step": 13725
},
{
"epoch": 137.5,
"learning_rate": 2.492373417721519e-05,
"loss": 0.0,
"step": 13750
},
{
"epoch": 137.75,
"learning_rate": 2.49e-05,
"loss": 0.0,
"step": 13775
},
{
"epoch": 138.0,
"learning_rate": 2.4876265822784808e-05,
"loss": 0.0,
"step": 13800
},
{
"epoch": 138.25,
"learning_rate": 2.4852531645569618e-05,
"loss": 0.0,
"step": 13825
},
{
"epoch": 138.5,
"learning_rate": 2.482879746835443e-05,
"loss": 0.0,
"step": 13850
},
{
"epoch": 138.75,
"learning_rate": 2.480506329113924e-05,
"loss": 0.0,
"step": 13875
},
{
"epoch": 139.0,
"learning_rate": 2.478132911392405e-05,
"loss": 0.0,
"step": 13900
},
{
"epoch": 139.25,
"learning_rate": 2.475759493670886e-05,
"loss": 0.0,
"step": 13925
},
{
"epoch": 139.5,
"learning_rate": 2.473386075949367e-05,
"loss": 0.0,
"step": 13950
},
{
"epoch": 139.75,
"learning_rate": 2.4710126582278478e-05,
"loss": 0.0,
"step": 13975
},
{
"epoch": 140.0,
"learning_rate": 2.4686392405063288e-05,
"loss": 0.0,
"step": 14000
},
{
"epoch": 140.0,
"eval_loss": 0.553089439868927,
"eval_runtime": 80.4755,
"eval_samples_per_second": 158.334,
"eval_steps_per_second": 1.243,
"eval_wer": 19.784664686571833,
"step": 14000
},
{
"epoch": 140.25,
"learning_rate": 2.46626582278481e-05,
"loss": 0.0,
"step": 14025
},
{
"epoch": 140.5,
"learning_rate": 2.463892405063291e-05,
"loss": 0.0,
"step": 14050
},
{
"epoch": 140.75,
"learning_rate": 2.461518987341772e-05,
"loss": 0.0,
"step": 14075
},
{
"epoch": 141.0,
"learning_rate": 2.459145569620253e-05,
"loss": 0.0,
"step": 14100
},
{
"epoch": 141.25,
"learning_rate": 2.456772151898734e-05,
"loss": 0.0,
"step": 14125
},
{
"epoch": 141.5,
"learning_rate": 2.4543987341772148e-05,
"loss": 0.0,
"step": 14150
},
{
"epoch": 141.75,
"learning_rate": 2.4520253164556958e-05,
"loss": 0.0,
"step": 14175
},
{
"epoch": 142.0,
"learning_rate": 2.449651898734177e-05,
"loss": 0.0,
"step": 14200
},
{
"epoch": 142.25,
"learning_rate": 2.447278481012658e-05,
"loss": 0.0,
"step": 14225
},
{
"epoch": 142.5,
"learning_rate": 2.444905063291139e-05,
"loss": 0.0,
"step": 14250
},
{
"epoch": 142.75,
"learning_rate": 2.44253164556962e-05,
"loss": 0.0,
"step": 14275
},
{
"epoch": 143.0,
"learning_rate": 2.440158227848101e-05,
"loss": 0.0,
"step": 14300
},
{
"epoch": 143.25,
"learning_rate": 2.4377848101265818e-05,
"loss": 0.0,
"step": 14325
},
{
"epoch": 143.5,
"learning_rate": 2.4354113924050628e-05,
"loss": 0.0,
"step": 14350
},
{
"epoch": 143.75,
"learning_rate": 2.4333227848101262e-05,
"loss": 0.0107,
"step": 14375
},
{
"epoch": 144.0,
"learning_rate": 2.4309493670886075e-05,
"loss": 0.0398,
"step": 14400
},
{
"epoch": 144.25,
"learning_rate": 2.4285759493670885e-05,
"loss": 0.0325,
"step": 14425
},
{
"epoch": 144.5,
"learning_rate": 2.4262025316455694e-05,
"loss": 0.024,
"step": 14450
},
{
"epoch": 144.75,
"learning_rate": 2.4238291139240504e-05,
"loss": 0.0209,
"step": 14475
},
{
"epoch": 145.0,
"learning_rate": 2.4214556962025313e-05,
"loss": 0.0178,
"step": 14500
},
{
"epoch": 145.25,
"learning_rate": 2.4190822784810123e-05,
"loss": 0.0087,
"step": 14525
},
{
"epoch": 145.5,
"learning_rate": 2.4167088607594932e-05,
"loss": 0.0102,
"step": 14550
},
{
"epoch": 145.75,
"learning_rate": 2.4143354430379745e-05,
"loss": 0.0085,
"step": 14575
},
{
"epoch": 146.0,
"learning_rate": 2.4119620253164555e-05,
"loss": 0.007,
"step": 14600
},
{
"epoch": 146.25,
"learning_rate": 2.4095886075949364e-05,
"loss": 0.0046,
"step": 14625
},
{
"epoch": 146.5,
"learning_rate": 2.4072151898734174e-05,
"loss": 0.005,
"step": 14650
},
{
"epoch": 146.75,
"learning_rate": 2.4048417721518983e-05,
"loss": 0.0035,
"step": 14675
},
{
"epoch": 147.0,
"learning_rate": 2.4024683544303793e-05,
"loss": 0.0035,
"step": 14700
},
{
"epoch": 147.25,
"learning_rate": 2.4000949367088602e-05,
"loss": 0.0021,
"step": 14725
},
{
"epoch": 147.5,
"learning_rate": 2.3977215189873415e-05,
"loss": 0.002,
"step": 14750
},
{
"epoch": 147.75,
"learning_rate": 2.3953481012658225e-05,
"loss": 0.0016,
"step": 14775
},
{
"epoch": 148.0,
"learning_rate": 2.3929746835443034e-05,
"loss": 0.0015,
"step": 14800
},
{
"epoch": 148.25,
"learning_rate": 2.3906012658227847e-05,
"loss": 0.0006,
"step": 14825
},
{
"epoch": 148.5,
"learning_rate": 2.3882278481012657e-05,
"loss": 0.0005,
"step": 14850
},
{
"epoch": 148.75,
"learning_rate": 2.385854430379747e-05,
"loss": 0.0004,
"step": 14875
},
{
"epoch": 149.0,
"learning_rate": 2.383481012658228e-05,
"loss": 0.0006,
"step": 14900
},
{
"epoch": 149.25,
"learning_rate": 2.381107594936709e-05,
"loss": 0.0003,
"step": 14925
},
{
"epoch": 149.5,
"learning_rate": 2.3787341772151898e-05,
"loss": 0.0003,
"step": 14950
},
{
"epoch": 149.75,
"learning_rate": 2.3763607594936707e-05,
"loss": 0.0003,
"step": 14975
},
{
"epoch": 150.0,
"learning_rate": 2.3739873417721517e-05,
"loss": 0.0002,
"step": 15000
},
{
"epoch": 150.0,
"eval_loss": 0.4625629484653473,
"eval_runtime": 81.6484,
"eval_samples_per_second": 156.059,
"eval_steps_per_second": 1.225,
"eval_wer": 19.472995153978427,
"step": 15000
},
{
"epoch": 150.25,
"learning_rate": 2.3716139240506327e-05,
"loss": 0.0002,
"step": 15025
},
{
"epoch": 150.5,
"learning_rate": 2.369240506329114e-05,
"loss": 0.0002,
"step": 15050
},
{
"epoch": 150.75,
"learning_rate": 2.366867088607595e-05,
"loss": 0.0002,
"step": 15075
},
{
"epoch": 151.0,
"learning_rate": 2.364493670886076e-05,
"loss": 0.0002,
"step": 15100
},
{
"epoch": 151.25,
"learning_rate": 2.3621202531645568e-05,
"loss": 0.0001,
"step": 15125
},
{
"epoch": 151.5,
"learning_rate": 2.3597468354430377e-05,
"loss": 0.0001,
"step": 15150
},
{
"epoch": 151.75,
"learning_rate": 2.3573734177215187e-05,
"loss": 0.0001,
"step": 15175
},
{
"epoch": 152.0,
"learning_rate": 2.3549999999999996e-05,
"loss": 0.0002,
"step": 15200
},
{
"epoch": 152.25,
"learning_rate": 2.352626582278481e-05,
"loss": 0.0001,
"step": 15225
},
{
"epoch": 152.5,
"learning_rate": 2.350253164556962e-05,
"loss": 0.0001,
"step": 15250
},
{
"epoch": 152.75,
"learning_rate": 2.347879746835443e-05,
"loss": 0.0001,
"step": 15275
},
{
"epoch": 153.0,
"learning_rate": 2.3455063291139238e-05,
"loss": 0.0001,
"step": 15300
},
{
"epoch": 153.25,
"learning_rate": 2.3431329113924047e-05,
"loss": 0.0001,
"step": 15325
},
{
"epoch": 153.5,
"learning_rate": 2.3407594936708857e-05,
"loss": 0.0001,
"step": 15350
},
{
"epoch": 153.75,
"learning_rate": 2.3383860759493666e-05,
"loss": 0.0001,
"step": 15375
},
{
"epoch": 154.0,
"learning_rate": 2.336012658227848e-05,
"loss": 0.0001,
"step": 15400
},
{
"epoch": 154.25,
"learning_rate": 2.333639240506329e-05,
"loss": 0.0001,
"step": 15425
},
{
"epoch": 154.5,
"learning_rate": 2.3312658227848098e-05,
"loss": 0.0001,
"step": 15450
},
{
"epoch": 154.75,
"learning_rate": 2.3288924050632908e-05,
"loss": 0.0001,
"step": 15475
},
{
"epoch": 155.0,
"learning_rate": 2.3265189873417717e-05,
"loss": 0.0001,
"step": 15500
},
{
"epoch": 155.25,
"learning_rate": 2.3241455696202527e-05,
"loss": 0.0001,
"step": 15525
},
{
"epoch": 155.5,
"learning_rate": 2.321772151898734e-05,
"loss": 0.0001,
"step": 15550
},
{
"epoch": 155.75,
"learning_rate": 2.319398734177215e-05,
"loss": 0.0001,
"step": 15575
},
{
"epoch": 156.0,
"learning_rate": 2.317025316455696e-05,
"loss": 0.0001,
"step": 15600
},
{
"epoch": 156.25,
"learning_rate": 2.3146518987341768e-05,
"loss": 0.0001,
"step": 15625
},
{
"epoch": 156.5,
"learning_rate": 2.312278481012658e-05,
"loss": 0.0001,
"step": 15650
},
{
"epoch": 156.75,
"learning_rate": 2.309905063291139e-05,
"loss": 0.0001,
"step": 15675
},
{
"epoch": 157.0,
"learning_rate": 2.3075316455696204e-05,
"loss": 0.0001,
"step": 15700
},
{
"epoch": 157.25,
"learning_rate": 2.3051582278481013e-05,
"loss": 0.0001,
"step": 15725
},
{
"epoch": 157.5,
"learning_rate": 2.3027848101265823e-05,
"loss": 0.0001,
"step": 15750
},
{
"epoch": 157.75,
"learning_rate": 2.3004113924050632e-05,
"loss": 0.0001,
"step": 15775
},
{
"epoch": 158.0,
"learning_rate": 2.298037974683544e-05,
"loss": 0.0001,
"step": 15800
},
{
"epoch": 158.25,
"learning_rate": 2.295664556962025e-05,
"loss": 0.0001,
"step": 15825
},
{
"epoch": 158.5,
"learning_rate": 2.293291139240506e-05,
"loss": 0.0001,
"step": 15850
},
{
"epoch": 158.75,
"learning_rate": 2.2909177215189873e-05,
"loss": 0.0001,
"step": 15875
},
{
"epoch": 159.0,
"learning_rate": 2.2885443037974683e-05,
"loss": 0.0001,
"step": 15900
},
{
"epoch": 159.25,
"learning_rate": 2.2861708860759492e-05,
"loss": 0.0001,
"step": 15925
},
{
"epoch": 159.5,
"learning_rate": 2.2837974683544302e-05,
"loss": 0.0001,
"step": 15950
},
{
"epoch": 159.75,
"learning_rate": 2.281424050632911e-05,
"loss": 0.0001,
"step": 15975
},
{
"epoch": 160.0,
"learning_rate": 2.279050632911392e-05,
"loss": 0.0001,
"step": 16000
},
{
"epoch": 160.0,
"eval_loss": 0.4813273549079895,
"eval_runtime": 80.403,
"eval_samples_per_second": 158.477,
"eval_steps_per_second": 1.244,
"eval_wer": 19.21994685008598,
"step": 16000
},
{
"epoch": 160.25,
"learning_rate": 2.2766772151898734e-05,
"loss": 0.0001,
"step": 16025
},
{
"epoch": 160.5,
"learning_rate": 2.2743037974683543e-05,
"loss": 0.0001,
"step": 16050
},
{
"epoch": 160.75,
"learning_rate": 2.2719303797468353e-05,
"loss": 0.0001,
"step": 16075
},
{
"epoch": 161.0,
"learning_rate": 2.2695569620253162e-05,
"loss": 0.0001,
"step": 16100
},
{
"epoch": 161.25,
"learning_rate": 2.2671835443037972e-05,
"loss": 0.0001,
"step": 16125
},
{
"epoch": 161.5,
"learning_rate": 2.264810126582278e-05,
"loss": 0.0001,
"step": 16150
},
{
"epoch": 161.75,
"learning_rate": 2.262436708860759e-05,
"loss": 0.0001,
"step": 16175
},
{
"epoch": 162.0,
"learning_rate": 2.2600632911392404e-05,
"loss": 0.0001,
"step": 16200
},
{
"epoch": 162.25,
"learning_rate": 2.2576898734177213e-05,
"loss": 0.0001,
"step": 16225
},
{
"epoch": 162.5,
"learning_rate": 2.2553164556962023e-05,
"loss": 0.0001,
"step": 16250
},
{
"epoch": 162.75,
"learning_rate": 2.2529430379746832e-05,
"loss": 0.0001,
"step": 16275
},
{
"epoch": 163.0,
"learning_rate": 2.2505696202531642e-05,
"loss": 0.0001,
"step": 16300
},
{
"epoch": 163.25,
"learning_rate": 2.248196202531645e-05,
"loss": 0.0001,
"step": 16325
},
{
"epoch": 163.5,
"learning_rate": 2.245822784810126e-05,
"loss": 0.0001,
"step": 16350
},
{
"epoch": 163.75,
"learning_rate": 2.2434493670886074e-05,
"loss": 0.0001,
"step": 16375
},
{
"epoch": 164.0,
"learning_rate": 2.2410759493670883e-05,
"loss": 0.0001,
"step": 16400
},
{
"epoch": 164.25,
"learning_rate": 2.2387025316455693e-05,
"loss": 0.0001,
"step": 16425
},
{
"epoch": 164.5,
"learning_rate": 2.2363291139240502e-05,
"loss": 0.0001,
"step": 16450
},
{
"epoch": 164.75,
"learning_rate": 2.2339556962025315e-05,
"loss": 0.0001,
"step": 16475
},
{
"epoch": 165.0,
"learning_rate": 2.2315822784810128e-05,
"loss": 0.0001,
"step": 16500
},
{
"epoch": 165.25,
"learning_rate": 2.2292088607594938e-05,
"loss": 0.0001,
"step": 16525
},
{
"epoch": 165.5,
"learning_rate": 2.2268354430379747e-05,
"loss": 0.0001,
"step": 16550
},
{
"epoch": 165.75,
"learning_rate": 2.2244620253164557e-05,
"loss": 0.0001,
"step": 16575
},
{
"epoch": 166.0,
"learning_rate": 2.2220886075949366e-05,
"loss": 0.0001,
"step": 16600
},
{
"epoch": 166.25,
"learning_rate": 2.2197151898734176e-05,
"loss": 0.0001,
"step": 16625
},
{
"epoch": 166.5,
"learning_rate": 2.2173417721518985e-05,
"loss": 0.0001,
"step": 16650
},
{
"epoch": 166.75,
"learning_rate": 2.2149683544303798e-05,
"loss": 0.0001,
"step": 16675
},
{
"epoch": 167.0,
"learning_rate": 2.2125949367088608e-05,
"loss": 0.0001,
"step": 16700
},
{
"epoch": 167.25,
"learning_rate": 2.2102215189873417e-05,
"loss": 0.0001,
"step": 16725
},
{
"epoch": 167.5,
"learning_rate": 2.2078481012658227e-05,
"loss": 0.0001,
"step": 16750
},
{
"epoch": 167.75,
"learning_rate": 2.2054746835443036e-05,
"loss": 0.0001,
"step": 16775
},
{
"epoch": 168.0,
"learning_rate": 2.2031012658227846e-05,
"loss": 0.0001,
"step": 16800
},
{
"epoch": 168.25,
"learning_rate": 2.2007278481012655e-05,
"loss": 0.0,
"step": 16825
},
{
"epoch": 168.5,
"learning_rate": 2.1983544303797468e-05,
"loss": 0.0,
"step": 16850
},
{
"epoch": 168.75,
"learning_rate": 2.1959810126582277e-05,
"loss": 0.0,
"step": 16875
},
{
"epoch": 169.0,
"learning_rate": 2.1936075949367087e-05,
"loss": 0.0001,
"step": 16900
},
{
"epoch": 169.25,
"learning_rate": 2.1912341772151896e-05,
"loss": 0.0,
"step": 16925
},
{
"epoch": 169.5,
"learning_rate": 2.1888607594936706e-05,
"loss": 0.0001,
"step": 16950
},
{
"epoch": 169.75,
"learning_rate": 2.1864873417721515e-05,
"loss": 0.0,
"step": 16975
},
{
"epoch": 170.0,
"learning_rate": 2.1841139240506325e-05,
"loss": 0.0,
"step": 17000
},
{
"epoch": 170.0,
"eval_loss": 0.49322769045829773,
"eval_runtime": 80.3155,
"eval_samples_per_second": 158.649,
"eval_steps_per_second": 1.245,
"eval_wer": 19.169141785211817,
"step": 17000
},
{
"epoch": 170.25,
"learning_rate": 2.1817405063291138e-05,
"loss": 0.0,
"step": 17025
},
{
"epoch": 170.5,
"learning_rate": 2.1793670886075947e-05,
"loss": 0.0,
"step": 17050
},
{
"epoch": 170.75,
"learning_rate": 2.1769936708860757e-05,
"loss": 0.0,
"step": 17075
},
{
"epoch": 171.0,
"learning_rate": 2.1746202531645566e-05,
"loss": 0.0001,
"step": 17100
},
{
"epoch": 171.25,
"learning_rate": 2.1722468354430376e-05,
"loss": 0.0,
"step": 17125
},
{
"epoch": 171.5,
"learning_rate": 2.1698734177215185e-05,
"loss": 0.0001,
"step": 17150
},
{
"epoch": 171.75,
"learning_rate": 2.1674999999999995e-05,
"loss": 0.0,
"step": 17175
},
{
"epoch": 172.0,
"learning_rate": 2.1651265822784808e-05,
"loss": 0.0,
"step": 17200
},
{
"epoch": 172.25,
"learning_rate": 2.1627531645569617e-05,
"loss": 0.0,
"step": 17225
},
{
"epoch": 172.5,
"learning_rate": 2.1603797468354427e-05,
"loss": 0.0,
"step": 17250
},
{
"epoch": 172.75,
"learning_rate": 2.1580063291139236e-05,
"loss": 0.0,
"step": 17275
},
{
"epoch": 173.0,
"learning_rate": 2.155632911392405e-05,
"loss": 0.0,
"step": 17300
},
{
"epoch": 173.25,
"learning_rate": 2.1532594936708862e-05,
"loss": 0.0,
"step": 17325
},
{
"epoch": 173.5,
"learning_rate": 2.150886075949367e-05,
"loss": 0.0,
"step": 17350
},
{
"epoch": 173.75,
"learning_rate": 2.148512658227848e-05,
"loss": 0.0,
"step": 17375
},
{
"epoch": 174.0,
"learning_rate": 2.146139240506329e-05,
"loss": 0.0,
"step": 17400
},
{
"epoch": 174.25,
"learning_rate": 2.14376582278481e-05,
"loss": 0.0,
"step": 17425
},
{
"epoch": 174.5,
"learning_rate": 2.141392405063291e-05,
"loss": 0.0,
"step": 17450
},
{
"epoch": 174.75,
"learning_rate": 2.139018987341772e-05,
"loss": 0.0,
"step": 17475
},
{
"epoch": 175.0,
"learning_rate": 2.1366455696202532e-05,
"loss": 0.0,
"step": 17500
},
{
"epoch": 175.25,
"learning_rate": 2.134272151898734e-05,
"loss": 0.0,
"step": 17525
},
{
"epoch": 175.5,
"learning_rate": 2.131898734177215e-05,
"loss": 0.0,
"step": 17550
},
{
"epoch": 175.75,
"learning_rate": 2.129525316455696e-05,
"loss": 0.0,
"step": 17575
},
{
"epoch": 176.0,
"learning_rate": 2.127151898734177e-05,
"loss": 0.0,
"step": 17600
},
{
"epoch": 176.25,
"learning_rate": 2.124778481012658e-05,
"loss": 0.0,
"step": 17625
},
{
"epoch": 176.5,
"learning_rate": 2.122405063291139e-05,
"loss": 0.0,
"step": 17650
},
{
"epoch": 176.75,
"learning_rate": 2.1200316455696202e-05,
"loss": 0.0,
"step": 17675
},
{
"epoch": 177.0,
"learning_rate": 2.117658227848101e-05,
"loss": 0.0,
"step": 17700
},
{
"epoch": 177.25,
"learning_rate": 2.115284810126582e-05,
"loss": 0.0,
"step": 17725
},
{
"epoch": 177.5,
"learning_rate": 2.112911392405063e-05,
"loss": 0.0,
"step": 17750
},
{
"epoch": 177.75,
"learning_rate": 2.110537974683544e-05,
"loss": 0.0,
"step": 17775
},
{
"epoch": 178.0,
"learning_rate": 2.108164556962025e-05,
"loss": 0.0,
"step": 17800
},
{
"epoch": 178.25,
"learning_rate": 2.1057911392405062e-05,
"loss": 0.0,
"step": 17825
},
{
"epoch": 178.5,
"learning_rate": 2.1034177215189872e-05,
"loss": 0.0,
"step": 17850
},
{
"epoch": 178.75,
"learning_rate": 2.101044303797468e-05,
"loss": 0.0,
"step": 17875
},
{
"epoch": 179.0,
"learning_rate": 2.098670886075949e-05,
"loss": 0.0,
"step": 17900
},
{
"epoch": 179.25,
"learning_rate": 2.09629746835443e-05,
"loss": 0.0,
"step": 17925
},
{
"epoch": 179.5,
"learning_rate": 2.093924050632911e-05,
"loss": 0.0,
"step": 17950
},
{
"epoch": 179.75,
"learning_rate": 2.091550632911392e-05,
"loss": 0.0,
"step": 17975
},
{
"epoch": 180.0,
"learning_rate": 2.0891772151898732e-05,
"loss": 0.0,
"step": 18000
},
{
"epoch": 180.0,
"eval_loss": 0.5040577054023743,
"eval_runtime": 80.2662,
"eval_samples_per_second": 158.747,
"eval_steps_per_second": 1.246,
"eval_wer": 19.1290839455995,
"step": 18000
},
{
"epoch": 180.25,
"learning_rate": 2.0868037974683542e-05,
"loss": 0.0,
"step": 18025
},
{
"epoch": 180.5,
"learning_rate": 2.084430379746835e-05,
"loss": 0.0,
"step": 18050
},
{
"epoch": 180.75,
"learning_rate": 2.082056962025316e-05,
"loss": 0.0,
"step": 18075
},
{
"epoch": 181.0,
"learning_rate": 2.0796835443037974e-05,
"loss": 0.0,
"step": 18100
},
{
"epoch": 181.25,
"learning_rate": 2.0773101265822783e-05,
"loss": 0.0,
"step": 18125
},
{
"epoch": 181.5,
"learning_rate": 2.0749367088607596e-05,
"loss": 0.0,
"step": 18150
},
{
"epoch": 181.75,
"learning_rate": 2.0725632911392406e-05,
"loss": 0.0,
"step": 18175
},
{
"epoch": 182.0,
"learning_rate": 2.0701898734177215e-05,
"loss": 0.0,
"step": 18200
},
{
"epoch": 182.25,
"learning_rate": 2.0678164556962025e-05,
"loss": 0.0,
"step": 18225
},
{
"epoch": 182.5,
"learning_rate": 2.0654430379746834e-05,
"loss": 0.0,
"step": 18250
},
{
"epoch": 182.75,
"learning_rate": 2.0630696202531644e-05,
"loss": 0.0,
"step": 18275
},
{
"epoch": 183.0,
"learning_rate": 2.0606962025316457e-05,
"loss": 0.0,
"step": 18300
},
{
"epoch": 183.25,
"learning_rate": 2.0583227848101266e-05,
"loss": 0.0,
"step": 18325
},
{
"epoch": 183.5,
"learning_rate": 2.0559493670886076e-05,
"loss": 0.0,
"step": 18350
},
{
"epoch": 183.75,
"learning_rate": 2.0535759493670885e-05,
"loss": 0.0,
"step": 18375
},
{
"epoch": 184.0,
"learning_rate": 2.0512025316455695e-05,
"loss": 0.0,
"step": 18400
},
{
"epoch": 184.25,
"learning_rate": 2.0488291139240504e-05,
"loss": 0.0,
"step": 18425
},
{
"epoch": 184.5,
"learning_rate": 2.0464556962025314e-05,
"loss": 0.0,
"step": 18450
},
{
"epoch": 184.75,
"learning_rate": 2.0440822784810127e-05,
"loss": 0.0,
"step": 18475
},
{
"epoch": 185.0,
"learning_rate": 2.0417088607594936e-05,
"loss": 0.0,
"step": 18500
},
{
"epoch": 185.25,
"learning_rate": 2.0393354430379746e-05,
"loss": 0.0,
"step": 18525
},
{
"epoch": 185.5,
"learning_rate": 2.0369620253164555e-05,
"loss": 0.0,
"step": 18550
},
{
"epoch": 185.75,
"learning_rate": 2.0345886075949365e-05,
"loss": 0.0,
"step": 18575
},
{
"epoch": 186.0,
"learning_rate": 2.0322151898734174e-05,
"loss": 0.0,
"step": 18600
},
{
"epoch": 186.25,
"learning_rate": 2.0298417721518984e-05,
"loss": 0.0,
"step": 18625
},
{
"epoch": 186.5,
"learning_rate": 2.0274683544303796e-05,
"loss": 0.0,
"step": 18650
},
{
"epoch": 186.75,
"learning_rate": 2.0250949367088606e-05,
"loss": 0.0,
"step": 18675
},
{
"epoch": 187.0,
"learning_rate": 2.0227215189873415e-05,
"loss": 0.0,
"step": 18700
},
{
"epoch": 187.25,
"learning_rate": 2.0203481012658225e-05,
"loss": 0.0,
"step": 18725
},
{
"epoch": 187.5,
"learning_rate": 2.0179746835443035e-05,
"loss": 0.0,
"step": 18750
},
{
"epoch": 187.75,
"learning_rate": 2.0156012658227844e-05,
"loss": 0.0,
"step": 18775
},
{
"epoch": 188.0,
"learning_rate": 2.0132278481012654e-05,
"loss": 0.0,
"step": 18800
},
{
"epoch": 188.25,
"learning_rate": 2.0108544303797466e-05,
"loss": 0.0,
"step": 18825
},
{
"epoch": 188.5,
"learning_rate": 2.0084810126582276e-05,
"loss": 0.0,
"step": 18850
},
{
"epoch": 188.75,
"learning_rate": 2.0061075949367085e-05,
"loss": 0.0,
"step": 18875
},
{
"epoch": 189.0,
"learning_rate": 2.0037341772151895e-05,
"loss": 0.0,
"step": 18900
},
{
"epoch": 189.25,
"learning_rate": 2.0013607594936708e-05,
"loss": 0.0,
"step": 18925
},
{
"epoch": 189.5,
"learning_rate": 1.998987341772152e-05,
"loss": 0.0,
"step": 18950
},
{
"epoch": 189.75,
"learning_rate": 1.996613924050633e-05,
"loss": 0.0,
"step": 18975
},
{
"epoch": 190.0,
"learning_rate": 1.994240506329114e-05,
"loss": 0.0,
"step": 19000
},
{
"epoch": 190.0,
"eval_loss": 0.5146323442459106,
"eval_runtime": 80.5291,
"eval_samples_per_second": 158.229,
"eval_steps_per_second": 1.242,
"eval_wer": 19.094888228857275,
"step": 19000
},
{
"epoch": 190.25,
"learning_rate": 1.991867088607595e-05,
"loss": 0.0,
"step": 19025
},
{
"epoch": 190.5,
"learning_rate": 1.989493670886076e-05,
"loss": 0.0,
"step": 19050
},
{
"epoch": 190.75,
"learning_rate": 1.9871202531645568e-05,
"loss": 0.0,
"step": 19075
},
{
"epoch": 191.0,
"learning_rate": 1.9847468354430378e-05,
"loss": 0.0,
"step": 19100
},
{
"epoch": 191.25,
"learning_rate": 1.982373417721519e-05,
"loss": 0.0,
"step": 19125
},
{
"epoch": 191.5,
"learning_rate": 1.98e-05,
"loss": 0.0,
"step": 19150
},
{
"epoch": 191.75,
"learning_rate": 1.977626582278481e-05,
"loss": 0.0,
"step": 19175
},
{
"epoch": 192.0,
"learning_rate": 1.975253164556962e-05,
"loss": 0.0,
"step": 19200
},
{
"epoch": 192.25,
"learning_rate": 1.972879746835443e-05,
"loss": 0.0,
"step": 19225
},
{
"epoch": 192.5,
"learning_rate": 1.9705063291139238e-05,
"loss": 0.0,
"step": 19250
},
{
"epoch": 192.75,
"learning_rate": 1.9681329113924048e-05,
"loss": 0.0,
"step": 19275
},
{
"epoch": 193.0,
"learning_rate": 1.965759493670886e-05,
"loss": 0.0,
"step": 19300
},
{
"epoch": 193.25,
"learning_rate": 1.963386075949367e-05,
"loss": 0.0,
"step": 19325
},
{
"epoch": 193.5,
"learning_rate": 1.961012658227848e-05,
"loss": 0.0,
"step": 19350
},
{
"epoch": 193.75,
"learning_rate": 1.958639240506329e-05,
"loss": 0.0,
"step": 19375
},
{
"epoch": 194.0,
"learning_rate": 1.95626582278481e-05,
"loss": 0.0,
"step": 19400
},
{
"epoch": 194.25,
"learning_rate": 1.9538924050632908e-05,
"loss": 0.0,
"step": 19425
},
{
"epoch": 194.5,
"learning_rate": 1.9515189873417718e-05,
"loss": 0.0,
"step": 19450
},
{
"epoch": 194.75,
"learning_rate": 1.949145569620253e-05,
"loss": 0.0,
"step": 19475
},
{
"epoch": 195.0,
"learning_rate": 1.946772151898734e-05,
"loss": 0.0,
"step": 19500
},
{
"epoch": 195.25,
"learning_rate": 1.944398734177215e-05,
"loss": 0.0,
"step": 19525
},
{
"epoch": 195.5,
"learning_rate": 1.942025316455696e-05,
"loss": 0.0,
"step": 19550
},
{
"epoch": 195.75,
"learning_rate": 1.939651898734177e-05,
"loss": 0.0,
"step": 19575
},
{
"epoch": 196.0,
"learning_rate": 1.9372784810126578e-05,
"loss": 0.0,
"step": 19600
},
{
"epoch": 196.25,
"learning_rate": 1.9349050632911388e-05,
"loss": 0.0,
"step": 19625
},
{
"epoch": 196.5,
"learning_rate": 1.93253164556962e-05,
"loss": 0.0,
"step": 19650
},
{
"epoch": 196.75,
"learning_rate": 1.930158227848101e-05,
"loss": 0.0,
"step": 19675
},
{
"epoch": 197.0,
"learning_rate": 1.927784810126582e-05,
"loss": 0.0,
"step": 19700
},
{
"epoch": 197.25,
"learning_rate": 1.925411392405063e-05,
"loss": 0.0,
"step": 19725
},
{
"epoch": 197.5,
"learning_rate": 1.9230379746835442e-05,
"loss": 0.0,
"step": 19750
},
{
"epoch": 197.75,
"learning_rate": 1.9206645569620255e-05,
"loss": 0.0,
"step": 19775
},
{
"epoch": 198.0,
"learning_rate": 1.9182911392405064e-05,
"loss": 0.0,
"step": 19800
},
{
"epoch": 198.25,
"learning_rate": 1.9159177215189874e-05,
"loss": 0.0,
"step": 19825
},
{
"epoch": 198.5,
"learning_rate": 1.9135443037974683e-05,
"loss": 0.0,
"step": 19850
},
{
"epoch": 198.75,
"learning_rate": 1.9111708860759493e-05,
"loss": 0.0,
"step": 19875
},
{
"epoch": 199.0,
"learning_rate": 1.9087974683544302e-05,
"loss": 0.0,
"step": 19900
},
{
"epoch": 199.25,
"learning_rate": 1.9064240506329112e-05,
"loss": 0.0,
"step": 19925
},
{
"epoch": 199.5,
"learning_rate": 1.9040506329113925e-05,
"loss": 0.0,
"step": 19950
},
{
"epoch": 199.75,
"learning_rate": 1.9016772151898734e-05,
"loss": 0.0,
"step": 19975
},
{
"epoch": 200.0,
"learning_rate": 1.8993037974683544e-05,
"loss": 0.0,
"step": 20000
},
{
"epoch": 200.0,
"eval_loss": 0.5253657698631287,
"eval_runtime": 80.492,
"eval_samples_per_second": 158.301,
"eval_steps_per_second": 1.242,
"eval_wer": 19.123221822729406,
"step": 20000
},
{
"epoch": 200.25,
"learning_rate": 1.8969303797468353e-05,
"loss": 0.0,
"step": 20025
},
{
"epoch": 200.5,
"learning_rate": 1.8945569620253163e-05,
"loss": 0.0,
"step": 20050
},
{
"epoch": 200.75,
"learning_rate": 1.8921835443037972e-05,
"loss": 0.0,
"step": 20075
},
{
"epoch": 201.0,
"learning_rate": 1.8898101265822785e-05,
"loss": 0.0,
"step": 20100
},
{
"epoch": 201.25,
"learning_rate": 1.8874367088607595e-05,
"loss": 0.0,
"step": 20125
},
{
"epoch": 201.5,
"learning_rate": 1.8850632911392404e-05,
"loss": 0.0,
"step": 20150
},
{
"epoch": 201.75,
"learning_rate": 1.8826898734177214e-05,
"loss": 0.0,
"step": 20175
},
{
"epoch": 202.0,
"learning_rate": 1.8803164556962023e-05,
"loss": 0.0,
"step": 20200
},
{
"epoch": 202.25,
"learning_rate": 1.8779430379746833e-05,
"loss": 0.0,
"step": 20225
},
{
"epoch": 202.5,
"learning_rate": 1.8755696202531642e-05,
"loss": 0.0,
"step": 20250
},
{
"epoch": 202.75,
"learning_rate": 1.8731962025316455e-05,
"loss": 0.0,
"step": 20275
},
{
"epoch": 203.0,
"learning_rate": 1.8708227848101265e-05,
"loss": 0.0,
"step": 20300
},
{
"epoch": 203.25,
"learning_rate": 1.8684493670886074e-05,
"loss": 0.0,
"step": 20325
},
{
"epoch": 203.5,
"learning_rate": 1.8660759493670884e-05,
"loss": 0.0,
"step": 20350
},
{
"epoch": 203.75,
"learning_rate": 1.8637025316455696e-05,
"loss": 0.0,
"step": 20375
},
{
"epoch": 204.0,
"learning_rate": 1.8613291139240506e-05,
"loss": 0.0,
"step": 20400
},
{
"epoch": 204.25,
"learning_rate": 1.8589556962025316e-05,
"loss": 0.0,
"step": 20425
},
{
"epoch": 204.5,
"learning_rate": 1.8565822784810125e-05,
"loss": 0.0,
"step": 20450
},
{
"epoch": 204.75,
"learning_rate": 1.8542088607594935e-05,
"loss": 0.0,
"step": 20475
},
{
"epoch": 205.0,
"learning_rate": 1.8518354430379744e-05,
"loss": 0.0,
"step": 20500
},
{
"epoch": 205.25,
"learning_rate": 1.8494620253164557e-05,
"loss": 0.0,
"step": 20525
},
{
"epoch": 205.5,
"learning_rate": 1.8470886075949366e-05,
"loss": 0.0,
"step": 20550
},
{
"epoch": 205.75,
"learning_rate": 1.8447151898734176e-05,
"loss": 0.0,
"step": 20575
},
{
"epoch": 206.0,
"learning_rate": 1.8423417721518985e-05,
"loss": 0.0,
"step": 20600
},
{
"epoch": 206.25,
"learning_rate": 1.8399683544303795e-05,
"loss": 0.0,
"step": 20625
},
{
"epoch": 206.5,
"learning_rate": 1.8375949367088604e-05,
"loss": 0.0,
"step": 20650
},
{
"epoch": 206.75,
"learning_rate": 1.8352215189873414e-05,
"loss": 0.0,
"step": 20675
},
{
"epoch": 207.0,
"learning_rate": 1.8328481012658227e-05,
"loss": 0.0,
"step": 20700
},
{
"epoch": 207.25,
"learning_rate": 1.8304746835443036e-05,
"loss": 0.0,
"step": 20725
},
{
"epoch": 207.5,
"learning_rate": 1.8281012658227846e-05,
"loss": 0.0,
"step": 20750
},
{
"epoch": 207.75,
"learning_rate": 1.825727848101266e-05,
"loss": 0.0,
"step": 20775
},
{
"epoch": 208.0,
"learning_rate": 1.8233544303797468e-05,
"loss": 0.0,
"step": 20800
},
{
"epoch": 208.25,
"learning_rate": 1.8209810126582278e-05,
"loss": 0.0,
"step": 20825
},
{
"epoch": 208.5,
"learning_rate": 1.8186075949367087e-05,
"loss": 0.0,
"step": 20850
},
{
"epoch": 208.75,
"learning_rate": 1.8162341772151897e-05,
"loss": 0.0,
"step": 20875
},
{
"epoch": 209.0,
"learning_rate": 1.8138607594936706e-05,
"loss": 0.0,
"step": 20900
},
{
"epoch": 209.25,
"learning_rate": 1.811487341772152e-05,
"loss": 0.0,
"step": 20925
},
{
"epoch": 209.5,
"learning_rate": 1.809113924050633e-05,
"loss": 0.0,
"step": 20950
},
{
"epoch": 209.75,
"learning_rate": 1.8067405063291138e-05,
"loss": 0.0,
"step": 20975
},
{
"epoch": 210.0,
"learning_rate": 1.8043670886075948e-05,
"loss": 0.0,
"step": 21000
},
{
"epoch": 210.0,
"eval_loss": 0.5368518233299255,
"eval_runtime": 80.6917,
"eval_samples_per_second": 157.91,
"eval_steps_per_second": 1.239,
"eval_wer": 19.136900109426293,
"step": 21000
},
{
"epoch": 210.25,
"learning_rate": 1.8019936708860757e-05,
"loss": 0.0,
"step": 21025
},
{
"epoch": 210.5,
"learning_rate": 1.7996202531645567e-05,
"loss": 0.0,
"step": 21050
},
{
"epoch": 210.75,
"learning_rate": 1.7972468354430376e-05,
"loss": 0.0,
"step": 21075
},
{
"epoch": 211.0,
"learning_rate": 1.794873417721519e-05,
"loss": 0.0,
"step": 21100
},
{
"epoch": 211.25,
"learning_rate": 1.7925e-05,
"loss": 0.0,
"step": 21125
},
{
"epoch": 211.5,
"learning_rate": 1.7901265822784808e-05,
"loss": 0.0,
"step": 21150
},
{
"epoch": 211.75,
"learning_rate": 1.7877531645569618e-05,
"loss": 0.0,
"step": 21175
},
{
"epoch": 212.0,
"learning_rate": 1.785379746835443e-05,
"loss": 0.0,
"step": 21200
},
{
"epoch": 212.25,
"learning_rate": 1.783006329113924e-05,
"loss": 0.0,
"step": 21225
},
{
"epoch": 212.5,
"learning_rate": 1.780632911392405e-05,
"loss": 0.0,
"step": 21250
},
{
"epoch": 212.75,
"learning_rate": 1.778259493670886e-05,
"loss": 0.0,
"step": 21275
},
{
"epoch": 213.0,
"learning_rate": 1.775886075949367e-05,
"loss": 0.0,
"step": 21300
},
{
"epoch": 213.25,
"learning_rate": 1.773512658227848e-05,
"loss": 0.0,
"step": 21325
},
{
"epoch": 213.5,
"learning_rate": 1.771139240506329e-05,
"loss": 0.0,
"step": 21350
},
{
"epoch": 213.75,
"learning_rate": 1.76876582278481e-05,
"loss": 0.0,
"step": 21375
},
{
"epoch": 214.0,
"learning_rate": 1.766392405063291e-05,
"loss": 0.0,
"step": 21400
},
{
"epoch": 214.25,
"learning_rate": 1.764018987341772e-05,
"loss": 0.0,
"step": 21425
},
{
"epoch": 214.5,
"learning_rate": 1.761645569620253e-05,
"loss": 0.0,
"step": 21450
},
{
"epoch": 214.75,
"learning_rate": 1.759272151898734e-05,
"loss": 0.0,
"step": 21475
},
{
"epoch": 215.0,
"learning_rate": 1.756898734177215e-05,
"loss": 0.0,
"step": 21500
},
{
"epoch": 215.25,
"learning_rate": 1.754525316455696e-05,
"loss": 0.0,
"step": 21525
},
{
"epoch": 215.5,
"learning_rate": 1.752151898734177e-05,
"loss": 0.0,
"step": 21550
},
{
"epoch": 215.75,
"learning_rate": 1.749778481012658e-05,
"loss": 0.0,
"step": 21575
},
{
"epoch": 216.0,
"learning_rate": 1.7474050632911393e-05,
"loss": 0.0,
"step": 21600
},
{
"epoch": 216.25,
"learning_rate": 1.7450316455696202e-05,
"loss": 0.0,
"step": 21625
},
{
"epoch": 216.5,
"learning_rate": 1.7426582278481012e-05,
"loss": 0.0,
"step": 21650
},
{
"epoch": 216.75,
"learning_rate": 1.740284810126582e-05,
"loss": 0.0,
"step": 21675
},
{
"epoch": 217.0,
"learning_rate": 1.737911392405063e-05,
"loss": 0.0,
"step": 21700
},
{
"epoch": 217.25,
"learning_rate": 1.735537974683544e-05,
"loss": 0.0,
"step": 21725
},
{
"epoch": 217.5,
"learning_rate": 1.7331645569620253e-05,
"loss": 0.0,
"step": 21750
},
{
"epoch": 217.75,
"learning_rate": 1.7307911392405063e-05,
"loss": 0.0,
"step": 21775
},
{
"epoch": 218.0,
"learning_rate": 1.7284177215189872e-05,
"loss": 0.0,
"step": 21800
},
{
"epoch": 218.25,
"learning_rate": 1.7260443037974682e-05,
"loss": 0.0,
"step": 21825
},
{
"epoch": 218.5,
"learning_rate": 1.723670886075949e-05,
"loss": 0.0,
"step": 21850
},
{
"epoch": 218.75,
"learning_rate": 1.72129746835443e-05,
"loss": 0.0,
"step": 21875
},
{
"epoch": 219.0,
"learning_rate": 1.718924050632911e-05,
"loss": 0.0,
"step": 21900
},
{
"epoch": 219.25,
"learning_rate": 1.7165506329113923e-05,
"loss": 0.0,
"step": 21925
},
{
"epoch": 219.5,
"learning_rate": 1.7141772151898733e-05,
"loss": 0.0,
"step": 21950
},
{
"epoch": 219.75,
"learning_rate": 1.7118037974683542e-05,
"loss": 0.0,
"step": 21975
},
{
"epoch": 220.0,
"learning_rate": 1.7094303797468352e-05,
"loss": 0.0,
"step": 22000
},
{
"epoch": 220.0,
"eval_loss": 0.5483614802360535,
"eval_runtime": 80.6444,
"eval_samples_per_second": 158.002,
"eval_steps_per_second": 1.24,
"eval_wer": 19.112474597467564,
"step": 22000
},
{
"epoch": 220.25,
"learning_rate": 1.7070569620253165e-05,
"loss": 0.0,
"step": 22025
},
{
"epoch": 220.5,
"learning_rate": 1.7046835443037974e-05,
"loss": 0.0,
"step": 22050
},
{
"epoch": 220.75,
"learning_rate": 1.7023101265822784e-05,
"loss": 0.0,
"step": 22075
},
{
"epoch": 221.0,
"learning_rate": 1.6999367088607593e-05,
"loss": 0.0,
"step": 22100
},
{
"epoch": 221.25,
"learning_rate": 1.6975632911392403e-05,
"loss": 0.0,
"step": 22125
},
{
"epoch": 221.5,
"learning_rate": 1.6951898734177216e-05,
"loss": 0.0,
"step": 22150
},
{
"epoch": 221.75,
"learning_rate": 1.6928164556962025e-05,
"loss": 0.0,
"step": 22175
},
{
"epoch": 222.0,
"learning_rate": 1.6904430379746835e-05,
"loss": 0.0,
"step": 22200
},
{
"epoch": 222.25,
"learning_rate": 1.6880696202531644e-05,
"loss": 0.0,
"step": 22225
},
{
"epoch": 222.5,
"learning_rate": 1.6856962025316454e-05,
"loss": 0.0,
"step": 22250
},
{
"epoch": 222.75,
"learning_rate": 1.6833227848101263e-05,
"loss": 0.0,
"step": 22275
},
{
"epoch": 223.0,
"learning_rate": 1.6809493670886073e-05,
"loss": 0.0,
"step": 22300
},
{
"epoch": 223.25,
"learning_rate": 1.6785759493670885e-05,
"loss": 0.0,
"step": 22325
},
{
"epoch": 223.5,
"learning_rate": 1.6762025316455695e-05,
"loss": 0.0,
"step": 22350
},
{
"epoch": 223.75,
"learning_rate": 1.6738291139240504e-05,
"loss": 0.0,
"step": 22375
},
{
"epoch": 224.0,
"learning_rate": 1.6714556962025314e-05,
"loss": 0.0,
"step": 22400
},
{
"epoch": 224.25,
"learning_rate": 1.6690822784810127e-05,
"loss": 0.0,
"step": 22425
},
{
"epoch": 224.5,
"learning_rate": 1.6667088607594936e-05,
"loss": 0.0,
"step": 22450
},
{
"epoch": 224.75,
"learning_rate": 1.6643354430379746e-05,
"loss": 0.0,
"step": 22475
},
{
"epoch": 225.0,
"learning_rate": 1.6619620253164555e-05,
"loss": 0.0,
"step": 22500
},
{
"epoch": 225.25,
"learning_rate": 1.6595886075949365e-05,
"loss": 0.0,
"step": 22525
},
{
"epoch": 225.5,
"learning_rate": 1.6572151898734178e-05,
"loss": 0.0,
"step": 22550
},
{
"epoch": 225.75,
"learning_rate": 1.6548417721518987e-05,
"loss": 0.0,
"step": 22575
},
{
"epoch": 226.0,
"learning_rate": 1.6524683544303797e-05,
"loss": 0.0,
"step": 22600
},
{
"epoch": 226.25,
"learning_rate": 1.6500949367088606e-05,
"loss": 0.0,
"step": 22625
},
{
"epoch": 226.5,
"learning_rate": 1.6477215189873416e-05,
"loss": 0.0,
"step": 22650
},
{
"epoch": 226.75,
"learning_rate": 1.6453481012658225e-05,
"loss": 0.0,
"step": 22675
},
{
"epoch": 227.0,
"learning_rate": 1.6429746835443035e-05,
"loss": 0.0,
"step": 22700
},
{
"epoch": 227.25,
"learning_rate": 1.6406012658227848e-05,
"loss": 0.0,
"step": 22725
},
{
"epoch": 227.5,
"learning_rate": 1.6382278481012657e-05,
"loss": 0.0,
"step": 22750
},
{
"epoch": 227.75,
"learning_rate": 1.6358544303797467e-05,
"loss": 0.0,
"step": 22775
},
{
"epoch": 228.0,
"learning_rate": 1.6334810126582276e-05,
"loss": 0.0,
"step": 22800
},
{
"epoch": 228.25,
"learning_rate": 1.6311075949367086e-05,
"loss": 0.0,
"step": 22825
},
{
"epoch": 228.5,
"learning_rate": 1.62873417721519e-05,
"loss": 0.0,
"step": 22850
},
{
"epoch": 228.75,
"learning_rate": 1.6263607594936708e-05,
"loss": 0.0,
"step": 22875
},
{
"epoch": 229.0,
"learning_rate": 1.6239873417721518e-05,
"loss": 0.0,
"step": 22900
},
{
"epoch": 229.25,
"learning_rate": 1.6216139240506327e-05,
"loss": 0.0,
"step": 22925
},
{
"epoch": 229.5,
"learning_rate": 1.6192405063291137e-05,
"loss": 0.0,
"step": 22950
},
{
"epoch": 229.75,
"learning_rate": 1.616867088607595e-05,
"loss": 0.0,
"step": 22975
},
{
"epoch": 230.0,
"learning_rate": 1.614493670886076e-05,
"loss": 0.0,
"step": 23000
},
{
"epoch": 230.0,
"eval_loss": 0.5606202483177185,
"eval_runtime": 80.6021,
"eval_samples_per_second": 158.085,
"eval_steps_per_second": 1.241,
"eval_wer": 19.132992027512895,
"step": 23000
},
{
"epoch": 230.25,
"learning_rate": 1.612120253164557e-05,
"loss": 0.0,
"step": 23025
},
{
"epoch": 230.5,
"learning_rate": 1.6097468354430378e-05,
"loss": 0.0,
"step": 23050
},
{
"epoch": 230.75,
"learning_rate": 1.6073734177215188e-05,
"loss": 0.0,
"step": 23075
},
{
"epoch": 231.0,
"learning_rate": 1.6049999999999997e-05,
"loss": 0.0,
"step": 23100
},
{
"epoch": 231.25,
"learning_rate": 1.6026265822784807e-05,
"loss": 0.0,
"step": 23125
},
{
"epoch": 231.5,
"learning_rate": 1.600253164556962e-05,
"loss": 0.0,
"step": 23150
},
{
"epoch": 231.75,
"learning_rate": 1.597879746835443e-05,
"loss": 0.0,
"step": 23175
},
{
"epoch": 232.0,
"learning_rate": 1.595506329113924e-05,
"loss": 0.0,
"step": 23200
},
{
"epoch": 232.25,
"learning_rate": 1.5931329113924048e-05,
"loss": 0.0,
"step": 23225
},
{
"epoch": 232.5,
"learning_rate": 1.590759493670886e-05,
"loss": 0.0,
"step": 23250
},
{
"epoch": 232.75,
"learning_rate": 1.588386075949367e-05,
"loss": 0.0,
"step": 23275
},
{
"epoch": 233.0,
"learning_rate": 1.586012658227848e-05,
"loss": 0.0,
"step": 23300
},
{
"epoch": 233.25,
"learning_rate": 1.583639240506329e-05,
"loss": 0.0,
"step": 23325
},
{
"epoch": 233.5,
"learning_rate": 1.58126582278481e-05,
"loss": 0.0,
"step": 23350
},
{
"epoch": 233.75,
"learning_rate": 1.5788924050632912e-05,
"loss": 0.0,
"step": 23375
},
{
"epoch": 234.0,
"learning_rate": 1.576518987341772e-05,
"loss": 0.0,
"step": 23400
},
{
"epoch": 234.25,
"learning_rate": 1.574145569620253e-05,
"loss": 0.0,
"step": 23425
},
{
"epoch": 234.5,
"learning_rate": 1.571772151898734e-05,
"loss": 0.0,
"step": 23450
},
{
"epoch": 234.75,
"learning_rate": 1.569398734177215e-05,
"loss": 0.0,
"step": 23475
},
{
"epoch": 235.0,
"learning_rate": 1.567025316455696e-05,
"loss": 0.0,
"step": 23500
},
{
"epoch": 235.25,
"learning_rate": 1.564651898734177e-05,
"loss": 0.0,
"step": 23525
},
{
"epoch": 235.5,
"learning_rate": 1.5622784810126582e-05,
"loss": 0.0,
"step": 23550
},
{
"epoch": 235.75,
"learning_rate": 1.559905063291139e-05,
"loss": 0.0,
"step": 23575
},
{
"epoch": 236.0,
"learning_rate": 1.55753164556962e-05,
"loss": 0.0,
"step": 23600
},
{
"epoch": 236.25,
"learning_rate": 1.555158227848101e-05,
"loss": 0.0,
"step": 23625
},
{
"epoch": 236.5,
"learning_rate": 1.552784810126582e-05,
"loss": 0.0,
"step": 23650
},
{
"epoch": 236.75,
"learning_rate": 1.5504113924050633e-05,
"loss": 0.0,
"step": 23675
},
{
"epoch": 237.0,
"learning_rate": 1.5480379746835442e-05,
"loss": 0.0,
"step": 23700
},
{
"epoch": 237.25,
"learning_rate": 1.5456645569620252e-05,
"loss": 0.0,
"step": 23725
},
{
"epoch": 237.5,
"learning_rate": 1.543291139240506e-05,
"loss": 0.0,
"step": 23750
},
{
"epoch": 237.75,
"learning_rate": 1.5409177215189874e-05,
"loss": 0.0,
"step": 23775
},
{
"epoch": 238.0,
"learning_rate": 1.5385443037974684e-05,
"loss": 0.0,
"step": 23800
},
{
"epoch": 238.25,
"learning_rate": 1.5361708860759493e-05,
"loss": 0.0,
"step": 23825
},
{
"epoch": 238.5,
"learning_rate": 1.5337974683544303e-05,
"loss": 0.0,
"step": 23850
},
{
"epoch": 238.75,
"learning_rate": 1.5314240506329112e-05,
"loss": 0.0,
"step": 23875
},
{
"epoch": 239.0,
"learning_rate": 1.529050632911392e-05,
"loss": 0.0,
"step": 23900
},
{
"epoch": 239.25,
"learning_rate": 1.526677215189873e-05,
"loss": 0.0,
"step": 23925
},
{
"epoch": 239.5,
"learning_rate": 1.5243037974683542e-05,
"loss": 0.0,
"step": 23950
},
{
"epoch": 239.75,
"learning_rate": 1.5219303797468352e-05,
"loss": 0.0,
"step": 23975
},
{
"epoch": 240.0,
"learning_rate": 1.5195569620253163e-05,
"loss": 0.0,
"step": 24000
},
{
"epoch": 240.0,
"eval_loss": 0.5731757879257202,
"eval_runtime": 80.5462,
"eval_samples_per_second": 158.195,
"eval_steps_per_second": 1.242,
"eval_wer": 19.196498358605595,
"step": 24000
},
{
"epoch": 240.25,
"learning_rate": 1.5171835443037973e-05,
"loss": 0.0,
"step": 24025
},
{
"epoch": 240.5,
"learning_rate": 1.5148101265822782e-05,
"loss": 0.0,
"step": 24050
},
{
"epoch": 240.75,
"learning_rate": 1.5124367088607595e-05,
"loss": 0.0,
"step": 24075
},
{
"epoch": 241.0,
"learning_rate": 1.5100632911392404e-05,
"loss": 0.0,
"step": 24100
},
{
"epoch": 241.25,
"learning_rate": 1.5076898734177214e-05,
"loss": 0.0,
"step": 24125
},
{
"epoch": 241.5,
"learning_rate": 1.5053164556962025e-05,
"loss": 0.0,
"step": 24150
},
{
"epoch": 241.75,
"learning_rate": 1.5029430379746835e-05,
"loss": 0.0,
"step": 24175
},
{
"epoch": 242.0,
"learning_rate": 1.5005696202531644e-05,
"loss": 0.0,
"step": 24200
},
{
"epoch": 242.25,
"learning_rate": 1.4981962025316455e-05,
"loss": 0.0,
"step": 24225
},
{
"epoch": 242.5,
"learning_rate": 1.4958227848101265e-05,
"loss": 0.0,
"step": 24250
},
{
"epoch": 242.75,
"learning_rate": 1.4934493670886074e-05,
"loss": 0.0,
"step": 24275
},
{
"epoch": 243.0,
"learning_rate": 1.4910759493670884e-05,
"loss": 0.0,
"step": 24300
},
{
"epoch": 243.25,
"learning_rate": 1.4887025316455695e-05,
"loss": 0.0,
"step": 24325
},
{
"epoch": 243.5,
"learning_rate": 1.4863291139240505e-05,
"loss": 0.0,
"step": 24350
},
{
"epoch": 243.75,
"learning_rate": 1.4839556962025314e-05,
"loss": 0.0,
"step": 24375
},
{
"epoch": 244.0,
"learning_rate": 1.4816772151898732e-05,
"loss": 0.0,
"step": 24400
},
{
"epoch": 244.25,
"learning_rate": 1.4793037974683542e-05,
"loss": 0.0,
"step": 24425
},
{
"epoch": 244.5,
"learning_rate": 1.4769303797468353e-05,
"loss": 0.0,
"step": 24450
},
{
"epoch": 244.75,
"learning_rate": 1.4745569620253164e-05,
"loss": 0.0,
"step": 24475
},
{
"epoch": 245.0,
"learning_rate": 1.4721835443037973e-05,
"loss": 0.0,
"step": 24500
},
{
"epoch": 245.25,
"learning_rate": 1.4698101265822785e-05,
"loss": 0.0,
"step": 24525
},
{
"epoch": 245.5,
"learning_rate": 1.4674367088607594e-05,
"loss": 0.0,
"step": 24550
},
{
"epoch": 245.75,
"learning_rate": 1.4650632911392404e-05,
"loss": 0.0,
"step": 24575
},
{
"epoch": 246.0,
"learning_rate": 1.4626898734177215e-05,
"loss": 0.0,
"step": 24600
},
{
"epoch": 246.25,
"learning_rate": 1.4603164556962024e-05,
"loss": 0.0,
"step": 24625
},
{
"epoch": 246.5,
"learning_rate": 1.4579430379746834e-05,
"loss": 0.0,
"step": 24650
},
{
"epoch": 246.75,
"learning_rate": 1.4555696202531643e-05,
"loss": 0.0,
"step": 24675
},
{
"epoch": 247.0,
"learning_rate": 1.4531962025316455e-05,
"loss": 0.0,
"step": 24700
},
{
"epoch": 247.25,
"learning_rate": 1.4508227848101264e-05,
"loss": 0.0,
"step": 24725
},
{
"epoch": 247.5,
"learning_rate": 1.4484493670886074e-05,
"loss": 0.0,
"step": 24750
},
{
"epoch": 247.75,
"learning_rate": 1.4460759493670885e-05,
"loss": 0.0,
"step": 24775
},
{
"epoch": 248.0,
"learning_rate": 1.4437025316455694e-05,
"loss": 0.0,
"step": 24800
},
{
"epoch": 248.25,
"learning_rate": 1.4413291139240504e-05,
"loss": 0.0,
"step": 24825
},
{
"epoch": 248.5,
"learning_rate": 1.4389556962025315e-05,
"loss": 0.0,
"step": 24850
},
{
"epoch": 248.75,
"learning_rate": 1.4365822784810126e-05,
"loss": 0.0,
"step": 24875
},
{
"epoch": 249.0,
"learning_rate": 1.4342088607594936e-05,
"loss": 0.0,
"step": 24900
},
{
"epoch": 249.25,
"learning_rate": 1.4318354430379747e-05,
"loss": 0.0,
"step": 24925
},
{
"epoch": 249.5,
"learning_rate": 1.4294620253164556e-05,
"loss": 0.0,
"step": 24950
},
{
"epoch": 249.75,
"learning_rate": 1.4270886075949366e-05,
"loss": 0.0,
"step": 24975
},
{
"epoch": 250.0,
"learning_rate": 1.4247151898734177e-05,
"loss": 0.0,
"step": 25000
},
{
"epoch": 250.0,
"eval_loss": 0.5863945484161377,
"eval_runtime": 80.5107,
"eval_samples_per_second": 158.265,
"eval_steps_per_second": 1.242,
"eval_wer": 19.221900891042676,
"step": 25000
},
{
"epoch": 250.25,
"learning_rate": 1.4223417721518987e-05,
"loss": 0.0,
"step": 25025
},
{
"epoch": 250.5,
"learning_rate": 1.4199683544303796e-05,
"loss": 0.0,
"step": 25050
},
{
"epoch": 250.75,
"learning_rate": 1.4175949367088606e-05,
"loss": 0.0,
"step": 25075
},
{
"epoch": 251.0,
"learning_rate": 1.4152215189873417e-05,
"loss": 0.0,
"step": 25100
},
{
"epoch": 251.25,
"learning_rate": 1.4128481012658226e-05,
"loss": 0.0,
"step": 25125
},
{
"epoch": 251.5,
"learning_rate": 1.4104746835443036e-05,
"loss": 0.0,
"step": 25150
},
{
"epoch": 251.75,
"learning_rate": 1.4081012658227847e-05,
"loss": 0.0,
"step": 25175
},
{
"epoch": 252.0,
"learning_rate": 1.4057278481012657e-05,
"loss": 0.0,
"step": 25200
},
{
"epoch": 252.25,
"learning_rate": 1.4033544303797466e-05,
"loss": 0.0,
"step": 25225
},
{
"epoch": 252.5,
"learning_rate": 1.4009810126582276e-05,
"loss": 0.0,
"step": 25250
},
{
"epoch": 252.75,
"learning_rate": 1.3986075949367087e-05,
"loss": 0.0,
"step": 25275
},
{
"epoch": 253.0,
"learning_rate": 1.3962341772151898e-05,
"loss": 0.0,
"step": 25300
},
{
"epoch": 253.25,
"learning_rate": 1.393860759493671e-05,
"loss": 0.0,
"step": 25325
},
{
"epoch": 253.5,
"learning_rate": 1.3914873417721519e-05,
"loss": 0.0,
"step": 25350
},
{
"epoch": 253.75,
"learning_rate": 1.3891139240506328e-05,
"loss": 0.0,
"step": 25375
},
{
"epoch": 254.0,
"learning_rate": 1.3867405063291138e-05,
"loss": 0.0,
"step": 25400
},
{
"epoch": 254.25,
"learning_rate": 1.3843670886075949e-05,
"loss": 0.0,
"step": 25425
},
{
"epoch": 254.5,
"learning_rate": 1.3819936708860758e-05,
"loss": 0.0,
"step": 25450
},
{
"epoch": 254.75,
"learning_rate": 1.3796202531645568e-05,
"loss": 0.0,
"step": 25475
},
{
"epoch": 255.0,
"learning_rate": 1.377246835443038e-05,
"loss": 0.0,
"step": 25500
},
{
"epoch": 255.25,
"learning_rate": 1.3748734177215189e-05,
"loss": 0.0,
"step": 25525
},
{
"epoch": 255.5,
"learning_rate": 1.3724999999999998e-05,
"loss": 0.0,
"step": 25550
},
{
"epoch": 255.75,
"learning_rate": 1.3701265822784808e-05,
"loss": 0.0,
"step": 25575
},
{
"epoch": 256.0,
"learning_rate": 1.3677531645569619e-05,
"loss": 0.0,
"step": 25600
},
{
"epoch": 256.25,
"learning_rate": 1.3653797468354428e-05,
"loss": 0.0,
"step": 25625
},
{
"epoch": 256.5,
"learning_rate": 1.3630063291139238e-05,
"loss": 0.0,
"step": 25650
},
{
"epoch": 256.75,
"learning_rate": 1.3606329113924049e-05,
"loss": 0.0,
"step": 25675
},
{
"epoch": 257.0,
"learning_rate": 1.358259493670886e-05,
"loss": 0.0,
"step": 25700
},
{
"epoch": 257.25,
"learning_rate": 1.355886075949367e-05,
"loss": 0.0,
"step": 25725
},
{
"epoch": 257.5,
"learning_rate": 1.3535126582278481e-05,
"loss": 0.0,
"step": 25750
},
{
"epoch": 257.75,
"learning_rate": 1.351139240506329e-05,
"loss": 0.0,
"step": 25775
},
{
"epoch": 258.0,
"learning_rate": 1.34876582278481e-05,
"loss": 0.0,
"step": 25800
},
{
"epoch": 258.25,
"learning_rate": 1.3463924050632911e-05,
"loss": 0.0,
"step": 25825
},
{
"epoch": 258.5,
"learning_rate": 1.344018987341772e-05,
"loss": 0.0,
"step": 25850
},
{
"epoch": 258.75,
"learning_rate": 1.341645569620253e-05,
"loss": 0.0,
"step": 25875
},
{
"epoch": 259.0,
"learning_rate": 1.3392721518987341e-05,
"loss": 0.0,
"step": 25900
},
{
"epoch": 259.25,
"learning_rate": 1.3368987341772151e-05,
"loss": 0.0,
"step": 25925
},
{
"epoch": 259.5,
"learning_rate": 1.334525316455696e-05,
"loss": 0.0,
"step": 25950
},
{
"epoch": 259.75,
"learning_rate": 1.332151898734177e-05,
"loss": 0.0,
"step": 25975
},
{
"epoch": 260.0,
"learning_rate": 1.3297784810126581e-05,
"loss": 0.0,
"step": 26000
},
{
"epoch": 260.0,
"eval_loss": 0.6003339886665344,
"eval_runtime": 80.5514,
"eval_samples_per_second": 158.185,
"eval_steps_per_second": 1.241,
"eval_wer": 19.310809754572457,
"step": 26000
},
{
"epoch": 260.25,
"learning_rate": 1.327405063291139e-05,
"loss": 0.0,
"step": 26025
},
{
"epoch": 260.5,
"learning_rate": 1.32503164556962e-05,
"loss": 0.0,
"step": 26050
},
{
"epoch": 260.75,
"learning_rate": 1.3226582278481011e-05,
"loss": 0.0,
"step": 26075
},
{
"epoch": 261.0,
"learning_rate": 1.3202848101265821e-05,
"loss": 0.0,
"step": 26100
},
{
"epoch": 261.25,
"learning_rate": 1.3179113924050632e-05,
"loss": 0.0,
"step": 26125
},
{
"epoch": 261.5,
"learning_rate": 1.3155379746835443e-05,
"loss": 0.0,
"step": 26150
},
{
"epoch": 261.75,
"learning_rate": 1.3131645569620253e-05,
"loss": 0.0,
"step": 26175
},
{
"epoch": 262.0,
"learning_rate": 1.3107911392405062e-05,
"loss": 0.0,
"step": 26200
},
{
"epoch": 262.25,
"learning_rate": 1.3084177215189874e-05,
"loss": 0.0,
"step": 26225
},
{
"epoch": 262.5,
"learning_rate": 1.3060443037974683e-05,
"loss": 0.0,
"step": 26250
},
{
"epoch": 262.75,
"learning_rate": 1.3036708860759493e-05,
"loss": 0.0,
"step": 26275
},
{
"epoch": 263.0,
"learning_rate": 1.3012974683544302e-05,
"loss": 0.0,
"step": 26300
},
{
"epoch": 263.25,
"learning_rate": 1.2989240506329113e-05,
"loss": 0.0,
"step": 26325
},
{
"epoch": 263.5,
"learning_rate": 1.2965506329113923e-05,
"loss": 0.0,
"step": 26350
},
{
"epoch": 263.75,
"learning_rate": 1.2941772151898732e-05,
"loss": 0.0,
"step": 26375
},
{
"epoch": 264.0,
"learning_rate": 1.2918037974683543e-05,
"loss": 0.0,
"step": 26400
},
{
"epoch": 264.25,
"learning_rate": 1.2894303797468353e-05,
"loss": 0.0,
"step": 26425
},
{
"epoch": 264.5,
"learning_rate": 1.2870569620253162e-05,
"loss": 0.0,
"step": 26450
},
{
"epoch": 264.75,
"learning_rate": 1.284778481012658e-05,
"loss": 0.0,
"step": 26475
},
{
"epoch": 265.0,
"learning_rate": 1.282405063291139e-05,
"loss": 0.0,
"step": 26500
},
{
"epoch": 265.25,
"learning_rate": 1.2800316455696203e-05,
"loss": 0.0,
"step": 26525
},
{
"epoch": 265.5,
"learning_rate": 1.2776582278481012e-05,
"loss": 0.0,
"step": 26550
},
{
"epoch": 265.75,
"learning_rate": 1.2752848101265822e-05,
"loss": 0.0,
"step": 26575
},
{
"epoch": 266.0,
"learning_rate": 1.2729113924050633e-05,
"loss": 0.0,
"step": 26600
},
{
"epoch": 266.25,
"learning_rate": 1.2705379746835443e-05,
"loss": 0.0,
"step": 26625
},
{
"epoch": 266.5,
"learning_rate": 1.2681645569620252e-05,
"loss": 0.0,
"step": 26650
},
{
"epoch": 266.75,
"learning_rate": 1.2657911392405062e-05,
"loss": 0.0,
"step": 26675
},
{
"epoch": 267.0,
"learning_rate": 1.2634177215189873e-05,
"loss": 0.0,
"step": 26700
},
{
"epoch": 267.25,
"learning_rate": 1.2610443037974682e-05,
"loss": 0.0,
"step": 26725
},
{
"epoch": 267.5,
"learning_rate": 1.2586708860759492e-05,
"loss": 0.0,
"step": 26750
},
{
"epoch": 267.75,
"learning_rate": 1.2562974683544303e-05,
"loss": 0.0,
"step": 26775
},
{
"epoch": 268.0,
"learning_rate": 1.2539240506329112e-05,
"loss": 0.0,
"step": 26800
},
{
"epoch": 268.25,
"learning_rate": 1.2515506329113922e-05,
"loss": 0.0,
"step": 26825
},
{
"epoch": 268.5,
"learning_rate": 1.2491772151898733e-05,
"loss": 0.0,
"step": 26850
},
{
"epoch": 268.75,
"learning_rate": 1.2468037974683543e-05,
"loss": 0.0,
"step": 26875
},
{
"epoch": 269.0,
"learning_rate": 1.2444303797468352e-05,
"loss": 0.0,
"step": 26900
},
{
"epoch": 269.25,
"learning_rate": 1.2420569620253165e-05,
"loss": 0.0,
"step": 26925
},
{
"epoch": 269.5,
"learning_rate": 1.2396835443037975e-05,
"loss": 0.0,
"step": 26950
},
{
"epoch": 269.75,
"learning_rate": 1.2373101265822784e-05,
"loss": 0.0,
"step": 26975
},
{
"epoch": 270.0,
"learning_rate": 1.2349367088607595e-05,
"loss": 0.0,
"step": 27000
},
{
"epoch": 270.0,
"eval_loss": 0.6140475273132324,
"eval_runtime": 80.6529,
"eval_samples_per_second": 157.986,
"eval_steps_per_second": 1.24,
"eval_wer": 19.371385024230108,
"step": 27000
},
{
"epoch": 270.25,
"learning_rate": 1.2325632911392405e-05,
"loss": 0.0,
"step": 27025
},
{
"epoch": 270.5,
"learning_rate": 1.2301898734177214e-05,
"loss": 0.0,
"step": 27050
},
{
"epoch": 270.75,
"learning_rate": 1.2278164556962024e-05,
"loss": 0.0,
"step": 27075
},
{
"epoch": 271.0,
"learning_rate": 1.2254430379746835e-05,
"loss": 0.0,
"step": 27100
},
{
"epoch": 271.25,
"learning_rate": 1.2230696202531645e-05,
"loss": 0.0,
"step": 27125
},
{
"epoch": 271.5,
"learning_rate": 1.2206962025316454e-05,
"loss": 0.0,
"step": 27150
},
{
"epoch": 271.75,
"learning_rate": 1.2183227848101265e-05,
"loss": 0.0,
"step": 27175
},
{
"epoch": 272.0,
"learning_rate": 1.2159493670886075e-05,
"loss": 0.0,
"step": 27200
},
{
"epoch": 272.25,
"learning_rate": 1.2135759493670884e-05,
"loss": 0.0,
"step": 27225
},
{
"epoch": 272.5,
"learning_rate": 1.2112025316455694e-05,
"loss": 0.0,
"step": 27250
},
{
"epoch": 272.75,
"learning_rate": 1.2088291139240505e-05,
"loss": 0.0,
"step": 27275
},
{
"epoch": 273.0,
"learning_rate": 1.2064556962025314e-05,
"loss": 0.0,
"step": 27300
},
{
"epoch": 273.25,
"learning_rate": 1.2040822784810124e-05,
"loss": 0.0,
"step": 27325
},
{
"epoch": 273.5,
"learning_rate": 1.2017088607594937e-05,
"loss": 0.0,
"step": 27350
},
{
"epoch": 273.75,
"learning_rate": 1.1993354430379746e-05,
"loss": 0.0,
"step": 27375
},
{
"epoch": 274.0,
"learning_rate": 1.1969620253164556e-05,
"loss": 0.0,
"step": 27400
},
{
"epoch": 274.25,
"learning_rate": 1.1945886075949367e-05,
"loss": 0.0,
"step": 27425
},
{
"epoch": 274.5,
"learning_rate": 1.1922151898734177e-05,
"loss": 0.0,
"step": 27450
},
{
"epoch": 274.75,
"learning_rate": 1.1898417721518986e-05,
"loss": 0.0,
"step": 27475
},
{
"epoch": 275.0,
"learning_rate": 1.1874683544303797e-05,
"loss": 0.0,
"step": 27500
},
{
"epoch": 275.25,
"learning_rate": 1.1850949367088607e-05,
"loss": 0.0,
"step": 27525
},
{
"epoch": 275.5,
"learning_rate": 1.1827215189873416e-05,
"loss": 0.0,
"step": 27550
},
{
"epoch": 275.75,
"learning_rate": 1.1803481012658226e-05,
"loss": 0.0,
"step": 27575
},
{
"epoch": 276.0,
"learning_rate": 1.1779746835443037e-05,
"loss": 0.0,
"step": 27600
},
{
"epoch": 276.25,
"learning_rate": 1.1756012658227847e-05,
"loss": 0.0,
"step": 27625
},
{
"epoch": 276.5,
"learning_rate": 1.1732278481012656e-05,
"loss": 0.0,
"step": 27650
},
{
"epoch": 276.75,
"learning_rate": 1.1708544303797467e-05,
"loss": 0.0,
"step": 27675
},
{
"epoch": 277.0,
"learning_rate": 1.1684810126582277e-05,
"loss": 0.0,
"step": 27700
},
{
"epoch": 277.25,
"learning_rate": 1.1661075949367086e-05,
"loss": 0.0,
"step": 27725
},
{
"epoch": 277.5,
"learning_rate": 1.1637341772151899e-05,
"loss": 0.0,
"step": 27750
},
{
"epoch": 277.75,
"learning_rate": 1.1613607594936709e-05,
"loss": 0.0,
"step": 27775
},
{
"epoch": 278.0,
"learning_rate": 1.1589873417721518e-05,
"loss": 0.0,
"step": 27800
},
{
"epoch": 278.25,
"learning_rate": 1.156613924050633e-05,
"loss": 0.0,
"step": 27825
},
{
"epoch": 278.5,
"learning_rate": 1.1542405063291139e-05,
"loss": 0.0,
"step": 27850
},
{
"epoch": 278.75,
"learning_rate": 1.1518670886075948e-05,
"loss": 0.0,
"step": 27875
},
{
"epoch": 279.0,
"learning_rate": 1.1496835443037973e-05,
"loss": 0.0033,
"step": 27900
},
{
"epoch": 279.25,
"learning_rate": 1.1474050632911391e-05,
"loss": 0.0072,
"step": 27925
},
{
"epoch": 279.5,
"learning_rate": 1.14503164556962e-05,
"loss": 0.0052,
"step": 27950
},
{
"epoch": 279.75,
"learning_rate": 1.1426582278481012e-05,
"loss": 0.004,
"step": 27975
},
{
"epoch": 280.0,
"learning_rate": 1.1402848101265821e-05,
"loss": 0.0034,
"step": 28000
},
{
"epoch": 280.0,
"eval_loss": 0.5535955429077148,
"eval_runtime": 81.9868,
"eval_samples_per_second": 155.415,
"eval_steps_per_second": 1.22,
"eval_wer": 20.663006096607788,
"step": 28000
},
{
"epoch": 280.25,
"learning_rate": 1.137911392405063e-05,
"loss": 0.0018,
"step": 28025
},
{
"epoch": 280.5,
"learning_rate": 1.1355379746835442e-05,
"loss": 0.0018,
"step": 28050
},
{
"epoch": 280.75,
"learning_rate": 1.1331645569620251e-05,
"loss": 0.0015,
"step": 28075
},
{
"epoch": 281.0,
"learning_rate": 1.1307911392405061e-05,
"loss": 0.0015,
"step": 28100
},
{
"epoch": 281.25,
"learning_rate": 1.1284177215189874e-05,
"loss": 0.0003,
"step": 28125
},
{
"epoch": 281.5,
"learning_rate": 1.1260443037974683e-05,
"loss": 0.0004,
"step": 28150
},
{
"epoch": 281.75,
"learning_rate": 1.1236708860759493e-05,
"loss": 0.0004,
"step": 28175
},
{
"epoch": 282.0,
"learning_rate": 1.1212974683544304e-05,
"loss": 0.0003,
"step": 28200
},
{
"epoch": 282.25,
"learning_rate": 1.1189240506329114e-05,
"loss": 0.0001,
"step": 28225
},
{
"epoch": 282.5,
"learning_rate": 1.1165506329113923e-05,
"loss": 0.0001,
"step": 28250
},
{
"epoch": 282.75,
"learning_rate": 1.1141772151898733e-05,
"loss": 0.0001,
"step": 28275
},
{
"epoch": 283.0,
"learning_rate": 1.1118037974683544e-05,
"loss": 0.0001,
"step": 28300
},
{
"epoch": 283.25,
"learning_rate": 1.1094303797468353e-05,
"loss": 0.0001,
"step": 28325
},
{
"epoch": 283.5,
"learning_rate": 1.1070569620253163e-05,
"loss": 0.0001,
"step": 28350
},
{
"epoch": 283.75,
"learning_rate": 1.1046835443037974e-05,
"loss": 0.0,
"step": 28375
},
{
"epoch": 284.0,
"learning_rate": 1.1023101265822783e-05,
"loss": 0.0003,
"step": 28400
},
{
"epoch": 284.25,
"learning_rate": 1.0999367088607593e-05,
"loss": 0.0,
"step": 28425
},
{
"epoch": 284.5,
"learning_rate": 1.0975632911392404e-05,
"loss": 0.0,
"step": 28450
},
{
"epoch": 284.75,
"learning_rate": 1.0951898734177214e-05,
"loss": 0.0,
"step": 28475
},
{
"epoch": 285.0,
"learning_rate": 1.0928164556962023e-05,
"loss": 0.0,
"step": 28500
},
{
"epoch": 285.25,
"learning_rate": 1.0904430379746836e-05,
"loss": 0.0,
"step": 28525
},
{
"epoch": 285.5,
"learning_rate": 1.0880696202531646e-05,
"loss": 0.0,
"step": 28550
},
{
"epoch": 285.75,
"learning_rate": 1.0856962025316455e-05,
"loss": 0.0,
"step": 28575
},
{
"epoch": 286.0,
"learning_rate": 1.0833227848101266e-05,
"loss": 0.0,
"step": 28600
},
{
"epoch": 286.25,
"learning_rate": 1.0809493670886076e-05,
"loss": 0.0,
"step": 28625
},
{
"epoch": 286.5,
"learning_rate": 1.0785759493670885e-05,
"loss": 0.0,
"step": 28650
},
{
"epoch": 286.75,
"learning_rate": 1.0762025316455695e-05,
"loss": 0.0,
"step": 28675
},
{
"epoch": 287.0,
"learning_rate": 1.0738291139240506e-05,
"loss": 0.0,
"step": 28700
},
{
"epoch": 287.25,
"learning_rate": 1.0714556962025316e-05,
"loss": 0.0,
"step": 28725
},
{
"epoch": 287.5,
"learning_rate": 1.0690822784810125e-05,
"loss": 0.0,
"step": 28750
},
{
"epoch": 287.75,
"learning_rate": 1.0667088607594936e-05,
"loss": 0.0,
"step": 28775
},
{
"epoch": 288.0,
"learning_rate": 1.0643354430379746e-05,
"loss": 0.0,
"step": 28800
},
{
"epoch": 288.25,
"learning_rate": 1.0619620253164555e-05,
"loss": 0.0,
"step": 28825
},
{
"epoch": 288.5,
"learning_rate": 1.0595886075949365e-05,
"loss": 0.0,
"step": 28850
},
{
"epoch": 288.75,
"learning_rate": 1.0572151898734176e-05,
"loss": 0.0,
"step": 28875
},
{
"epoch": 289.0,
"learning_rate": 1.0548417721518985e-05,
"loss": 0.0,
"step": 28900
},
{
"epoch": 289.25,
"learning_rate": 1.0524683544303795e-05,
"loss": 0.0,
"step": 28925
},
{
"epoch": 289.5,
"learning_rate": 1.0500949367088608e-05,
"loss": 0.0,
"step": 28950
},
{
"epoch": 289.75,
"learning_rate": 1.0477215189873417e-05,
"loss": 0.0,
"step": 28975
},
{
"epoch": 290.0,
"learning_rate": 1.0453481012658227e-05,
"loss": 0.0,
"step": 29000
},
{
"epoch": 290.0,
"eval_loss": 0.5485877394676208,
"eval_runtime": 80.6015,
"eval_samples_per_second": 158.086,
"eval_steps_per_second": 1.241,
"eval_wer": 19.339143348444583,
"step": 29000
},
{
"epoch": 290.25,
"learning_rate": 1.0429746835443038e-05,
"loss": 0.0,
"step": 29025
},
{
"epoch": 290.5,
"learning_rate": 1.0406012658227848e-05,
"loss": 0.0,
"step": 29050
},
{
"epoch": 290.75,
"learning_rate": 1.0382278481012657e-05,
"loss": 0.0,
"step": 29075
},
{
"epoch": 291.0,
"learning_rate": 1.0358544303797468e-05,
"loss": 0.0,
"step": 29100
},
{
"epoch": 291.25,
"learning_rate": 1.0334810126582278e-05,
"loss": 0.0,
"step": 29125
},
{
"epoch": 291.5,
"learning_rate": 1.0311075949367087e-05,
"loss": 0.0,
"step": 29150
},
{
"epoch": 291.75,
"learning_rate": 1.0287341772151897e-05,
"loss": 0.0,
"step": 29175
},
{
"epoch": 292.0,
"learning_rate": 1.0263607594936708e-05,
"loss": 0.0,
"step": 29200
},
{
"epoch": 292.25,
"learning_rate": 1.0239873417721518e-05,
"loss": 0.0,
"step": 29225
},
{
"epoch": 292.5,
"learning_rate": 1.0216139240506327e-05,
"loss": 0.0,
"step": 29250
},
{
"epoch": 292.75,
"learning_rate": 1.0192405063291138e-05,
"loss": 0.0,
"step": 29275
},
{
"epoch": 293.0,
"learning_rate": 1.0168670886075948e-05,
"loss": 0.0,
"step": 29300
},
{
"epoch": 293.25,
"learning_rate": 1.0144936708860757e-05,
"loss": 0.0,
"step": 29325
},
{
"epoch": 293.5,
"learning_rate": 1.012120253164557e-05,
"loss": 0.0,
"step": 29350
},
{
"epoch": 293.75,
"learning_rate": 1.009746835443038e-05,
"loss": 0.0,
"step": 29375
},
{
"epoch": 294.0,
"learning_rate": 1.0073734177215189e-05,
"loss": 0.0,
"step": 29400
},
{
"epoch": 294.25,
"learning_rate": 1.005e-05,
"loss": 0.0,
"step": 29425
},
{
"epoch": 294.5,
"learning_rate": 1.002626582278481e-05,
"loss": 0.0,
"step": 29450
},
{
"epoch": 294.75,
"learning_rate": 1.000253164556962e-05,
"loss": 0.0,
"step": 29475
},
{
"epoch": 295.0,
"learning_rate": 9.97879746835443e-06,
"loss": 0.0,
"step": 29500
},
{
"epoch": 295.25,
"learning_rate": 9.95506329113924e-06,
"loss": 0.0,
"step": 29525
},
{
"epoch": 295.5,
"learning_rate": 9.93132911392405e-06,
"loss": 0.0,
"step": 29550
},
{
"epoch": 295.75,
"learning_rate": 9.907594936708859e-06,
"loss": 0.0,
"step": 29575
},
{
"epoch": 296.0,
"learning_rate": 9.88386075949367e-06,
"loss": 0.0,
"step": 29600
},
{
"epoch": 296.25,
"learning_rate": 9.86012658227848e-06,
"loss": 0.0,
"step": 29625
},
{
"epoch": 296.5,
"learning_rate": 9.83639240506329e-06,
"loss": 0.0,
"step": 29650
},
{
"epoch": 296.75,
"learning_rate": 9.8126582278481e-06,
"loss": 0.0,
"step": 29675
},
{
"epoch": 297.0,
"learning_rate": 9.78892405063291e-06,
"loss": 0.0,
"step": 29700
},
{
"epoch": 297.25,
"learning_rate": 9.76518987341772e-06,
"loss": 0.0,
"step": 29725
},
{
"epoch": 297.5,
"learning_rate": 9.741455696202532e-06,
"loss": 0.0,
"step": 29750
},
{
"epoch": 297.75,
"learning_rate": 9.717721518987342e-06,
"loss": 0.0,
"step": 29775
},
{
"epoch": 298.0,
"learning_rate": 9.693987341772151e-06,
"loss": 0.0,
"step": 29800
},
{
"epoch": 298.25,
"learning_rate": 9.670253164556963e-06,
"loss": 0.0,
"step": 29825
},
{
"epoch": 298.5,
"learning_rate": 9.646518987341772e-06,
"loss": 0.0,
"step": 29850
},
{
"epoch": 298.75,
"learning_rate": 9.622784810126582e-06,
"loss": 0.0,
"step": 29875
},
{
"epoch": 299.0,
"learning_rate": 9.599050632911391e-06,
"loss": 0.0,
"step": 29900
},
{
"epoch": 299.25,
"learning_rate": 9.575316455696202e-06,
"loss": 0.0,
"step": 29925
},
{
"epoch": 299.5,
"learning_rate": 9.551582278481012e-06,
"loss": 0.0,
"step": 29950
},
{
"epoch": 299.75,
"learning_rate": 9.527848101265821e-06,
"loss": 0.0,
"step": 29975
},
{
"epoch": 300.0,
"learning_rate": 9.504113924050633e-06,
"loss": 0.0,
"step": 30000
},
{
"epoch": 300.0,
"eval_loss": 0.5590522885322571,
"eval_runtime": 80.5922,
"eval_samples_per_second": 158.105,
"eval_steps_per_second": 1.241,
"eval_wer": 19.30592465218071,
"step": 30000
},
{
"epoch": 300.25,
"learning_rate": 9.480379746835442e-06,
"loss": 0.0,
"step": 30025
},
{
"epoch": 300.5,
"learning_rate": 9.456645569620252e-06,
"loss": 0.0,
"step": 30050
},
{
"epoch": 300.75,
"learning_rate": 9.432911392405061e-06,
"loss": 0.0,
"step": 30075
},
{
"epoch": 301.0,
"learning_rate": 9.409177215189872e-06,
"loss": 0.0,
"step": 30100
},
{
"epoch": 301.25,
"learning_rate": 9.385443037974682e-06,
"loss": 0.0,
"step": 30125
},
{
"epoch": 301.5,
"learning_rate": 9.361708860759493e-06,
"loss": 0.0,
"step": 30150
},
{
"epoch": 301.75,
"learning_rate": 9.337974683544302e-06,
"loss": 0.0,
"step": 30175
},
{
"epoch": 302.0,
"learning_rate": 9.314240506329114e-06,
"loss": 0.0,
"step": 30200
},
{
"epoch": 302.25,
"learning_rate": 9.290506329113923e-06,
"loss": 0.0,
"step": 30225
},
{
"epoch": 302.5,
"learning_rate": 9.266772151898733e-06,
"loss": 0.0,
"step": 30250
},
{
"epoch": 302.75,
"learning_rate": 9.243037974683544e-06,
"loss": 0.0,
"step": 30275
},
{
"epoch": 303.0,
"learning_rate": 9.219303797468353e-06,
"loss": 0.0,
"step": 30300
},
{
"epoch": 303.25,
"learning_rate": 9.195569620253165e-06,
"loss": 0.0,
"step": 30325
},
{
"epoch": 303.5,
"learning_rate": 9.171835443037974e-06,
"loss": 0.0,
"step": 30350
},
{
"epoch": 303.75,
"learning_rate": 9.148101265822784e-06,
"loss": 0.0,
"step": 30375
},
{
"epoch": 304.0,
"learning_rate": 9.124367088607593e-06,
"loss": 0.0,
"step": 30400
},
{
"epoch": 304.25,
"learning_rate": 9.100632911392404e-06,
"loss": 0.0,
"step": 30425
},
{
"epoch": 304.5,
"learning_rate": 9.076898734177214e-06,
"loss": 0.0,
"step": 30450
},
{
"epoch": 304.75,
"learning_rate": 9.053164556962025e-06,
"loss": 0.0,
"step": 30475
},
{
"epoch": 305.0,
"learning_rate": 9.029430379746835e-06,
"loss": 0.0,
"step": 30500
},
{
"epoch": 305.25,
"learning_rate": 9.005696202531646e-06,
"loss": 0.0,
"step": 30525
},
{
"epoch": 305.5,
"learning_rate": 8.981962025316455e-06,
"loss": 0.0,
"step": 30550
},
{
"epoch": 305.75,
"learning_rate": 8.958227848101265e-06,
"loss": 0.0,
"step": 30575
},
{
"epoch": 306.0,
"learning_rate": 8.934493670886074e-06,
"loss": 0.0,
"step": 30600
},
{
"epoch": 306.25,
"learning_rate": 8.910759493670885e-06,
"loss": 0.0,
"step": 30625
},
{
"epoch": 306.5,
"learning_rate": 8.887025316455695e-06,
"loss": 0.0,
"step": 30650
},
{
"epoch": 306.75,
"learning_rate": 8.863291139240504e-06,
"loss": 0.0,
"step": 30675
},
{
"epoch": 307.0,
"learning_rate": 8.839556962025316e-06,
"loss": 0.0,
"step": 30700
},
{
"epoch": 307.25,
"learning_rate": 8.815822784810127e-06,
"loss": 0.0,
"step": 30725
},
{
"epoch": 307.5,
"learning_rate": 8.792088607594936e-06,
"loss": 0.0,
"step": 30750
},
{
"epoch": 307.75,
"learning_rate": 8.768354430379746e-06,
"loss": 0.0,
"step": 30775
},
{
"epoch": 308.0,
"learning_rate": 8.744620253164555e-06,
"loss": 0.0,
"step": 30800
},
{
"epoch": 308.25,
"learning_rate": 8.720886075949367e-06,
"loss": 0.0,
"step": 30825
},
{
"epoch": 308.5,
"learning_rate": 8.697151898734176e-06,
"loss": 0.0,
"step": 30850
},
{
"epoch": 308.75,
"learning_rate": 8.673417721518986e-06,
"loss": 0.0,
"step": 30875
},
{
"epoch": 309.0,
"learning_rate": 8.649683544303797e-06,
"loss": 0.0,
"step": 30900
},
{
"epoch": 309.25,
"learning_rate": 8.625949367088606e-06,
"loss": 0.0,
"step": 30925
},
{
"epoch": 309.5,
"learning_rate": 8.602215189873418e-06,
"loss": 0.0,
"step": 30950
},
{
"epoch": 309.75,
"learning_rate": 8.578481012658227e-06,
"loss": 0.0,
"step": 30975
},
{
"epoch": 310.0,
"learning_rate": 8.554746835443037e-06,
"loss": 0.0,
"step": 31000
},
{
"epoch": 310.0,
"eval_loss": 0.566923975944519,
"eval_runtime": 80.5145,
"eval_samples_per_second": 158.257,
"eval_steps_per_second": 1.242,
"eval_wer": 19.313740816007506,
"step": 31000
},
{
"epoch": 310.25,
"learning_rate": 8.531012658227848e-06,
"loss": 0.0,
"step": 31025
},
{
"epoch": 310.5,
"learning_rate": 8.507278481012657e-06,
"loss": 0.0,
"step": 31050
},
{
"epoch": 310.75,
"learning_rate": 8.483544303797467e-06,
"loss": 0.0,
"step": 31075
},
{
"epoch": 311.0,
"learning_rate": 8.459810126582278e-06,
"loss": 0.0,
"step": 31100
},
{
"epoch": 311.25,
"learning_rate": 8.436075949367087e-06,
"loss": 0.0,
"step": 31125
},
{
"epoch": 311.5,
"learning_rate": 8.412341772151899e-06,
"loss": 0.0,
"step": 31150
},
{
"epoch": 311.75,
"learning_rate": 8.388607594936708e-06,
"loss": 0.0,
"step": 31175
},
{
"epoch": 312.0,
"learning_rate": 8.364873417721518e-06,
"loss": 0.0,
"step": 31200
},
{
"epoch": 312.25,
"learning_rate": 8.341139240506329e-06,
"loss": 0.0,
"step": 31225
},
{
"epoch": 312.5,
"learning_rate": 8.317405063291138e-06,
"loss": 0.0,
"step": 31250
},
{
"epoch": 312.75,
"learning_rate": 8.293670886075948e-06,
"loss": 0.0,
"step": 31275
},
{
"epoch": 313.0,
"learning_rate": 8.269936708860759e-06,
"loss": 0.0,
"step": 31300
},
{
"epoch": 313.25,
"learning_rate": 8.246202531645569e-06,
"loss": 0.0,
"step": 31325
},
{
"epoch": 313.5,
"learning_rate": 8.22246835443038e-06,
"loss": 0.0,
"step": 31350
},
{
"epoch": 313.75,
"learning_rate": 8.19873417721519e-06,
"loss": 0.0,
"step": 31375
},
{
"epoch": 314.0,
"learning_rate": 8.174999999999999e-06,
"loss": 0.0,
"step": 31400
},
{
"epoch": 314.25,
"learning_rate": 8.15126582278481e-06,
"loss": 0.0,
"step": 31425
},
{
"epoch": 314.5,
"learning_rate": 8.12753164556962e-06,
"loss": 0.0,
"step": 31450
},
{
"epoch": 314.75,
"learning_rate": 8.103797468354429e-06,
"loss": 0.0,
"step": 31475
},
{
"epoch": 315.0,
"learning_rate": 8.08006329113924e-06,
"loss": 0.0,
"step": 31500
},
{
"epoch": 315.25,
"learning_rate": 8.05632911392405e-06,
"loss": 0.0,
"step": 31525
},
{
"epoch": 315.5,
"learning_rate": 8.032594936708861e-06,
"loss": 0.0,
"step": 31550
},
{
"epoch": 315.75,
"learning_rate": 8.00886075949367e-06,
"loss": 0.0,
"step": 31575
},
{
"epoch": 316.0,
"learning_rate": 7.98512658227848e-06,
"loss": 0.0,
"step": 31600
},
{
"epoch": 316.25,
"learning_rate": 7.961392405063291e-06,
"loss": 0.0,
"step": 31625
},
{
"epoch": 316.5,
"learning_rate": 7.9376582278481e-06,
"loss": 0.0,
"step": 31650
},
{
"epoch": 316.75,
"learning_rate": 7.91392405063291e-06,
"loss": 0.0,
"step": 31675
},
{
"epoch": 317.0,
"learning_rate": 7.89018987341772e-06,
"loss": 0.0,
"step": 31700
},
{
"epoch": 317.25,
"learning_rate": 7.866455696202531e-06,
"loss": 0.0,
"step": 31725
},
{
"epoch": 317.5,
"learning_rate": 7.842721518987342e-06,
"loss": 0.0,
"step": 31750
},
{
"epoch": 317.75,
"learning_rate": 7.818987341772152e-06,
"loss": 0.0,
"step": 31775
},
{
"epoch": 318.0,
"learning_rate": 7.795253164556961e-06,
"loss": 0.0,
"step": 31800
},
{
"epoch": 318.25,
"learning_rate": 7.77151898734177e-06,
"loss": 0.0,
"step": 31825
},
{
"epoch": 318.5,
"learning_rate": 7.747784810126582e-06,
"loss": 0.0,
"step": 31850
},
{
"epoch": 318.75,
"learning_rate": 7.724050632911391e-06,
"loss": 0.0,
"step": 31875
},
{
"epoch": 319.0,
"learning_rate": 7.7003164556962e-06,
"loss": 0.0,
"step": 31900
},
{
"epoch": 319.25,
"learning_rate": 7.676582278481012e-06,
"loss": 0.0,
"step": 31925
},
{
"epoch": 319.5,
"learning_rate": 7.652848101265823e-06,
"loss": 0.0,
"step": 31950
},
{
"epoch": 319.75,
"learning_rate": 7.629113924050633e-06,
"loss": 0.0,
"step": 31975
},
{
"epoch": 320.0,
"learning_rate": 7.605379746835442e-06,
"loss": 0.0,
"step": 32000
},
{
"epoch": 320.0,
"eval_loss": 0.573691189289093,
"eval_runtime": 80.5487,
"eval_samples_per_second": 158.19,
"eval_steps_per_second": 1.241,
"eval_wer": 19.322534000312647,
"step": 32000
},
{
"epoch": 320.25,
"learning_rate": 7.5816455696202526e-06,
"loss": 0.0,
"step": 32025
},
{
"epoch": 320.5,
"learning_rate": 7.557911392405062e-06,
"loss": 0.0,
"step": 32050
},
{
"epoch": 320.75,
"learning_rate": 7.5341772151898724e-06,
"loss": 0.0,
"step": 32075
},
{
"epoch": 321.0,
"learning_rate": 7.510443037974683e-06,
"loss": 0.0,
"step": 32100
},
{
"epoch": 321.25,
"learning_rate": 7.486708860759493e-06,
"loss": 0.0,
"step": 32125
},
{
"epoch": 321.5,
"learning_rate": 7.4629746835443035e-06,
"loss": 0.0,
"step": 32150
},
{
"epoch": 321.75,
"learning_rate": 7.439240506329114e-06,
"loss": 0.0,
"step": 32175
},
{
"epoch": 322.0,
"learning_rate": 7.415506329113923e-06,
"loss": 0.0,
"step": 32200
},
{
"epoch": 322.25,
"learning_rate": 7.391772151898734e-06,
"loss": 0.0,
"step": 32225
},
{
"epoch": 322.5,
"learning_rate": 7.368037974683543e-06,
"loss": 0.0,
"step": 32250
},
{
"epoch": 322.75,
"learning_rate": 7.3443037974683536e-06,
"loss": 0.0,
"step": 32275
},
{
"epoch": 323.0,
"learning_rate": 7.320569620253164e-06,
"loss": 0.0,
"step": 32300
},
{
"epoch": 323.25,
"learning_rate": 7.296835443037974e-06,
"loss": 0.0,
"step": 32325
},
{
"epoch": 323.5,
"learning_rate": 7.273101265822785e-06,
"loss": 0.0,
"step": 32350
},
{
"epoch": 323.75,
"learning_rate": 7.249367088607594e-06,
"loss": 0.0,
"step": 32375
},
{
"epoch": 324.0,
"learning_rate": 7.2256329113924045e-06,
"loss": 0.0,
"step": 32400
},
{
"epoch": 324.25,
"learning_rate": 7.201898734177215e-06,
"loss": 0.0,
"step": 32425
},
{
"epoch": 324.5,
"learning_rate": 7.178164556962024e-06,
"loss": 0.0,
"step": 32450
},
{
"epoch": 324.75,
"learning_rate": 7.154430379746835e-06,
"loss": 0.0,
"step": 32475
},
{
"epoch": 325.0,
"learning_rate": 7.130696202531644e-06,
"loss": 0.0,
"step": 32500
},
{
"epoch": 325.25,
"learning_rate": 7.1069620253164546e-06,
"loss": 0.0,
"step": 32525
},
{
"epoch": 325.5,
"learning_rate": 7.083227848101266e-06,
"loss": 0.0,
"step": 32550
},
{
"epoch": 325.75,
"learning_rate": 7.059493670886075e-06,
"loss": 0.0,
"step": 32575
},
{
"epoch": 326.0,
"learning_rate": 7.035759493670886e-06,
"loss": 0.0,
"step": 32600
},
{
"epoch": 326.25,
"learning_rate": 7.012025316455696e-06,
"loss": 0.0,
"step": 32625
},
{
"epoch": 326.5,
"learning_rate": 6.9882911392405055e-06,
"loss": 0.0,
"step": 32650
},
{
"epoch": 326.75,
"learning_rate": 6.964556962025316e-06,
"loss": 0.0,
"step": 32675
},
{
"epoch": 327.0,
"learning_rate": 6.940822784810125e-06,
"loss": 0.0,
"step": 32700
},
{
"epoch": 327.25,
"learning_rate": 6.917088607594936e-06,
"loss": 0.0,
"step": 32725
},
{
"epoch": 327.5,
"learning_rate": 6.893354430379747e-06,
"loss": 0.0,
"step": 32750
},
{
"epoch": 327.75,
"learning_rate": 6.869620253164556e-06,
"loss": 0.0,
"step": 32775
},
{
"epoch": 328.0,
"learning_rate": 6.845886075949367e-06,
"loss": 0.0,
"step": 32800
},
{
"epoch": 328.25,
"learning_rate": 6.822151898734176e-06,
"loss": 0.0,
"step": 32825
},
{
"epoch": 328.5,
"learning_rate": 6.798417721518987e-06,
"loss": 0.0,
"step": 32850
},
{
"epoch": 328.75,
"learning_rate": 6.774683544303797e-06,
"loss": 0.0,
"step": 32875
},
{
"epoch": 329.0,
"learning_rate": 6.7509493670886065e-06,
"loss": 0.0,
"step": 32900
},
{
"epoch": 329.25,
"learning_rate": 6.727215189873417e-06,
"loss": 0.0,
"step": 32925
},
{
"epoch": 329.5,
"learning_rate": 6.703481012658228e-06,
"loss": 0.0,
"step": 32950
},
{
"epoch": 329.75,
"learning_rate": 6.6797468354430375e-06,
"loss": 0.0,
"step": 32975
},
{
"epoch": 330.0,
"learning_rate": 6.656012658227848e-06,
"loss": 0.0,
"step": 33000
},
{
"epoch": 330.0,
"eval_loss": 0.5798343420028687,
"eval_runtime": 80.7786,
"eval_samples_per_second": 157.74,
"eval_steps_per_second": 1.238,
"eval_wer": 19.288338283570425,
"step": 33000
},
{
"epoch": 330.25,
"learning_rate": 6.632278481012657e-06,
"loss": 0.0,
"step": 33025
},
{
"epoch": 330.5,
"learning_rate": 6.608544303797468e-06,
"loss": 0.0,
"step": 33050
},
{
"epoch": 330.75,
"learning_rate": 6.584810126582278e-06,
"loss": 0.0,
"step": 33075
},
{
"epoch": 331.0,
"learning_rate": 6.561075949367088e-06,
"loss": 0.0,
"step": 33100
},
{
"epoch": 331.25,
"learning_rate": 6.537341772151898e-06,
"loss": 0.0,
"step": 33125
},
{
"epoch": 331.5,
"learning_rate": 6.513607594936709e-06,
"loss": 0.0,
"step": 33150
},
{
"epoch": 331.75,
"learning_rate": 6.489873417721519e-06,
"loss": 0.0,
"step": 33175
},
{
"epoch": 332.0,
"learning_rate": 6.466139240506329e-06,
"loss": 0.0,
"step": 33200
},
{
"epoch": 332.25,
"learning_rate": 6.4424050632911385e-06,
"loss": 0.0,
"step": 33225
},
{
"epoch": 332.5,
"learning_rate": 6.418670886075949e-06,
"loss": 0.0,
"step": 33250
},
{
"epoch": 332.75,
"learning_rate": 6.394936708860758e-06,
"loss": 0.0,
"step": 33275
},
{
"epoch": 333.0,
"learning_rate": 6.371202531645569e-06,
"loss": 0.0,
"step": 33300
},
{
"epoch": 333.25,
"learning_rate": 6.347468354430379e-06,
"loss": 0.0,
"step": 33325
},
{
"epoch": 333.5,
"learning_rate": 6.3237341772151895e-06,
"loss": 0.0,
"step": 33350
},
{
"epoch": 333.75,
"learning_rate": 6.3e-06,
"loss": 0.0,
"step": 33375
},
{
"epoch": 334.0,
"learning_rate": 6.27626582278481e-06,
"loss": 0.0,
"step": 33400
},
{
"epoch": 334.25,
"learning_rate": 6.25253164556962e-06,
"loss": 0.0,
"step": 33425
},
{
"epoch": 334.5,
"learning_rate": 6.22879746835443e-06,
"loss": 0.0,
"step": 33450
},
{
"epoch": 334.75,
"learning_rate": 6.2050632911392395e-06,
"loss": 0.0,
"step": 33475
},
{
"epoch": 335.0,
"learning_rate": 6.18132911392405e-06,
"loss": 0.0,
"step": 33500
},
{
"epoch": 335.25,
"learning_rate": 6.15759493670886e-06,
"loss": 0.0,
"step": 33525
},
{
"epoch": 335.5,
"learning_rate": 6.13386075949367e-06,
"loss": 0.0,
"step": 33550
},
{
"epoch": 335.75,
"learning_rate": 6.110126582278481e-06,
"loss": 0.0,
"step": 33575
},
{
"epoch": 336.0,
"learning_rate": 6.086392405063291e-06,
"loss": 0.0,
"step": 33600
},
{
"epoch": 336.25,
"learning_rate": 6.062658227848101e-06,
"loss": 0.0,
"step": 33625
},
{
"epoch": 336.5,
"learning_rate": 6.038924050632911e-06,
"loss": 0.0,
"step": 33650
},
{
"epoch": 336.75,
"learning_rate": 6.015189873417721e-06,
"loss": 0.0,
"step": 33675
},
{
"epoch": 337.0,
"learning_rate": 5.991455696202531e-06,
"loss": 0.0,
"step": 33700
},
{
"epoch": 337.25,
"learning_rate": 5.9677215189873405e-06,
"loss": 0.0,
"step": 33725
},
{
"epoch": 337.5,
"learning_rate": 5.943987341772151e-06,
"loss": 0.0,
"step": 33750
},
{
"epoch": 337.75,
"learning_rate": 5.920253164556962e-06,
"loss": 0.0,
"step": 33775
},
{
"epoch": 338.0,
"learning_rate": 5.896518987341772e-06,
"loss": 0.0,
"step": 33800
},
{
"epoch": 338.25,
"learning_rate": 5.872784810126582e-06,
"loss": 0.0,
"step": 33825
},
{
"epoch": 338.5,
"learning_rate": 5.849050632911392e-06,
"loss": 0.0,
"step": 33850
},
{
"epoch": 338.75,
"learning_rate": 5.825316455696202e-06,
"loss": 0.0,
"step": 33875
},
{
"epoch": 339.0,
"learning_rate": 5.801582278481012e-06,
"loss": 0.0,
"step": 33900
},
{
"epoch": 339.25,
"learning_rate": 5.777848101265822e-06,
"loss": 0.0,
"step": 33925
},
{
"epoch": 339.5,
"learning_rate": 5.754113924050632e-06,
"loss": 0.0,
"step": 33950
},
{
"epoch": 339.75,
"learning_rate": 5.730379746835443e-06,
"loss": 0.0,
"step": 33975
},
{
"epoch": 340.0,
"learning_rate": 5.706645569620253e-06,
"loss": 0.0,
"step": 34000
},
{
"epoch": 340.0,
"eval_loss": 0.5856410264968872,
"eval_runtime": 80.4348,
"eval_samples_per_second": 158.414,
"eval_steps_per_second": 1.243,
"eval_wer": 19.26684383304674,
"step": 34000
},
{
"epoch": 340.25,
"learning_rate": 5.682911392405063e-06,
"loss": 0.0,
"step": 34025
},
{
"epoch": 340.5,
"learning_rate": 5.659177215189873e-06,
"loss": 0.0,
"step": 34050
},
{
"epoch": 340.75,
"learning_rate": 5.635443037974683e-06,
"loss": 0.0,
"step": 34075
},
{
"epoch": 341.0,
"learning_rate": 5.611708860759493e-06,
"loss": 0.0,
"step": 34100
},
{
"epoch": 341.25,
"learning_rate": 5.587974683544303e-06,
"loss": 0.0,
"step": 34125
},
{
"epoch": 341.5,
"learning_rate": 5.564240506329113e-06,
"loss": 0.0,
"step": 34150
},
{
"epoch": 341.75,
"learning_rate": 5.540506329113924e-06,
"loss": 0.0,
"step": 34175
},
{
"epoch": 342.0,
"learning_rate": 5.516772151898734e-06,
"loss": 0.0,
"step": 34200
},
{
"epoch": 342.25,
"learning_rate": 5.493037974683544e-06,
"loss": 0.0,
"step": 34225
},
{
"epoch": 342.5,
"learning_rate": 5.469303797468354e-06,
"loss": 0.0,
"step": 34250
},
{
"epoch": 342.75,
"learning_rate": 5.445569620253164e-06,
"loss": 0.0,
"step": 34275
},
{
"epoch": 343.0,
"learning_rate": 5.4218354430379744e-06,
"loss": 0.0,
"step": 34300
},
{
"epoch": 343.25,
"learning_rate": 5.398101265822784e-06,
"loss": 0.0,
"step": 34325
},
{
"epoch": 343.5,
"learning_rate": 5.374367088607594e-06,
"loss": 0.0,
"step": 34350
},
{
"epoch": 343.75,
"learning_rate": 5.350632911392404e-06,
"loss": 0.0,
"step": 34375
},
{
"epoch": 344.0,
"learning_rate": 5.326898734177215e-06,
"loss": 0.0,
"step": 34400
},
{
"epoch": 344.25,
"learning_rate": 5.303164556962025e-06,
"loss": 0.0,
"step": 34425
},
{
"epoch": 344.5,
"learning_rate": 5.279430379746835e-06,
"loss": 0.0,
"step": 34450
},
{
"epoch": 344.75,
"learning_rate": 5.255696202531645e-06,
"loss": 0.0,
"step": 34475
},
{
"epoch": 345.0,
"learning_rate": 5.231962025316455e-06,
"loss": 0.0,
"step": 34500
},
{
"epoch": 345.25,
"learning_rate": 5.208227848101265e-06,
"loss": 0.0,
"step": 34525
},
{
"epoch": 345.5,
"learning_rate": 5.1844936708860754e-06,
"loss": 0.0,
"step": 34550
},
{
"epoch": 345.75,
"learning_rate": 5.160759493670885e-06,
"loss": 0.0,
"step": 34575
},
{
"epoch": 346.0,
"learning_rate": 5.137025316455696e-06,
"loss": 0.0,
"step": 34600
},
{
"epoch": 346.25,
"learning_rate": 5.1132911392405065e-06,
"loss": 0.0,
"step": 34625
},
{
"epoch": 346.5,
"learning_rate": 5.089556962025316e-06,
"loss": 0.0,
"step": 34650
},
{
"epoch": 346.75,
"learning_rate": 5.065822784810126e-06,
"loss": 0.0,
"step": 34675
},
{
"epoch": 347.0,
"learning_rate": 5.042088607594936e-06,
"loss": 0.0,
"step": 34700
},
{
"epoch": 347.25,
"learning_rate": 5.018354430379746e-06,
"loss": 0.0,
"step": 34725
},
{
"epoch": 347.5,
"learning_rate": 4.9946202531645566e-06,
"loss": 0.0,
"step": 34750
},
{
"epoch": 347.75,
"learning_rate": 4.970886075949366e-06,
"loss": 0.0,
"step": 34775
},
{
"epoch": 348.0,
"learning_rate": 4.947151898734177e-06,
"loss": 0.0,
"step": 34800
},
{
"epoch": 348.25,
"learning_rate": 4.923417721518988e-06,
"loss": 0.0,
"step": 34825
},
{
"epoch": 348.5,
"learning_rate": 4.899683544303797e-06,
"loss": 0.0,
"step": 34850
},
{
"epoch": 348.75,
"learning_rate": 4.8759493670886075e-06,
"loss": 0.0,
"step": 34875
},
{
"epoch": 349.0,
"learning_rate": 4.852215189873417e-06,
"loss": 0.0,
"step": 34900
},
{
"epoch": 349.25,
"learning_rate": 4.828481012658227e-06,
"loss": 0.0,
"step": 34925
},
{
"epoch": 349.5,
"learning_rate": 4.804746835443037e-06,
"loss": 0.0,
"step": 34950
},
{
"epoch": 349.75,
"learning_rate": 4.781012658227847e-06,
"loss": 0.0,
"step": 34975
},
{
"epoch": 350.0,
"learning_rate": 4.757278481012658e-06,
"loss": 0.0,
"step": 35000
},
{
"epoch": 350.0,
"eval_loss": 0.5910990238189697,
"eval_runtime": 80.5464,
"eval_samples_per_second": 158.195,
"eval_steps_per_second": 1.242,
"eval_wer": 19.234602157261214,
"step": 35000
},
{
"epoch": 350.25,
"learning_rate": 4.733544303797468e-06,
"loss": 0.0,
"step": 35025
},
{
"epoch": 350.5,
"learning_rate": 4.709810126582278e-06,
"loss": 0.0,
"step": 35050
},
{
"epoch": 350.75,
"learning_rate": 4.686075949367089e-06,
"loss": 0.0,
"step": 35075
},
{
"epoch": 351.0,
"learning_rate": 4.662341772151898e-06,
"loss": 0.0,
"step": 35100
},
{
"epoch": 351.25,
"learning_rate": 4.6386075949367085e-06,
"loss": 0.0,
"step": 35125
},
{
"epoch": 351.5,
"learning_rate": 4.614873417721519e-06,
"loss": 0.0,
"step": 35150
},
{
"epoch": 351.75,
"learning_rate": 4.591139240506329e-06,
"loss": 0.0,
"step": 35175
},
{
"epoch": 352.0,
"learning_rate": 4.567405063291139e-06,
"loss": 0.0,
"step": 35200
},
{
"epoch": 352.25,
"learning_rate": 4.543670886075949e-06,
"loss": 0.0,
"step": 35225
},
{
"epoch": 352.5,
"learning_rate": 4.5199367088607586e-06,
"loss": 0.0,
"step": 35250
},
{
"epoch": 352.75,
"learning_rate": 4.49620253164557e-06,
"loss": 0.0,
"step": 35275
},
{
"epoch": 353.0,
"learning_rate": 4.472468354430379e-06,
"loss": 0.0,
"step": 35300
},
{
"epoch": 353.25,
"learning_rate": 4.44873417721519e-06,
"loss": 0.0,
"step": 35325
},
{
"epoch": 353.5,
"learning_rate": 4.424999999999999e-06,
"loss": 0.0,
"step": 35350
},
{
"epoch": 353.75,
"learning_rate": 4.4012658227848095e-06,
"loss": 0.0,
"step": 35375
},
{
"epoch": 354.0,
"learning_rate": 4.37753164556962e-06,
"loss": 0.0,
"step": 35400
},
{
"epoch": 354.25,
"learning_rate": 4.35379746835443e-06,
"loss": 0.0,
"step": 35425
},
{
"epoch": 354.5,
"learning_rate": 4.33006329113924e-06,
"loss": 0.0,
"step": 35450
},
{
"epoch": 354.75,
"learning_rate": 4.30632911392405e-06,
"loss": 0.0,
"step": 35475
},
{
"epoch": 355.0,
"learning_rate": 4.28259493670886e-06,
"loss": 0.0,
"step": 35500
},
{
"epoch": 355.25,
"learning_rate": 4.258860759493671e-06,
"loss": 0.0,
"step": 35525
},
{
"epoch": 355.5,
"learning_rate": 4.23512658227848e-06,
"loss": 0.0,
"step": 35550
},
{
"epoch": 355.75,
"learning_rate": 4.211392405063291e-06,
"loss": 0.0,
"step": 35575
},
{
"epoch": 356.0,
"learning_rate": 4.187658227848101e-06,
"loss": 0.0,
"step": 35600
},
{
"epoch": 356.25,
"learning_rate": 4.163924050632911e-06,
"loss": 0.0,
"step": 35625
},
{
"epoch": 356.5,
"learning_rate": 4.140189873417721e-06,
"loss": 0.0,
"step": 35650
},
{
"epoch": 356.75,
"learning_rate": 4.116455696202531e-06,
"loss": 0.0,
"step": 35675
},
{
"epoch": 357.0,
"learning_rate": 4.0927215189873416e-06,
"loss": 0.0,
"step": 35700
},
{
"epoch": 357.25,
"learning_rate": 4.068987341772152e-06,
"loss": 0.0,
"step": 35725
},
{
"epoch": 357.5,
"learning_rate": 4.045253164556961e-06,
"loss": 0.0,
"step": 35750
},
{
"epoch": 357.75,
"learning_rate": 4.021518987341772e-06,
"loss": 0.0,
"step": 35775
},
{
"epoch": 358.0,
"learning_rate": 3.997784810126582e-06,
"loss": 0.0,
"step": 35800
},
{
"epoch": 358.25,
"learning_rate": 3.974050632911392e-06,
"loss": 0.0,
"step": 35825
},
{
"epoch": 358.5,
"learning_rate": 3.950316455696202e-06,
"loss": 0.0,
"step": 35850
},
{
"epoch": 358.75,
"learning_rate": 3.926582278481012e-06,
"loss": 0.0,
"step": 35875
},
{
"epoch": 359.0,
"learning_rate": 3.902848101265823e-06,
"loss": 0.0,
"step": 35900
},
{
"epoch": 359.25,
"learning_rate": 3.879113924050632e-06,
"loss": 0.0,
"step": 35925
},
{
"epoch": 359.5,
"learning_rate": 3.8553797468354425e-06,
"loss": 0.0,
"step": 35950
},
{
"epoch": 359.75,
"learning_rate": 3.831645569620253e-06,
"loss": 0.0,
"step": 35975
},
{
"epoch": 360.0,
"learning_rate": 3.8088607594936704e-06,
"loss": 0.0,
"step": 36000
},
{
"epoch": 360.0,
"eval_loss": 0.5961853861808777,
"eval_runtime": 80.7236,
"eval_samples_per_second": 157.847,
"eval_steps_per_second": 1.239,
"eval_wer": 19.22874003439112,
"step": 36000
},
{
"epoch": 360.25,
"learning_rate": 3.7851265822784808e-06,
"loss": 0.0,
"step": 36025
},
{
"epoch": 360.5,
"learning_rate": 3.7613924050632907e-06,
"loss": 0.0,
"step": 36050
},
{
"epoch": 360.75,
"learning_rate": 3.737658227848101e-06,
"loss": 0.0,
"step": 36075
},
{
"epoch": 361.0,
"learning_rate": 3.713924050632911e-06,
"loss": 0.0,
"step": 36100
},
{
"epoch": 361.25,
"learning_rate": 3.690189873417721e-06,
"loss": 0.0,
"step": 36125
},
{
"epoch": 361.5,
"learning_rate": 3.6664556962025313e-06,
"loss": 0.0,
"step": 36150
},
{
"epoch": 361.75,
"learning_rate": 3.6427215189873416e-06,
"loss": 0.0,
"step": 36175
},
{
"epoch": 362.0,
"learning_rate": 3.6189873417721516e-06,
"loss": 0.0,
"step": 36200
},
{
"epoch": 362.25,
"learning_rate": 3.5952531645569615e-06,
"loss": 0.0,
"step": 36225
},
{
"epoch": 362.5,
"learning_rate": 3.571518987341772e-06,
"loss": 0.0,
"step": 36250
},
{
"epoch": 362.75,
"learning_rate": 3.547784810126582e-06,
"loss": 0.0,
"step": 36275
},
{
"epoch": 363.0,
"learning_rate": 3.524050632911392e-06,
"loss": 0.0,
"step": 36300
},
{
"epoch": 363.25,
"learning_rate": 3.500316455696202e-06,
"loss": 0.0,
"step": 36325
},
{
"epoch": 363.5,
"learning_rate": 3.476582278481012e-06,
"loss": 0.0,
"step": 36350
},
{
"epoch": 363.75,
"learning_rate": 3.4528481012658228e-06,
"loss": 0.0,
"step": 36375
},
{
"epoch": 364.0,
"learning_rate": 3.4291139240506327e-06,
"loss": 0.0,
"step": 36400
},
{
"epoch": 364.25,
"learning_rate": 3.4053797468354426e-06,
"loss": 0.0,
"step": 36425
},
{
"epoch": 364.5,
"learning_rate": 3.3816455696202526e-06,
"loss": 0.0,
"step": 36450
},
{
"epoch": 364.75,
"learning_rate": 3.3579113924050633e-06,
"loss": 0.0,
"step": 36475
},
{
"epoch": 365.0,
"learning_rate": 3.3341772151898733e-06,
"loss": 0.0,
"step": 36500
},
{
"epoch": 365.25,
"learning_rate": 3.310443037974683e-06,
"loss": 0.0,
"step": 36525
},
{
"epoch": 365.5,
"learning_rate": 3.286708860759493e-06,
"loss": 0.0,
"step": 36550
},
{
"epoch": 365.75,
"learning_rate": 3.262974683544304e-06,
"loss": 0.0,
"step": 36575
},
{
"epoch": 366.0,
"learning_rate": 3.239240506329114e-06,
"loss": 0.0,
"step": 36600
},
{
"epoch": 366.25,
"learning_rate": 3.2155063291139238e-06,
"loss": 0.0,
"step": 36625
},
{
"epoch": 366.5,
"learning_rate": 3.1917721518987337e-06,
"loss": 0.0,
"step": 36650
},
{
"epoch": 366.75,
"learning_rate": 3.1680379746835436e-06,
"loss": 0.0,
"step": 36675
},
{
"epoch": 367.0,
"learning_rate": 3.1443037974683544e-06,
"loss": 0.0,
"step": 36700
},
{
"epoch": 367.25,
"learning_rate": 3.1205696202531643e-06,
"loss": 0.0,
"step": 36725
},
{
"epoch": 367.5,
"learning_rate": 3.0968354430379743e-06,
"loss": 0.0,
"step": 36750
},
{
"epoch": 367.75,
"learning_rate": 3.073101265822784e-06,
"loss": 0.0,
"step": 36775
},
{
"epoch": 368.0,
"learning_rate": 3.049367088607595e-06,
"loss": 0.0,
"step": 36800
},
{
"epoch": 368.25,
"learning_rate": 3.025632911392405e-06,
"loss": 0.0,
"step": 36825
},
{
"epoch": 368.5,
"learning_rate": 3.001898734177215e-06,
"loss": 0.0,
"step": 36850
},
{
"epoch": 368.75,
"learning_rate": 2.9781645569620248e-06,
"loss": 0.0,
"step": 36875
},
{
"epoch": 369.0,
"learning_rate": 2.9544303797468355e-06,
"loss": 0.0,
"step": 36900
},
{
"epoch": 369.25,
"learning_rate": 2.9306962025316455e-06,
"loss": 0.0,
"step": 36925
},
{
"epoch": 369.5,
"learning_rate": 2.9069620253164554e-06,
"loss": 0.0,
"step": 36950
},
{
"epoch": 369.75,
"learning_rate": 2.8832278481012653e-06,
"loss": 0.0,
"step": 36975
},
{
"epoch": 370.0,
"learning_rate": 2.8594936708860757e-06,
"loss": 0.0,
"step": 37000
},
{
"epoch": 370.0,
"eval_loss": 0.6009894013404846,
"eval_runtime": 80.466,
"eval_samples_per_second": 158.353,
"eval_steps_per_second": 1.243,
"eval_wer": 19.232648116304517,
"step": 37000
},
{
"epoch": 370.25,
"learning_rate": 2.835759493670886e-06,
"loss": 0.0,
"step": 37025
},
{
"epoch": 370.5,
"learning_rate": 2.812025316455696e-06,
"loss": 0.0,
"step": 37050
},
{
"epoch": 370.75,
"learning_rate": 2.788291139240506e-06,
"loss": 0.0,
"step": 37075
},
{
"epoch": 371.0,
"learning_rate": 2.7645569620253162e-06,
"loss": 0.0,
"step": 37100
},
{
"epoch": 371.25,
"learning_rate": 2.7408227848101266e-06,
"loss": 0.0,
"step": 37125
},
{
"epoch": 371.5,
"learning_rate": 2.7170886075949365e-06,
"loss": 0.0,
"step": 37150
},
{
"epoch": 371.75,
"learning_rate": 2.6933544303797465e-06,
"loss": 0.0,
"step": 37175
},
{
"epoch": 372.0,
"learning_rate": 2.669620253164557e-06,
"loss": 0.0,
"step": 37200
},
{
"epoch": 372.25,
"learning_rate": 2.6458860759493667e-06,
"loss": 0.0,
"step": 37225
},
{
"epoch": 372.5,
"learning_rate": 2.622151898734177e-06,
"loss": 0.0,
"step": 37250
},
{
"epoch": 372.75,
"learning_rate": 2.598417721518987e-06,
"loss": 0.0,
"step": 37275
},
{
"epoch": 373.0,
"learning_rate": 2.5746835443037974e-06,
"loss": 0.0,
"step": 37300
},
{
"epoch": 373.25,
"learning_rate": 2.5509493670886073e-06,
"loss": 0.0,
"step": 37325
},
{
"epoch": 373.5,
"learning_rate": 2.5272151898734177e-06,
"loss": 0.0,
"step": 37350
},
{
"epoch": 373.75,
"learning_rate": 2.5034810126582276e-06,
"loss": 0.0,
"step": 37375
},
{
"epoch": 374.0,
"learning_rate": 2.479746835443038e-06,
"loss": 0.0,
"step": 37400
},
{
"epoch": 374.25,
"learning_rate": 2.456012658227848e-06,
"loss": 0.0,
"step": 37425
},
{
"epoch": 374.5,
"learning_rate": 2.432278481012658e-06,
"loss": 0.0,
"step": 37450
},
{
"epoch": 374.75,
"learning_rate": 2.408544303797468e-06,
"loss": 0.0,
"step": 37475
},
{
"epoch": 375.0,
"learning_rate": 2.384810126582278e-06,
"loss": 0.0,
"step": 37500
},
{
"epoch": 375.25,
"learning_rate": 2.3610759493670884e-06,
"loss": 0.0,
"step": 37525
},
{
"epoch": 375.5,
"learning_rate": 2.3373417721518984e-06,
"loss": 0.0,
"step": 37550
},
{
"epoch": 375.75,
"learning_rate": 2.3136075949367087e-06,
"loss": 0.0,
"step": 37575
},
{
"epoch": 376.0,
"learning_rate": 2.2898734177215187e-06,
"loss": 0.0,
"step": 37600
},
{
"epoch": 376.25,
"learning_rate": 2.2661392405063286e-06,
"loss": 0.0,
"step": 37625
},
{
"epoch": 376.5,
"learning_rate": 2.242405063291139e-06,
"loss": 0.0,
"step": 37650
},
{
"epoch": 376.75,
"learning_rate": 2.218670886075949e-06,
"loss": 0.0,
"step": 37675
},
{
"epoch": 377.0,
"learning_rate": 2.1949367088607592e-06,
"loss": 0.0,
"step": 37700
},
{
"epoch": 377.25,
"learning_rate": 2.171202531645569e-06,
"loss": 0.0,
"step": 37725
},
{
"epoch": 377.5,
"learning_rate": 2.1474683544303795e-06,
"loss": 0.0,
"step": 37750
},
{
"epoch": 377.75,
"learning_rate": 2.1237341772151894e-06,
"loss": 0.0,
"step": 37775
},
{
"epoch": 378.0,
"learning_rate": 2.1e-06,
"loss": 0.0,
"step": 37800
},
{
"epoch": 378.25,
"learning_rate": 2.0762658227848097e-06,
"loss": 0.0,
"step": 37825
},
{
"epoch": 378.5,
"learning_rate": 2.05253164556962e-06,
"loss": 0.0,
"step": 37850
},
{
"epoch": 378.75,
"learning_rate": 2.02879746835443e-06,
"loss": 0.0,
"step": 37875
},
{
"epoch": 379.0,
"learning_rate": 2.0050632911392404e-06,
"loss": 0.0,
"step": 37900
},
{
"epoch": 379.25,
"learning_rate": 1.9813291139240503e-06,
"loss": 0.0,
"step": 37925
},
{
"epoch": 379.5,
"learning_rate": 1.9575949367088607e-06,
"loss": 0.0,
"step": 37950
},
{
"epoch": 379.75,
"learning_rate": 1.9338607594936706e-06,
"loss": 0.0,
"step": 37975
},
{
"epoch": 380.0,
"learning_rate": 1.910126582278481e-06,
"loss": 0.0,
"step": 38000
},
{
"epoch": 380.0,
"eval_loss": 0.6050010919570923,
"eval_runtime": 80.5317,
"eval_samples_per_second": 158.223,
"eval_steps_per_second": 1.242,
"eval_wer": 19.22874003439112,
"step": 38000
},
{
"epoch": 380.25,
"learning_rate": 1.8863924050632909e-06,
"loss": 0.0,
"step": 38025
},
{
"epoch": 380.5,
"learning_rate": 1.8626582278481012e-06,
"loss": 0.0,
"step": 38050
},
{
"epoch": 380.75,
"learning_rate": 1.8389240506329112e-06,
"loss": 0.0,
"step": 38075
},
{
"epoch": 381.0,
"learning_rate": 1.8151898734177215e-06,
"loss": 0.0,
"step": 38100
},
{
"epoch": 381.25,
"learning_rate": 1.7914556962025314e-06,
"loss": 0.0,
"step": 38125
},
{
"epoch": 381.5,
"learning_rate": 1.7677215189873418e-06,
"loss": 0.0,
"step": 38150
},
{
"epoch": 381.75,
"learning_rate": 1.7439873417721517e-06,
"loss": 0.0,
"step": 38175
},
{
"epoch": 382.0,
"learning_rate": 1.720253164556962e-06,
"loss": 0.0,
"step": 38200
},
{
"epoch": 382.25,
"learning_rate": 1.696518987341772e-06,
"loss": 0.0,
"step": 38225
},
{
"epoch": 382.5,
"learning_rate": 1.6727848101265821e-06,
"loss": 0.0,
"step": 38250
},
{
"epoch": 382.75,
"learning_rate": 1.6490506329113923e-06,
"loss": 0.0,
"step": 38275
},
{
"epoch": 383.0,
"learning_rate": 1.6253164556962024e-06,
"loss": 0.0,
"step": 38300
},
{
"epoch": 383.25,
"learning_rate": 1.6015822784810126e-06,
"loss": 0.0,
"step": 38325
},
{
"epoch": 383.5,
"learning_rate": 1.5778481012658227e-06,
"loss": 0.0,
"step": 38350
},
{
"epoch": 383.75,
"learning_rate": 1.5541139240506329e-06,
"loss": 0.0,
"step": 38375
},
{
"epoch": 384.0,
"learning_rate": 1.5303797468354428e-06,
"loss": 0.0,
"step": 38400
},
{
"epoch": 384.25,
"learning_rate": 1.5066455696202531e-06,
"loss": 0.0,
"step": 38425
},
{
"epoch": 384.5,
"learning_rate": 1.482911392405063e-06,
"loss": 0.0,
"step": 38450
},
{
"epoch": 384.75,
"learning_rate": 1.4591772151898732e-06,
"loss": 0.0,
"step": 38475
},
{
"epoch": 385.0,
"learning_rate": 1.4354430379746834e-06,
"loss": 0.0,
"step": 38500
},
{
"epoch": 385.25,
"learning_rate": 1.4117088607594935e-06,
"loss": 0.0,
"step": 38525
},
{
"epoch": 385.5,
"learning_rate": 1.3879746835443036e-06,
"loss": 0.0,
"step": 38550
},
{
"epoch": 385.75,
"learning_rate": 1.3642405063291138e-06,
"loss": 0.0,
"step": 38575
},
{
"epoch": 386.0,
"learning_rate": 1.340506329113924e-06,
"loss": 0.0,
"step": 38600
},
{
"epoch": 386.25,
"learning_rate": 1.316772151898734e-06,
"loss": 0.0,
"step": 38625
},
{
"epoch": 386.5,
"learning_rate": 1.293037974683544e-06,
"loss": 0.0,
"step": 38650
},
{
"epoch": 386.75,
"learning_rate": 1.2693037974683543e-06,
"loss": 0.0,
"step": 38675
},
{
"epoch": 387.0,
"learning_rate": 1.2455696202531643e-06,
"loss": 0.0,
"step": 38700
},
{
"epoch": 387.25,
"learning_rate": 1.2218354430379746e-06,
"loss": 0.0,
"step": 38725
},
{
"epoch": 387.5,
"learning_rate": 1.1981012658227846e-06,
"loss": 0.0,
"step": 38750
},
{
"epoch": 387.75,
"learning_rate": 1.174367088607595e-06,
"loss": 0.0,
"step": 38775
},
{
"epoch": 388.0,
"learning_rate": 1.150632911392405e-06,
"loss": 0.0,
"step": 38800
},
{
"epoch": 388.25,
"learning_rate": 1.1268987341772152e-06,
"loss": 0.0,
"step": 38825
},
{
"epoch": 388.5,
"learning_rate": 1.1031645569620251e-06,
"loss": 0.0,
"step": 38850
},
{
"epoch": 388.75,
"learning_rate": 1.0794303797468353e-06,
"loss": 0.0,
"step": 38875
},
{
"epoch": 389.0,
"learning_rate": 1.0556962025316454e-06,
"loss": 0.0,
"step": 38900
},
{
"epoch": 389.25,
"learning_rate": 1.0319620253164556e-06,
"loss": 0.0,
"step": 38925
},
{
"epoch": 389.5,
"learning_rate": 1.0082278481012657e-06,
"loss": 0.0,
"step": 38950
},
{
"epoch": 389.75,
"learning_rate": 9.844936708860758e-07,
"loss": 0.0,
"step": 38975
},
{
"epoch": 390.0,
"learning_rate": 9.60759493670886e-07,
"loss": 0.0,
"step": 39000
},
{
"epoch": 390.0,
"eval_loss": 0.608101487159729,
"eval_runtime": 80.4312,
"eval_samples_per_second": 158.421,
"eval_steps_per_second": 1.243,
"eval_wer": 19.237533218696264,
"step": 39000
},
{
"epoch": 390.25,
"learning_rate": 9.370253164556961e-07,
"loss": 0.0,
"step": 39025
},
{
"epoch": 390.5,
"learning_rate": 9.132911392405062e-07,
"loss": 0.0,
"step": 39050
},
{
"epoch": 390.75,
"learning_rate": 8.895569620253163e-07,
"loss": 0.0,
"step": 39075
},
{
"epoch": 391.0,
"learning_rate": 8.658227848101264e-07,
"loss": 0.0,
"step": 39100
},
{
"epoch": 391.25,
"learning_rate": 8.420886075949366e-07,
"loss": 0.0,
"step": 39125
},
{
"epoch": 391.5,
"learning_rate": 8.183544303797467e-07,
"loss": 0.0,
"step": 39150
},
{
"epoch": 391.75,
"learning_rate": 7.946202531645569e-07,
"loss": 0.0,
"step": 39175
},
{
"epoch": 392.0,
"learning_rate": 7.70886075949367e-07,
"loss": 0.0,
"step": 39200
},
{
"epoch": 392.25,
"learning_rate": 7.471518987341772e-07,
"loss": 0.0,
"step": 39225
},
{
"epoch": 392.5,
"learning_rate": 7.234177215189873e-07,
"loss": 0.0,
"step": 39250
},
{
"epoch": 392.75,
"learning_rate": 6.996835443037974e-07,
"loss": 0.0,
"step": 39275
},
{
"epoch": 393.0,
"learning_rate": 6.759493670886076e-07,
"loss": 0.0,
"step": 39300
},
{
"epoch": 393.25,
"learning_rate": 6.522151898734176e-07,
"loss": 0.0,
"step": 39325
},
{
"epoch": 393.5,
"learning_rate": 6.284810126582278e-07,
"loss": 0.0,
"step": 39350
},
{
"epoch": 393.75,
"learning_rate": 6.047468354430379e-07,
"loss": 0.0,
"step": 39375
},
{
"epoch": 394.0,
"learning_rate": 5.81012658227848e-07,
"loss": 0.0,
"step": 39400
},
{
"epoch": 394.25,
"learning_rate": 5.572784810126582e-07,
"loss": 0.0,
"step": 39425
},
{
"epoch": 394.5,
"learning_rate": 5.335443037974683e-07,
"loss": 0.0,
"step": 39450
},
{
"epoch": 394.75,
"learning_rate": 5.098101265822785e-07,
"loss": 0.0,
"step": 39475
},
{
"epoch": 395.0,
"learning_rate": 4.860759493670886e-07,
"loss": 0.0,
"step": 39500
},
{
"epoch": 395.25,
"learning_rate": 4.6234177215189865e-07,
"loss": 0.0,
"step": 39525
},
{
"epoch": 395.5,
"learning_rate": 4.386075949367088e-07,
"loss": 0.0,
"step": 39550
},
{
"epoch": 395.75,
"learning_rate": 4.1487341772151893e-07,
"loss": 0.0,
"step": 39575
},
{
"epoch": 396.0,
"learning_rate": 3.911392405063291e-07,
"loss": 0.0,
"step": 39600
},
{
"epoch": 396.25,
"learning_rate": 3.674050632911392e-07,
"loss": 0.0,
"step": 39625
},
{
"epoch": 396.5,
"learning_rate": 3.436708860759493e-07,
"loss": 0.0,
"step": 39650
},
{
"epoch": 396.75,
"learning_rate": 3.1993670886075945e-07,
"loss": 0.0,
"step": 39675
},
{
"epoch": 397.0,
"learning_rate": 2.962025316455696e-07,
"loss": 0.0,
"step": 39700
},
{
"epoch": 397.25,
"learning_rate": 2.7246835443037973e-07,
"loss": 0.0,
"step": 39725
},
{
"epoch": 397.5,
"learning_rate": 2.487341772151899e-07,
"loss": 0.0,
"step": 39750
},
{
"epoch": 397.75,
"learning_rate": 2.25e-07,
"loss": 0.0,
"step": 39775
},
{
"epoch": 398.0,
"learning_rate": 2.012658227848101e-07,
"loss": 0.0,
"step": 39800
},
{
"epoch": 398.25,
"learning_rate": 1.7753164556962025e-07,
"loss": 0.0,
"step": 39825
},
{
"epoch": 398.5,
"learning_rate": 1.537974683544304e-07,
"loss": 0.0,
"step": 39850
},
{
"epoch": 398.75,
"learning_rate": 1.300632911392405e-07,
"loss": 0.0,
"step": 39875
},
{
"epoch": 399.0,
"learning_rate": 1.0632911392405063e-07,
"loss": 0.0,
"step": 39900
},
{
"epoch": 399.25,
"learning_rate": 8.259493670886075e-08,
"loss": 0.0,
"step": 39925
},
{
"epoch": 399.5,
"learning_rate": 5.886075949367088e-08,
"loss": 0.0,
"step": 39950
},
{
"epoch": 399.75,
"learning_rate": 3.5126582278481014e-08,
"loss": 0.0,
"step": 39975
},
{
"epoch": 400.0,
"learning_rate": 1.2341772151898733e-08,
"loss": 0.0,
"step": 40000
},
{
"epoch": 400.0,
"eval_loss": 0.6094558238983154,
"eval_runtime": 80.3325,
"eval_samples_per_second": 158.616,
"eval_steps_per_second": 1.245,
"eval_wer": 19.196498358605595,
"step": 40000
},
{
"epoch": 400.0,
"step": 40000,
"total_flos": 2.50955067359232e+20,
"train_loss": 0.010605198578223871,
"train_runtime": 40076.3871,
"train_samples_per_second": 255.512,
"train_steps_per_second": 0.998
}
],
"logging_steps": 25,
"max_steps": 40000,
"num_input_tokens_seen": 0,
"num_train_epochs": 400,
"save_steps": 1000,
"total_flos": 2.50955067359232e+20,
"train_batch_size": 256,
"trial_name": null,
"trial_params": null
}