Edresson's picture
Add checkpints
e226caa
{
"best_metric": 0.5058531761169434,
"best_model_checkpoint": "../checkpoints/Wav2Vec-voxpopuli/one-speaker/Final-paper/GT/PT/140-epoch/checkpoint-7360",
"epoch": 101.99688473520249,
"global_step": 8160,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.01,
"learning_rate": 4.016064257028112e-08,
"loss": 13.7434,
"step": 1
},
{
"epoch": 1.0,
"eval_loss": 21.166763305664062,
"eval_runtime": 236.3766,
"eval_samples_per_second": 29.893,
"eval_wer": 1.0027969233842773,
"step": 80
},
{
"epoch": 1.25,
"learning_rate": 4.016064257028113e-06,
"loss": 18.0487,
"step": 100
},
{
"epoch": 2.0,
"eval_loss": 13.212292671203613,
"eval_runtime": 235.4679,
"eval_samples_per_second": 30.008,
"eval_wer": 1.0,
"step": 160
},
{
"epoch": 2.5,
"learning_rate": 7.991967871485944e-06,
"loss": 13.4798,
"step": 200
},
{
"epoch": 3.0,
"eval_loss": 8.697088241577148,
"eval_runtime": 235.1241,
"eval_samples_per_second": 30.052,
"eval_wer": 1.0,
"step": 240
},
{
"epoch": 3.75,
"learning_rate": 1.2008032128514056e-05,
"loss": 8.6518,
"step": 300
},
{
"epoch": 4.0,
"eval_loss": 6.402597904205322,
"eval_runtime": 233.852,
"eval_samples_per_second": 30.216,
"eval_wer": 1.0,
"step": 320
},
{
"epoch": 5.0,
"learning_rate": 1.6024096385542168e-05,
"loss": 6.2486,
"step": 400
},
{
"epoch": 5.0,
"eval_loss": 5.096883296966553,
"eval_runtime": 235.426,
"eval_samples_per_second": 30.014,
"eval_wer": 1.0,
"step": 400
},
{
"epoch": 6.0,
"eval_loss": 4.204596519470215,
"eval_runtime": 235.3347,
"eval_samples_per_second": 30.025,
"eval_wer": 1.0,
"step": 480
},
{
"epoch": 6.25,
"learning_rate": 2.0040160642570282e-05,
"loss": 4.7563,
"step": 500
},
{
"epoch": 7.0,
"eval_loss": 3.5930964946746826,
"eval_runtime": 233.5038,
"eval_samples_per_second": 30.261,
"eval_wer": 1.0,
"step": 560
},
{
"epoch": 7.5,
"learning_rate": 2.4056224899598393e-05,
"loss": 3.756,
"step": 600
},
{
"epoch": 8.0,
"eval_loss": 3.2295875549316406,
"eval_runtime": 235.3066,
"eval_samples_per_second": 30.029,
"eval_wer": 1.0,
"step": 640
},
{
"epoch": 8.75,
"learning_rate": 2.8072289156626508e-05,
"loss": 3.23,
"step": 700
},
{
"epoch": 9.0,
"eval_loss": 3.0816433429718018,
"eval_runtime": 235.38,
"eval_samples_per_second": 30.02,
"eval_wer": 1.0,
"step": 720
},
{
"epoch": 10.0,
"learning_rate": 2.9850760547211327e-05,
"loss": 3.0413,
"step": 800
},
{
"epoch": 10.0,
"eval_loss": 3.010103940963745,
"eval_runtime": 235.1911,
"eval_samples_per_second": 30.044,
"eval_wer": 1.0,
"step": 800
},
{
"epoch": 11.0,
"eval_loss": 2.9560742378234863,
"eval_runtime": 234.3165,
"eval_samples_per_second": 30.156,
"eval_wer": 1.0,
"step": 880
},
{
"epoch": 11.25,
"learning_rate": 2.9563761599540802e-05,
"loss": 2.9748,
"step": 900
},
{
"epoch": 12.0,
"eval_loss": 2.9139442443847656,
"eval_runtime": 235.2653,
"eval_samples_per_second": 30.034,
"eval_wer": 1.0,
"step": 960
},
{
"epoch": 12.5,
"learning_rate": 2.9276762651870278e-05,
"loss": 2.9122,
"step": 1000
},
{
"epoch": 13.0,
"eval_loss": 2.897088050842285,
"eval_runtime": 235.1263,
"eval_samples_per_second": 30.052,
"eval_wer": 1.0,
"step": 1040
},
{
"epoch": 13.75,
"learning_rate": 2.8989763704199754e-05,
"loss": 2.8791,
"step": 1100
},
{
"epoch": 14.0,
"eval_loss": 2.8461437225341797,
"eval_runtime": 237.2882,
"eval_samples_per_second": 29.778,
"eval_wer": 1.0,
"step": 1120
},
{
"epoch": 15.0,
"learning_rate": 2.8702764756529226e-05,
"loss": 2.8098,
"step": 1200
},
{
"epoch": 15.0,
"eval_loss": 2.71140718460083,
"eval_runtime": 236.1183,
"eval_samples_per_second": 29.926,
"eval_wer": 0.9989611427429828,
"step": 1200
},
{
"epoch": 16.0,
"eval_loss": 2.430983066558838,
"eval_runtime": 234.0852,
"eval_samples_per_second": 30.186,
"eval_wer": 0.9871341524323245,
"step": 1280
},
{
"epoch": 16.25,
"learning_rate": 2.84157658088587e-05,
"loss": 2.6134,
"step": 1300
},
{
"epoch": 17.0,
"eval_loss": 2.0400171279907227,
"eval_runtime": 236.1033,
"eval_samples_per_second": 29.928,
"eval_wer": 0.9695534911597243,
"step": 1360
},
{
"epoch": 17.5,
"learning_rate": 2.8128766861188177e-05,
"loss": 2.2164,
"step": 1400
},
{
"epoch": 18.0,
"eval_loss": 1.610411286354065,
"eval_runtime": 234.9978,
"eval_samples_per_second": 30.068,
"eval_wer": 0.8650484467086205,
"step": 1440
},
{
"epoch": 18.75,
"learning_rate": 2.784176791351765e-05,
"loss": 1.7608,
"step": 1500
},
{
"epoch": 19.0,
"eval_loss": 1.3267238140106201,
"eval_runtime": 236.1618,
"eval_samples_per_second": 29.92,
"eval_wer": 0.7361502347417841,
"step": 1520
},
{
"epoch": 20.0,
"learning_rate": 2.7554768965847124e-05,
"loss": 1.4269,
"step": 1600
},
{
"epoch": 20.0,
"eval_loss": 1.1435879468917847,
"eval_runtime": 235.9998,
"eval_samples_per_second": 29.941,
"eval_wer": 0.6568774348216961,
"step": 1600
},
{
"epoch": 21.0,
"eval_loss": 1.0661028623580933,
"eval_runtime": 235.7709,
"eval_samples_per_second": 29.97,
"eval_wer": 0.6220956947357906,
"step": 1680
},
{
"epoch": 21.25,
"learning_rate": 2.72677700181766e-05,
"loss": 1.2421,
"step": 1700
},
{
"epoch": 22.0,
"eval_loss": 0.9825426936149597,
"eval_runtime": 235.4357,
"eval_samples_per_second": 30.012,
"eval_wer": 0.5804015582858856,
"step": 1760
},
{
"epoch": 22.5,
"learning_rate": 2.6980771070506075e-05,
"loss": 1.1212,
"step": 1800
},
{
"epoch": 23.0,
"eval_loss": 0.9016405344009399,
"eval_runtime": 236.5199,
"eval_samples_per_second": 29.875,
"eval_wer": 0.5381680151832984,
"step": 1840
},
{
"epoch": 23.75,
"learning_rate": 2.669377212283555e-05,
"loss": 1.0251,
"step": 1900
},
{
"epoch": 24.0,
"eval_loss": 0.8733579516410828,
"eval_runtime": 236.0952,
"eval_samples_per_second": 29.929,
"eval_wer": 0.5140145839576465,
"step": 1920
},
{
"epoch": 25.0,
"learning_rate": 2.6406773175165027e-05,
"loss": 0.9619,
"step": 2000
},
{
"epoch": 25.0,
"eval_loss": 0.815034031867981,
"eval_runtime": 236.7344,
"eval_samples_per_second": 29.848,
"eval_wer": 0.48626510838078113,
"step": 2000
},
{
"epoch": 26.0,
"eval_loss": 0.8121696710586548,
"eval_runtime": 236.6854,
"eval_samples_per_second": 29.854,
"eval_wer": 0.47379882129657375,
"step": 2080
},
{
"epoch": 26.25,
"learning_rate": 2.6119774227494502e-05,
"loss": 0.9102,
"step": 2100
},
{
"epoch": 27.0,
"eval_loss": 0.7858432531356812,
"eval_runtime": 235.5249,
"eval_samples_per_second": 30.001,
"eval_wer": 0.4592348416741584,
"step": 2160
},
{
"epoch": 27.5,
"learning_rate": 2.5832775279823974e-05,
"loss": 0.8691,
"step": 2200
},
{
"epoch": 28.0,
"eval_loss": 0.7678278088569641,
"eval_runtime": 236.2494,
"eval_samples_per_second": 29.909,
"eval_wer": 0.4526820497452802,
"step": 2240
},
{
"epoch": 28.75,
"learning_rate": 2.554577633215345e-05,
"loss": 0.8358,
"step": 2300
},
{
"epoch": 29.0,
"eval_loss": 0.744153618812561,
"eval_runtime": 236.3798,
"eval_samples_per_second": 29.893,
"eval_wer": 0.4421736090300669,
"step": 2320
},
{
"epoch": 30.0,
"learning_rate": 2.5258777384482922e-05,
"loss": 0.8078,
"step": 2400
},
{
"epoch": 30.0,
"eval_loss": 0.7339251637458801,
"eval_runtime": 236.5399,
"eval_samples_per_second": 29.872,
"eval_wer": 0.4369793227449805,
"step": 2400
},
{
"epoch": 31.0,
"eval_loss": 0.6944392919540405,
"eval_runtime": 236.1263,
"eval_samples_per_second": 29.925,
"eval_wer": 0.4234542003795825,
"step": 2480
},
{
"epoch": 31.25,
"learning_rate": 2.4971778436812397e-05,
"loss": 0.7813,
"step": 2500
},
{
"epoch": 32.0,
"eval_loss": 0.7018499374389648,
"eval_runtime": 236.4001,
"eval_samples_per_second": 29.89,
"eval_wer": 0.42349415642792926,
"step": 2560
},
{
"epoch": 32.5,
"learning_rate": 2.4684779489141873e-05,
"loss": 0.7586,
"step": 2600
},
{
"epoch": 33.0,
"eval_loss": 0.691132664680481,
"eval_runtime": 236.4392,
"eval_samples_per_second": 29.885,
"eval_wer": 0.4159824193387274,
"step": 2640
},
{
"epoch": 33.75,
"learning_rate": 2.439778054147135e-05,
"loss": 0.7311,
"step": 2700
},
{
"epoch": 34.0,
"eval_loss": 0.6664403080940247,
"eval_runtime": 235.2837,
"eval_samples_per_second": 30.032,
"eval_wer": 0.4046748576565778,
"step": 2720
},
{
"epoch": 35.0,
"learning_rate": 2.4110781593800824e-05,
"loss": 0.7201,
"step": 2800
},
{
"epoch": 35.0,
"eval_loss": 0.6681694388389587,
"eval_runtime": 237.7483,
"eval_samples_per_second": 29.721,
"eval_wer": 0.4040755169313755,
"step": 2800
},
{
"epoch": 36.0,
"eval_loss": 0.6622908115386963,
"eval_runtime": 235.7553,
"eval_samples_per_second": 29.972,
"eval_wer": 0.40017980221756067,
"step": 2880
},
{
"epoch": 36.25,
"learning_rate": 2.38237826461303e-05,
"loss": 0.6993,
"step": 2900
},
{
"epoch": 37.0,
"eval_loss": 0.6478127241134644,
"eval_runtime": 236.8845,
"eval_samples_per_second": 29.829,
"eval_wer": 0.394825691739087,
"step": 2960
},
{
"epoch": 37.5,
"learning_rate": 2.3536783698459775e-05,
"loss": 0.6855,
"step": 3000
},
{
"epoch": 38.0,
"eval_loss": 0.6474733352661133,
"eval_runtime": 234.8758,
"eval_samples_per_second": 30.084,
"eval_wer": 0.39692338427729495,
"step": 3040
},
{
"epoch": 38.75,
"learning_rate": 2.324978475078925e-05,
"loss": 0.676,
"step": 3100
},
{
"epoch": 39.0,
"eval_loss": 0.6449029445648193,
"eval_runtime": 236.3414,
"eval_samples_per_second": 29.897,
"eval_wer": 0.3954250324642893,
"step": 3120
},
{
"epoch": 40.0,
"learning_rate": 2.296278580311872e-05,
"loss": 0.6623,
"step": 3200
},
{
"epoch": 40.0,
"eval_loss": 0.631065309047699,
"eval_runtime": 236.9217,
"eval_samples_per_second": 29.824,
"eval_wer": 0.38497652582159625,
"step": 3200
},
{
"epoch": 41.0,
"eval_loss": 0.6289655566215515,
"eval_runtime": 236.5702,
"eval_samples_per_second": 29.869,
"eval_wer": 0.3841574268304865,
"step": 3280
},
{
"epoch": 41.25,
"learning_rate": 2.2675786855448195e-05,
"loss": 0.6458,
"step": 3300
},
{
"epoch": 42.0,
"eval_loss": 0.6317856907844543,
"eval_runtime": 235.0808,
"eval_samples_per_second": 30.058,
"eval_wer": 0.3838178004195385,
"step": 3360
},
{
"epoch": 42.5,
"learning_rate": 2.238878790777767e-05,
"loss": 0.6327,
"step": 3400
},
{
"epoch": 43.0,
"eval_loss": 0.6043937802314758,
"eval_runtime": 236.0018,
"eval_samples_per_second": 29.94,
"eval_wer": 0.3680950953950654,
"step": 3440
},
{
"epoch": 43.75,
"learning_rate": 2.2101788960107146e-05,
"loss": 0.6317,
"step": 3500
},
{
"epoch": 44.0,
"eval_loss": 0.6136683821678162,
"eval_runtime": 236.7044,
"eval_samples_per_second": 29.852,
"eval_wer": 0.37600639296773547,
"step": 3520
},
{
"epoch": 45.0,
"learning_rate": 2.181479001243662e-05,
"loss": 0.6206,
"step": 3600
},
{
"epoch": 45.0,
"eval_loss": 0.6018360257148743,
"eval_runtime": 235.576,
"eval_samples_per_second": 29.995,
"eval_wer": 0.37245030466486867,
"step": 3600
},
{
"epoch": 46.0,
"eval_loss": 0.6160127520561218,
"eval_runtime": 236.4202,
"eval_samples_per_second": 29.887,
"eval_wer": 0.378423733892718,
"step": 3680
},
{
"epoch": 46.25,
"learning_rate": 2.1527791064766097e-05,
"loss": 0.6045,
"step": 3700
},
{
"epoch": 47.0,
"eval_loss": 0.6069476008415222,
"eval_runtime": 237.3738,
"eval_samples_per_second": 29.767,
"eval_wer": 0.36865448007192086,
"step": 3760
},
{
"epoch": 47.5,
"learning_rate": 2.1240792117095573e-05,
"loss": 0.6049,
"step": 3800
},
{
"epoch": 48.0,
"eval_loss": 0.5968321561813354,
"eval_runtime": 235.4281,
"eval_samples_per_second": 30.013,
"eval_wer": 0.36411946858455696,
"step": 3840
},
{
"epoch": 48.75,
"learning_rate": 2.0953793169425048e-05,
"loss": 0.5877,
"step": 3900
},
{
"epoch": 49.0,
"eval_loss": 0.6001846790313721,
"eval_runtime": 235.467,
"eval_samples_per_second": 30.008,
"eval_wer": 0.36515832584157426,
"step": 3920
},
{
"epoch": 50.0,
"learning_rate": 2.066679422175452e-05,
"loss": 0.5865,
"step": 4000
},
{
"epoch": 50.0,
"eval_loss": 0.5853711366653442,
"eval_runtime": 235.5406,
"eval_samples_per_second": 29.999,
"eval_wer": 0.3635001498351813,
"step": 4000
},
{
"epoch": 51.0,
"eval_loss": 0.5745455622673035,
"eval_runtime": 236.1025,
"eval_samples_per_second": 29.928,
"eval_wer": 0.35540905004495055,
"step": 4080
},
{
"epoch": 51.25,
"learning_rate": 2.0379795274083996e-05,
"loss": 0.5764,
"step": 4100
},
{
"epoch": 52.0,
"eval_loss": 0.5656818151473999,
"eval_runtime": 237.1421,
"eval_samples_per_second": 29.796,
"eval_wer": 0.35113375287184095,
"step": 4160
},
{
"epoch": 52.5,
"learning_rate": 2.0092796326413468e-05,
"loss": 0.5706,
"step": 4200
},
{
"epoch": 53.0,
"eval_loss": 0.5767672657966614,
"eval_runtime": 235.7491,
"eval_samples_per_second": 29.973,
"eval_wer": 0.355089401658176,
"step": 4240
},
{
"epoch": 53.75,
"learning_rate": 1.9805797378742943e-05,
"loss": 0.565,
"step": 4300
},
{
"epoch": 54.0,
"eval_loss": 0.5638183355331421,
"eval_runtime": 236.1669,
"eval_samples_per_second": 29.92,
"eval_wer": 0.3511936869443612,
"step": 4320
},
{
"epoch": 55.0,
"learning_rate": 1.951879843107242e-05,
"loss": 0.5499,
"step": 4400
},
{
"epoch": 55.0,
"eval_loss": 0.5843964219093323,
"eval_runtime": 237.455,
"eval_samples_per_second": 29.757,
"eval_wer": 0.3593047647587654,
"step": 4400
},
{
"epoch": 56.0,
"eval_loss": 0.5718104839324951,
"eval_runtime": 235.3494,
"eval_samples_per_second": 30.023,
"eval_wer": 0.35534911597243035,
"step": 4480
},
{
"epoch": 56.25,
"learning_rate": 1.9231799483401894e-05,
"loss": 0.5554,
"step": 4500
},
{
"epoch": 57.0,
"eval_loss": 0.5693724155426025,
"eval_runtime": 237.1158,
"eval_samples_per_second": 29.8,
"eval_wer": 0.3528718409749276,
"step": 4560
},
{
"epoch": 57.5,
"learning_rate": 1.894480053573137e-05,
"loss": 0.5464,
"step": 4600
},
{
"epoch": 58.0,
"eval_loss": 0.5594637989997864,
"eval_runtime": 237.4676,
"eval_samples_per_second": 29.756,
"eval_wer": 0.3494156427929278,
"step": 4640
},
{
"epoch": 58.75,
"learning_rate": 1.8657801588060845e-05,
"loss": 0.539,
"step": 4700
},
{
"epoch": 59.0,
"eval_loss": 0.5721908807754517,
"eval_runtime": 236.7283,
"eval_samples_per_second": 29.849,
"eval_wer": 0.35081410448506645,
"step": 4720
},
{
"epoch": 60.0,
"learning_rate": 1.837080264039032e-05,
"loss": 0.5359,
"step": 4800
},
{
"epoch": 60.0,
"eval_loss": 0.5462157130241394,
"eval_runtime": 235.957,
"eval_samples_per_second": 29.946,
"eval_wer": 0.3440015982419339,
"step": 4800
},
{
"epoch": 61.0,
"eval_loss": 0.5488569736480713,
"eval_runtime": 236.1407,
"eval_samples_per_second": 29.923,
"eval_wer": 0.34198381780041953,
"step": 4880
},
{
"epoch": 61.25,
"learning_rate": 1.8083803692719793e-05,
"loss": 0.5304,
"step": 4900
},
{
"epoch": 62.0,
"eval_loss": 0.5528755784034729,
"eval_runtime": 235.178,
"eval_samples_per_second": 30.045,
"eval_wer": 0.3452202577165118,
"step": 4960
},
{
"epoch": 62.5,
"learning_rate": 1.779680474504927e-05,
"loss": 0.52,
"step": 5000
},
{
"epoch": 63.0,
"eval_loss": 0.5493497252464294,
"eval_runtime": 234.848,
"eval_samples_per_second": 30.088,
"eval_wer": 0.34174408151033864,
"step": 5040
},
{
"epoch": 63.75,
"learning_rate": 1.7509805797378744e-05,
"loss": 0.5316,
"step": 5100
},
{
"epoch": 64.0,
"eval_loss": 0.5514699816703796,
"eval_runtime": 234.6944,
"eval_samples_per_second": 30.107,
"eval_wer": 0.34138447707521724,
"step": 5120
},
{
"epoch": 65.0,
"learning_rate": 1.7222806849708216e-05,
"loss": 0.5191,
"step": 5200
},
{
"epoch": 65.0,
"eval_loss": 0.5479201674461365,
"eval_runtime": 235.3908,
"eval_samples_per_second": 30.018,
"eval_wer": 0.3387273998601538,
"step": 5200
},
{
"epoch": 66.0,
"eval_loss": 0.5452239513397217,
"eval_runtime": 233.7285,
"eval_samples_per_second": 30.232,
"eval_wer": 0.34569973029667367,
"step": 5280
},
{
"epoch": 66.25,
"learning_rate": 1.6935807902037692e-05,
"loss": 0.5138,
"step": 5300
},
{
"epoch": 67.0,
"eval_loss": 0.5339746475219727,
"eval_runtime": 238.4195,
"eval_samples_per_second": 29.637,
"eval_wer": 0.3345120367595645,
"step": 5360
},
{
"epoch": 67.5,
"learning_rate": 1.6648808954367167e-05,
"loss": 0.5161,
"step": 5400
},
{
"epoch": 68.0,
"eval_loss": 0.529504120349884,
"eval_runtime": 235.3768,
"eval_samples_per_second": 30.02,
"eval_wer": 0.3316352012785935,
"step": 5440
},
{
"epoch": 68.75,
"learning_rate": 1.6361810006696643e-05,
"loss": 0.5038,
"step": 5500
},
{
"epoch": 69.0,
"eval_loss": 0.540134847164154,
"eval_runtime": 234.8619,
"eval_samples_per_second": 30.086,
"eval_wer": 0.3354310258715413,
"step": 5520
},
{
"epoch": 70.0,
"learning_rate": 1.607481105902612e-05,
"loss": 0.4976,
"step": 5600
},
{
"epoch": 70.0,
"eval_loss": 0.5468968749046326,
"eval_runtime": 234.2977,
"eval_samples_per_second": 30.158,
"eval_wer": 0.33575067425831584,
"step": 5600
},
{
"epoch": 71.0,
"eval_loss": 0.5490255951881409,
"eval_runtime": 235.056,
"eval_samples_per_second": 30.061,
"eval_wer": 0.33371291579262813,
"step": 5680
},
{
"epoch": 71.25,
"learning_rate": 1.578781211135559e-05,
"loss": 0.4983,
"step": 5700
},
{
"epoch": 72.0,
"eval_loss": 0.5308582782745361,
"eval_runtime": 240.9129,
"eval_samples_per_second": 29.33,
"eval_wer": 0.32967735490959943,
"step": 5760
},
{
"epoch": 72.5,
"learning_rate": 1.5500813163685066e-05,
"loss": 0.4893,
"step": 5800
},
{
"epoch": 73.0,
"eval_loss": 0.5336333513259888,
"eval_runtime": 234.8259,
"eval_samples_per_second": 30.09,
"eval_wer": 0.33373289381680155,
"step": 5840
},
{
"epoch": 73.75,
"learning_rate": 1.5213814216014542e-05,
"loss": 0.4926,
"step": 5900
},
{
"epoch": 74.0,
"eval_loss": 0.5315715074539185,
"eval_runtime": 233.7173,
"eval_samples_per_second": 30.233,
"eval_wer": 0.3309359704325242,
"step": 5920
},
{
"epoch": 75.0,
"learning_rate": 1.4926815268344016e-05,
"loss": 0.4844,
"step": 6000
},
{
"epoch": 75.0,
"eval_loss": 0.5397169589996338,
"eval_runtime": 233.3548,
"eval_samples_per_second": 30.28,
"eval_wer": 0.3329937069223854,
"step": 6000
},
{
"epoch": 76.0,
"eval_loss": 0.5310106873512268,
"eval_runtime": 234.4399,
"eval_samples_per_second": 30.14,
"eval_wer": 0.334292278493657,
"step": 6080
},
{
"epoch": 76.25,
"learning_rate": 1.4639816320673491e-05,
"loss": 0.4821,
"step": 6100
},
{
"epoch": 77.0,
"eval_loss": 0.5305867791175842,
"eval_runtime": 233.3613,
"eval_samples_per_second": 30.279,
"eval_wer": 0.3270402557187094,
"step": 6160
},
{
"epoch": 77.5,
"learning_rate": 1.4352817373002967e-05,
"loss": 0.4772,
"step": 6200
},
{
"epoch": 78.0,
"eval_loss": 0.5232115387916565,
"eval_runtime": 234.4045,
"eval_samples_per_second": 30.144,
"eval_wer": 0.32903805813605036,
"step": 6240
},
{
"epoch": 78.75,
"learning_rate": 1.406581842533244e-05,
"loss": 0.4876,
"step": 6300
},
{
"epoch": 79.0,
"eval_loss": 0.5481472015380859,
"eval_runtime": 235.1064,
"eval_samples_per_second": 30.054,
"eval_wer": 0.32951753071621215,
"step": 6320
},
{
"epoch": 80.0,
"learning_rate": 1.3778819477661916e-05,
"loss": 0.471,
"step": 6400
},
{
"epoch": 80.0,
"eval_loss": 0.5388906598091125,
"eval_runtime": 234.5017,
"eval_samples_per_second": 30.132,
"eval_wer": 0.3307761462391369,
"step": 6400
},
{
"epoch": 81.0,
"eval_loss": 0.5276188254356384,
"eval_runtime": 234.907,
"eval_samples_per_second": 30.08,
"eval_wer": 0.32865847567675555,
"step": 6480
},
{
"epoch": 81.25,
"learning_rate": 1.349182052999139e-05,
"loss": 0.4721,
"step": 6500
},
{
"epoch": 82.0,
"eval_loss": 0.5138600468635559,
"eval_runtime": 236.3966,
"eval_samples_per_second": 29.89,
"eval_wer": 0.32388372789931075,
"step": 6560
},
{
"epoch": 82.5,
"learning_rate": 1.3204821582320865e-05,
"loss": 0.4706,
"step": 6600
},
{
"epoch": 83.0,
"eval_loss": 0.5274313688278198,
"eval_runtime": 234.3438,
"eval_samples_per_second": 30.152,
"eval_wer": 0.32626111277594644,
"step": 6640
},
{
"epoch": 83.75,
"learning_rate": 1.2917822634650339e-05,
"loss": 0.4659,
"step": 6700
},
{
"epoch": 84.0,
"eval_loss": 0.5202988386154175,
"eval_runtime": 234.4209,
"eval_samples_per_second": 30.142,
"eval_wer": 0.3222255518929178,
"step": 6720
},
{
"epoch": 85.0,
"learning_rate": 1.2630823686979815e-05,
"loss": 0.4607,
"step": 6800
},
{
"epoch": 85.0,
"eval_loss": 0.5231702923774719,
"eval_runtime": 235.6072,
"eval_samples_per_second": 29.991,
"eval_wer": 0.320867046249126,
"step": 6800
},
{
"epoch": 86.0,
"eval_loss": 0.5206882953643799,
"eval_runtime": 235.3295,
"eval_samples_per_second": 30.026,
"eval_wer": 0.32252522225551894,
"step": 6880
},
{
"epoch": 86.25,
"learning_rate": 1.234382473930929e-05,
"loss": 0.4634,
"step": 6900
},
{
"epoch": 87.0,
"eval_loss": 0.522659182548523,
"eval_runtime": 235.3665,
"eval_samples_per_second": 30.021,
"eval_wer": 0.32252522225551894,
"step": 6960
},
{
"epoch": 87.5,
"learning_rate": 1.2056825791638764e-05,
"loss": 0.4546,
"step": 7000
},
{
"epoch": 88.0,
"eval_loss": 0.5252255201339722,
"eval_runtime": 234.3682,
"eval_samples_per_second": 30.149,
"eval_wer": 0.32510238737388875,
"step": 7040
},
{
"epoch": 88.75,
"learning_rate": 1.1769826843968238e-05,
"loss": 0.4606,
"step": 7100
},
{
"epoch": 89.0,
"eval_loss": 0.5120769739151001,
"eval_runtime": 236.0459,
"eval_samples_per_second": 29.935,
"eval_wer": 0.32012785935470983,
"step": 7120
},
{
"epoch": 90.0,
"learning_rate": 1.1482827896297713e-05,
"loss": 0.4565,
"step": 7200
},
{
"epoch": 90.0,
"eval_loss": 0.5241296291351318,
"eval_runtime": 233.918,
"eval_samples_per_second": 30.207,
"eval_wer": 0.32190590350614323,
"step": 7200
},
{
"epoch": 91.0,
"eval_loss": 0.5129281282424927,
"eval_runtime": 235.5104,
"eval_samples_per_second": 30.003,
"eval_wer": 0.3203675956447907,
"step": 7280
},
{
"epoch": 91.25,
"learning_rate": 1.1195828948627189e-05,
"loss": 0.4557,
"step": 7300
},
{
"epoch": 92.0,
"eval_loss": 0.5058531761169434,
"eval_runtime": 235.6964,
"eval_samples_per_second": 29.979,
"eval_wer": 0.3161522325442014,
"step": 7360
},
{
"epoch": 92.5,
"learning_rate": 1.0908830000956664e-05,
"loss": 0.4528,
"step": 7400
},
{
"epoch": 93.0,
"eval_loss": 0.5195637345314026,
"eval_runtime": 236.5815,
"eval_samples_per_second": 29.867,
"eval_wer": 0.32304465088402756,
"step": 7440
},
{
"epoch": 93.75,
"learning_rate": 1.0621831053286138e-05,
"loss": 0.4507,
"step": 7500
},
{
"epoch": 94.0,
"eval_loss": 0.5212134718894958,
"eval_runtime": 236.6887,
"eval_samples_per_second": 29.854,
"eval_wer": 0.3194286285086405,
"step": 7520
},
{
"epoch": 95.0,
"learning_rate": 1.0334832105615612e-05,
"loss": 0.4491,
"step": 7600
},
{
"epoch": 95.0,
"eval_loss": 0.5105758905410767,
"eval_runtime": 236.3704,
"eval_samples_per_second": 29.894,
"eval_wer": 0.31345519928079113,
"step": 7600
},
{
"epoch": 96.0,
"eval_loss": 0.5123084187507629,
"eval_runtime": 236.3046,
"eval_samples_per_second": 29.902,
"eval_wer": 0.31884926580761164,
"step": 7680
},
{
"epoch": 96.25,
"learning_rate": 1.0047833157945088e-05,
"loss": 0.446,
"step": 7700
},
{
"epoch": 97.0,
"eval_loss": 0.5163899660110474,
"eval_runtime": 236.0105,
"eval_samples_per_second": 29.939,
"eval_wer": 0.3189691339526521,
"step": 7760
},
{
"epoch": 97.5,
"learning_rate": 9.760834210274563e-06,
"loss": 0.4474,
"step": 7800
},
{
"epoch": 98.0,
"eval_loss": 0.5071632266044617,
"eval_runtime": 238.0944,
"eval_samples_per_second": 29.677,
"eval_wer": 0.3145340125861552,
"step": 7840
},
{
"epoch": 98.75,
"learning_rate": 9.473835262604039e-06,
"loss": 0.4389,
"step": 7900
},
{
"epoch": 99.0,
"eval_loss": 0.5162996649742126,
"eval_runtime": 234.5869,
"eval_samples_per_second": 30.121,
"eval_wer": 0.3179502547198082,
"step": 7920
},
{
"epoch": 100.0,
"learning_rate": 9.186836314933511e-06,
"loss": 0.4408,
"step": 8000
},
{
"epoch": 100.0,
"eval_loss": 0.511136531829834,
"eval_runtime": 235.2605,
"eval_samples_per_second": 30.035,
"eval_wer": 0.3154929577464789,
"step": 8000
},
{
"epoch": 101.0,
"eval_loss": 0.5172923803329468,
"eval_runtime": 237.12,
"eval_samples_per_second": 29.799,
"eval_wer": 0.3147937269004096,
"step": 8080
},
{
"epoch": 101.25,
"learning_rate": 8.899837367262986e-06,
"loss": 0.4399,
"step": 8100
},
{
"epoch": 102.0,
"eval_loss": 0.5145618915557861,
"eval_runtime": 236.8186,
"eval_samples_per_second": 29.837,
"eval_wer": 0.3172909799220857,
"step": 8160
},
{
"epoch": 102.0,
"step": 8160,
"total_flos": 0,
"train_runtime": 110050.311,
"train_samples_per_second": 0.102
}
],
"max_steps": 11200,
"num_train_epochs": 140,
"total_flos": 0,
"trial_name": null,
"trial_params": null
}