gary109's picture
End of training
f87e482
raw
history blame
67.5 kB
{
"best_metric": 1.8990676403045654,
"best_model_checkpoint": "ai-light-dance_drums_ft_pretrain_wav2vec2-base/checkpoint-496",
"epoch": 199.90140845070422,
"global_step": 1600,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.9,
"eval_loss": 2.043365240097046,
"eval_runtime": 7.4215,
"eval_samples_per_second": 8.489,
"eval_steps_per_second": 1.078,
"eval_wer": 0.622568093385214,
"step": 8
},
{
"epoch": 1.23,
"learning_rate": 0.0002,
"loss": 0.4739,
"step": 10
},
{
"epoch": 1.9,
"eval_loss": 2.102400064468384,
"eval_runtime": 7.4428,
"eval_samples_per_second": 8.465,
"eval_steps_per_second": 1.075,
"eval_wer": 0.6246632744687219,
"step": 16
},
{
"epoch": 2.45,
"learning_rate": 0.0004,
"loss": 0.4693,
"step": 20
},
{
"epoch": 2.9,
"eval_loss": 1.9824020862579346,
"eval_runtime": 7.4471,
"eval_samples_per_second": 8.46,
"eval_steps_per_second": 1.074,
"eval_wer": 0.6210715354684226,
"step": 24
},
{
"epoch": 3.68,
"learning_rate": 0.00039746835443037974,
"loss": 0.5139,
"step": 30
},
{
"epoch": 3.9,
"eval_loss": 2.2961695194244385,
"eval_runtime": 7.4429,
"eval_samples_per_second": 8.464,
"eval_steps_per_second": 1.075,
"eval_wer": 0.6429212810535768,
"step": 32
},
{
"epoch": 4.9,
"learning_rate": 0.0003949367088607595,
"loss": 0.5081,
"step": 40
},
{
"epoch": 4.9,
"eval_loss": 2.2200775146484375,
"eval_runtime": 7.4534,
"eval_samples_per_second": 8.452,
"eval_steps_per_second": 1.073,
"eval_wer": 0.6291529482190961,
"step": 40
},
{
"epoch": 5.9,
"eval_loss": 2.139875888824463,
"eval_runtime": 7.459,
"eval_samples_per_second": 8.446,
"eval_steps_per_second": 1.073,
"eval_wer": 0.6207722238850644,
"step": 48
},
{
"epoch": 6.23,
"learning_rate": 0.0003924050632911393,
"loss": 0.5785,
"step": 50
},
{
"epoch": 6.9,
"eval_loss": 2.145110607147217,
"eval_runtime": 7.4526,
"eval_samples_per_second": 8.453,
"eval_steps_per_second": 1.073,
"eval_wer": 0.6417240347201437,
"step": 56
},
{
"epoch": 7.45,
"learning_rate": 0.000389873417721519,
"loss": 0.533,
"step": 60
},
{
"epoch": 7.9,
"eval_loss": 2.118384599685669,
"eval_runtime": 7.4549,
"eval_samples_per_second": 8.451,
"eval_steps_per_second": 1.073,
"eval_wer": 0.6330439988027536,
"step": 64
},
{
"epoch": 8.68,
"learning_rate": 0.00038734177215189877,
"loss": 0.5141,
"step": 70
},
{
"epoch": 8.9,
"eval_loss": 2.02298903465271,
"eval_runtime": 7.4493,
"eval_samples_per_second": 8.457,
"eval_steps_per_second": 1.074,
"eval_wer": 0.6342412451361867,
"step": 72
},
{
"epoch": 9.9,
"learning_rate": 0.0003848101265822785,
"loss": 0.4971,
"step": 80
},
{
"epoch": 9.9,
"eval_loss": 2.2136712074279785,
"eval_runtime": 7.4321,
"eval_samples_per_second": 8.477,
"eval_steps_per_second": 1.076,
"eval_wer": 0.6381322957198443,
"step": 80
},
{
"epoch": 10.9,
"eval_loss": 2.1159048080444336,
"eval_runtime": 7.3886,
"eval_samples_per_second": 8.527,
"eval_steps_per_second": 1.083,
"eval_wer": 0.6252618976354385,
"step": 88
},
{
"epoch": 11.23,
"learning_rate": 0.00038227848101265825,
"loss": 0.5645,
"step": 90
},
{
"epoch": 11.9,
"eval_loss": 2.096606969833374,
"eval_runtime": 7.4372,
"eval_samples_per_second": 8.471,
"eval_steps_per_second": 1.076,
"eval_wer": 0.6246632744687219,
"step": 96
},
{
"epoch": 12.45,
"learning_rate": 0.00037974683544303797,
"loss": 0.4932,
"step": 100
},
{
"epoch": 12.9,
"eval_loss": 1.9248937368392944,
"eval_runtime": 7.4436,
"eval_samples_per_second": 8.464,
"eval_steps_per_second": 1.075,
"eval_wer": 0.6222687818018557,
"step": 104
},
{
"epoch": 13.68,
"learning_rate": 0.00037721518987341774,
"loss": 0.4918,
"step": 110
},
{
"epoch": 13.9,
"eval_loss": 2.044543504714966,
"eval_runtime": 7.3836,
"eval_samples_per_second": 8.532,
"eval_steps_per_second": 1.083,
"eval_wer": 0.6234660281352888,
"step": 112
},
{
"epoch": 14.9,
"learning_rate": 0.00037468354430379746,
"loss": 0.5053,
"step": 120
},
{
"epoch": 14.9,
"eval_loss": 2.1316659450531006,
"eval_runtime": 7.3635,
"eval_samples_per_second": 8.556,
"eval_steps_per_second": 1.086,
"eval_wer": 0.6303501945525292,
"step": 120
},
{
"epoch": 15.9,
"eval_loss": 2.0722815990448,
"eval_runtime": 7.4257,
"eval_samples_per_second": 8.484,
"eval_steps_per_second": 1.077,
"eval_wer": 0.6255612092187968,
"step": 128
},
{
"epoch": 16.23,
"learning_rate": 0.00037215189873417723,
"loss": 0.5565,
"step": 130
},
{
"epoch": 16.9,
"eval_loss": 2.1390268802642822,
"eval_runtime": 7.3865,
"eval_samples_per_second": 8.529,
"eval_steps_per_second": 1.083,
"eval_wer": 0.6402274768033522,
"step": 136
},
{
"epoch": 17.45,
"learning_rate": 0.000369620253164557,
"loss": 0.4819,
"step": 140
},
{
"epoch": 17.9,
"eval_loss": 1.9555976390838623,
"eval_runtime": 7.4506,
"eval_samples_per_second": 8.456,
"eval_steps_per_second": 1.074,
"eval_wer": 0.6321460640526788,
"step": 144
},
{
"epoch": 18.68,
"learning_rate": 0.0003670886075949367,
"loss": 0.5131,
"step": 150
},
{
"epoch": 18.9,
"eval_loss": 1.9886202812194824,
"eval_runtime": 7.4236,
"eval_samples_per_second": 8.486,
"eval_steps_per_second": 1.078,
"eval_wer": 0.6333433103861119,
"step": 152
},
{
"epoch": 19.9,
"learning_rate": 0.0003645569620253165,
"loss": 0.4798,
"step": 160
},
{
"epoch": 19.9,
"eval_loss": 1.9700343608856201,
"eval_runtime": 7.4038,
"eval_samples_per_second": 8.509,
"eval_steps_per_second": 1.081,
"eval_wer": 0.625860520802155,
"step": 160
},
{
"epoch": 20.9,
"eval_loss": 1.9770878553390503,
"eval_runtime": 7.3878,
"eval_samples_per_second": 8.528,
"eval_steps_per_second": 1.083,
"eval_wer": 0.6294522598024543,
"step": 168
},
{
"epoch": 21.23,
"learning_rate": 0.00036202531645569626,
"loss": 0.5221,
"step": 170
},
{
"epoch": 21.9,
"eval_loss": 1.9879639148712158,
"eval_runtime": 7.4443,
"eval_samples_per_second": 8.463,
"eval_steps_per_second": 1.075,
"eval_wer": 0.6234660281352888,
"step": 176
},
{
"epoch": 22.45,
"learning_rate": 0.000359493670886076,
"loss": 0.4862,
"step": 180
},
{
"epoch": 22.9,
"eval_loss": 2.0993940830230713,
"eval_runtime": 7.4025,
"eval_samples_per_second": 8.511,
"eval_steps_per_second": 1.081,
"eval_wer": 0.6297515713858126,
"step": 184
},
{
"epoch": 23.68,
"learning_rate": 0.0003569620253164557,
"loss": 0.4831,
"step": 190
},
{
"epoch": 23.9,
"eval_loss": 2.0521020889282227,
"eval_runtime": 7.4186,
"eval_samples_per_second": 8.492,
"eval_steps_per_second": 1.078,
"eval_wer": 0.6204729123017061,
"step": 192
},
{
"epoch": 24.9,
"learning_rate": 0.00035443037974683546,
"loss": 0.4952,
"step": 200
},
{
"epoch": 24.9,
"eval_loss": 1.9838017225265503,
"eval_runtime": 7.3891,
"eval_samples_per_second": 8.526,
"eval_steps_per_second": 1.083,
"eval_wer": 0.6064052678838671,
"step": 200
},
{
"epoch": 25.9,
"eval_loss": 2.0318851470947266,
"eval_runtime": 7.3778,
"eval_samples_per_second": 8.539,
"eval_steps_per_second": 1.084,
"eval_wer": 0.6102963184675247,
"step": 208
},
{
"epoch": 26.23,
"learning_rate": 0.00035189873417721524,
"loss": 0.5119,
"step": 210
},
{
"epoch": 26.9,
"eval_loss": 2.041926383972168,
"eval_runtime": 7.4175,
"eval_samples_per_second": 8.493,
"eval_steps_per_second": 1.079,
"eval_wer": 0.615983238551332,
"step": 216
},
{
"epoch": 27.45,
"learning_rate": 0.00034936708860759495,
"loss": 0.4996,
"step": 220
},
{
"epoch": 27.9,
"eval_loss": 2.0072860717773438,
"eval_runtime": 7.4199,
"eval_samples_per_second": 8.491,
"eval_steps_per_second": 1.078,
"eval_wer": 0.6177791080514816,
"step": 224
},
{
"epoch": 28.68,
"learning_rate": 0.00034683544303797467,
"loss": 0.488,
"step": 230
},
{
"epoch": 28.9,
"eval_loss": 2.1739721298217773,
"eval_runtime": 7.4297,
"eval_samples_per_second": 8.479,
"eval_steps_per_second": 1.077,
"eval_wer": 0.6303501945525292,
"step": 232
},
{
"epoch": 29.9,
"learning_rate": 0.00034430379746835444,
"loss": 0.4978,
"step": 240
},
{
"epoch": 29.9,
"eval_loss": 2.2731006145477295,
"eval_runtime": 7.4184,
"eval_samples_per_second": 8.492,
"eval_steps_per_second": 1.078,
"eval_wer": 0.6162825501346902,
"step": 240
},
{
"epoch": 30.9,
"eval_loss": 2.241990804672241,
"eval_runtime": 7.3744,
"eval_samples_per_second": 8.543,
"eval_steps_per_second": 1.085,
"eval_wer": 0.6204729123017061,
"step": 248
},
{
"epoch": 31.23,
"learning_rate": 0.0003417721518987342,
"loss": 0.5259,
"step": 250
},
{
"epoch": 31.9,
"eval_loss": 2.056137800216675,
"eval_runtime": 7.5227,
"eval_samples_per_second": 8.375,
"eval_steps_per_second": 1.063,
"eval_wer": 0.6183777312181982,
"step": 256
},
{
"epoch": 32.45,
"learning_rate": 0.00033924050632911393,
"loss": 0.47,
"step": 260
},
{
"epoch": 32.9,
"eval_loss": 1.9454554319381714,
"eval_runtime": 7.427,
"eval_samples_per_second": 8.483,
"eval_steps_per_second": 1.077,
"eval_wer": 0.6135887458844658,
"step": 264
},
{
"epoch": 33.68,
"learning_rate": 0.0003367088607594937,
"loss": 0.5132,
"step": 270
},
{
"epoch": 33.9,
"eval_loss": 1.9306591749191284,
"eval_runtime": 7.4197,
"eval_samples_per_second": 8.491,
"eval_steps_per_second": 1.078,
"eval_wer": 0.6043100868003591,
"step": 272
},
{
"epoch": 34.9,
"learning_rate": 0.0003341772151898734,
"loss": 0.4972,
"step": 280
},
{
"epoch": 34.9,
"eval_loss": 2.0536110401153564,
"eval_runtime": 7.3867,
"eval_samples_per_second": 8.529,
"eval_steps_per_second": 1.083,
"eval_wer": 0.612690811134391,
"step": 280
},
{
"epoch": 35.9,
"eval_loss": 1.9113465547561646,
"eval_runtime": 7.4412,
"eval_samples_per_second": 8.466,
"eval_steps_per_second": 1.075,
"eval_wer": 0.6222687818018557,
"step": 288
},
{
"epoch": 36.23,
"learning_rate": 0.0003316455696202532,
"loss": 0.5147,
"step": 290
},
{
"epoch": 36.9,
"eval_loss": 1.9317280054092407,
"eval_runtime": 7.3447,
"eval_samples_per_second": 8.578,
"eval_steps_per_second": 1.089,
"eval_wer": 0.6285543250523795,
"step": 296
},
{
"epoch": 37.45,
"learning_rate": 0.00032911392405063296,
"loss": 0.4914,
"step": 300
},
{
"epoch": 37.9,
"eval_loss": 2.1809628009796143,
"eval_runtime": 7.4319,
"eval_samples_per_second": 8.477,
"eval_steps_per_second": 1.076,
"eval_wer": 0.6240646513020054,
"step": 304
},
{
"epoch": 38.68,
"learning_rate": 0.0003265822784810127,
"loss": 0.472,
"step": 310
},
{
"epoch": 38.9,
"eval_loss": 2.1403472423553467,
"eval_runtime": 7.4116,
"eval_samples_per_second": 8.5,
"eval_steps_per_second": 1.079,
"eval_wer": 0.615983238551332,
"step": 312
},
{
"epoch": 39.9,
"learning_rate": 0.0003240506329113924,
"loss": 0.4825,
"step": 320
},
{
"epoch": 39.9,
"eval_loss": 2.1141297817230225,
"eval_runtime": 7.4006,
"eval_samples_per_second": 8.513,
"eval_steps_per_second": 1.081,
"eval_wer": 0.6093983837174499,
"step": 320
},
{
"epoch": 40.9,
"eval_loss": 2.2869985103607178,
"eval_runtime": 7.4339,
"eval_samples_per_second": 8.475,
"eval_steps_per_second": 1.076,
"eval_wer": 0.603112840466926,
"step": 328
},
{
"epoch": 41.23,
"learning_rate": 0.00032151898734177216,
"loss": 0.5138,
"step": 330
},
{
"epoch": 41.9,
"eval_loss": 2.14039945602417,
"eval_runtime": 7.4445,
"eval_samples_per_second": 8.463,
"eval_steps_per_second": 1.075,
"eval_wer": 0.6180784196348399,
"step": 336
},
{
"epoch": 42.45,
"learning_rate": 0.00031898734177215193,
"loss": 0.48,
"step": 340
},
{
"epoch": 42.9,
"eval_loss": 2.024348497390747,
"eval_runtime": 7.3969,
"eval_samples_per_second": 8.517,
"eval_steps_per_second": 1.082,
"eval_wer": 0.6264591439688716,
"step": 344
},
{
"epoch": 43.68,
"learning_rate": 0.00031645569620253165,
"loss": 0.4598,
"step": 350
},
{
"epoch": 43.9,
"eval_loss": 2.111736297607422,
"eval_runtime": 7.411,
"eval_samples_per_second": 8.501,
"eval_steps_per_second": 1.079,
"eval_wer": 0.6198742891349895,
"step": 352
},
{
"epoch": 44.9,
"learning_rate": 0.00031392405063291137,
"loss": 0.474,
"step": 360
},
{
"epoch": 44.9,
"eval_loss": 2.0378293991088867,
"eval_runtime": 7.4069,
"eval_samples_per_second": 8.506,
"eval_steps_per_second": 1.08,
"eval_wer": 0.6321460640526788,
"step": 360
},
{
"epoch": 45.9,
"eval_loss": 2.191941261291504,
"eval_runtime": 7.392,
"eval_samples_per_second": 8.523,
"eval_steps_per_second": 1.082,
"eval_wer": 0.6210715354684226,
"step": 368
},
{
"epoch": 46.23,
"learning_rate": 0.0003113924050632912,
"loss": 0.4933,
"step": 370
},
{
"epoch": 46.9,
"eval_loss": 2.3645358085632324,
"eval_runtime": 7.3897,
"eval_samples_per_second": 8.525,
"eval_steps_per_second": 1.083,
"eval_wer": 0.6108949416342413,
"step": 376
},
{
"epoch": 47.45,
"learning_rate": 0.0003088607594936709,
"loss": 0.4692,
"step": 380
},
{
"epoch": 47.9,
"eval_loss": 2.1920251846313477,
"eval_runtime": 7.4249,
"eval_samples_per_second": 8.485,
"eval_steps_per_second": 1.077,
"eval_wer": 0.6076025142173002,
"step": 384
},
{
"epoch": 48.68,
"learning_rate": 0.00030632911392405063,
"loss": 0.4716,
"step": 390
},
{
"epoch": 48.9,
"eval_loss": 2.366262912750244,
"eval_runtime": 7.3885,
"eval_samples_per_second": 8.527,
"eval_steps_per_second": 1.083,
"eval_wer": 0.6034121520502843,
"step": 392
},
{
"epoch": 49.9,
"learning_rate": 0.0003037974683544304,
"loss": 0.4601,
"step": 400
},
{
"epoch": 49.9,
"eval_loss": 2.2838327884674072,
"eval_runtime": 7.4359,
"eval_samples_per_second": 8.472,
"eval_steps_per_second": 1.076,
"eval_wer": 0.627955701885663,
"step": 400
},
{
"epoch": 50.9,
"eval_loss": 2.0287113189697266,
"eval_runtime": 7.3496,
"eval_samples_per_second": 8.572,
"eval_steps_per_second": 1.088,
"eval_wer": 0.6147859922178989,
"step": 408
},
{
"epoch": 51.23,
"learning_rate": 0.00030126582278481017,
"loss": 0.4891,
"step": 410
},
{
"epoch": 51.9,
"eval_loss": 2.13460636138916,
"eval_runtime": 7.487,
"eval_samples_per_second": 8.415,
"eval_steps_per_second": 1.069,
"eval_wer": 0.6129901227177492,
"step": 416
},
{
"epoch": 52.45,
"learning_rate": 0.0002987341772151899,
"loss": 0.4506,
"step": 420
},
{
"epoch": 52.9,
"eval_loss": 2.155635356903076,
"eval_runtime": 7.4274,
"eval_samples_per_second": 8.482,
"eval_steps_per_second": 1.077,
"eval_wer": 0.6180784196348399,
"step": 424
},
{
"epoch": 53.68,
"learning_rate": 0.0002962025316455696,
"loss": 0.4581,
"step": 430
},
{
"epoch": 53.9,
"eval_loss": 2.0560076236724854,
"eval_runtime": 7.4656,
"eval_samples_per_second": 8.439,
"eval_steps_per_second": 1.072,
"eval_wer": 0.6228674049685723,
"step": 432
},
{
"epoch": 54.9,
"learning_rate": 0.0002936708860759494,
"loss": 0.4485,
"step": 440
},
{
"epoch": 54.9,
"eval_loss": 1.9943857192993164,
"eval_runtime": 7.4255,
"eval_samples_per_second": 8.484,
"eval_steps_per_second": 1.077,
"eval_wer": 0.5971266087997605,
"step": 440
},
{
"epoch": 55.9,
"eval_loss": 1.979053020477295,
"eval_runtime": 7.3558,
"eval_samples_per_second": 8.565,
"eval_steps_per_second": 1.088,
"eval_wer": 0.6096976953008082,
"step": 448
},
{
"epoch": 56.23,
"learning_rate": 0.00029113924050632915,
"loss": 0.4942,
"step": 450
},
{
"epoch": 56.9,
"eval_loss": 2.1165554523468018,
"eval_runtime": 7.3957,
"eval_samples_per_second": 8.518,
"eval_steps_per_second": 1.082,
"eval_wer": 0.6070038910505836,
"step": 456
},
{
"epoch": 57.45,
"learning_rate": 0.00028860759493670886,
"loss": 0.4748,
"step": 460
},
{
"epoch": 57.9,
"eval_loss": 2.027055263519287,
"eval_runtime": 7.413,
"eval_samples_per_second": 8.499,
"eval_steps_per_second": 1.079,
"eval_wer": 0.6123914995510327,
"step": 464
},
{
"epoch": 58.68,
"learning_rate": 0.00028607594936708863,
"loss": 0.4229,
"step": 470
},
{
"epoch": 58.9,
"eval_loss": 2.0436832904815674,
"eval_runtime": 7.4475,
"eval_samples_per_second": 8.459,
"eval_steps_per_second": 1.074,
"eval_wer": 0.6228674049685723,
"step": 472
},
{
"epoch": 59.9,
"learning_rate": 0.00028354430379746835,
"loss": 0.45,
"step": 480
},
{
"epoch": 59.9,
"eval_loss": 2.101158618927002,
"eval_runtime": 7.4226,
"eval_samples_per_second": 8.488,
"eval_steps_per_second": 1.078,
"eval_wer": 0.6141873690511823,
"step": 480
},
{
"epoch": 60.9,
"eval_loss": 1.9150625467300415,
"eval_runtime": 7.4336,
"eval_samples_per_second": 8.475,
"eval_steps_per_second": 1.076,
"eval_wer": 0.6049087099670757,
"step": 488
},
{
"epoch": 61.23,
"learning_rate": 0.0002810126582278481,
"loss": 0.4936,
"step": 490
},
{
"epoch": 61.9,
"eval_loss": 1.8990676403045654,
"eval_runtime": 7.475,
"eval_samples_per_second": 8.428,
"eval_steps_per_second": 1.07,
"eval_wer": 0.6046093983837174,
"step": 496
},
{
"epoch": 62.45,
"learning_rate": 0.0002784810126582279,
"loss": 0.4602,
"step": 500
},
{
"epoch": 62.9,
"eval_loss": 1.9813122749328613,
"eval_runtime": 7.4459,
"eval_samples_per_second": 8.461,
"eval_steps_per_second": 1.074,
"eval_wer": 0.6111942532175996,
"step": 504
},
{
"epoch": 63.68,
"learning_rate": 0.0002759493670886076,
"loss": 0.4626,
"step": 510
},
{
"epoch": 63.9,
"eval_loss": 1.9371625185012817,
"eval_runtime": 7.4834,
"eval_samples_per_second": 8.419,
"eval_steps_per_second": 1.069,
"eval_wer": 0.6135887458844658,
"step": 512
},
{
"epoch": 64.9,
"learning_rate": 0.0002734177215189873,
"loss": 0.445,
"step": 520
},
{
"epoch": 64.9,
"eval_loss": 1.9060248136520386,
"eval_runtime": 7.5103,
"eval_samples_per_second": 8.389,
"eval_steps_per_second": 1.065,
"eval_wer": 0.6153846153846154,
"step": 520
},
{
"epoch": 65.9,
"eval_loss": 1.9573534727096558,
"eval_runtime": 7.3508,
"eval_samples_per_second": 8.571,
"eval_steps_per_second": 1.088,
"eval_wer": 0.6150853038012571,
"step": 528
},
{
"epoch": 66.23,
"learning_rate": 0.0002708860759493671,
"loss": 0.4907,
"step": 530
},
{
"epoch": 66.9,
"eval_loss": 2.094677209854126,
"eval_runtime": 7.4211,
"eval_samples_per_second": 8.489,
"eval_steps_per_second": 1.078,
"eval_wer": 0.6022149057168512,
"step": 536
},
{
"epoch": 67.45,
"learning_rate": 0.00026835443037974687,
"loss": 0.4723,
"step": 540
},
{
"epoch": 67.9,
"eval_loss": 2.0061404705047607,
"eval_runtime": 7.3728,
"eval_samples_per_second": 8.545,
"eval_steps_per_second": 1.085,
"eval_wer": 0.6010176593834181,
"step": 544
},
{
"epoch": 68.68,
"learning_rate": 0.0002658227848101266,
"loss": 0.4103,
"step": 550
},
{
"epoch": 68.9,
"eval_loss": 1.9557090997695923,
"eval_runtime": 7.4208,
"eval_samples_per_second": 8.49,
"eval_steps_per_second": 1.078,
"eval_wer": 0.6093983837174499,
"step": 552
},
{
"epoch": 69.9,
"learning_rate": 0.0002632911392405063,
"loss": 0.4808,
"step": 560
},
{
"epoch": 69.9,
"eval_loss": 2.1042206287384033,
"eval_runtime": 7.4448,
"eval_samples_per_second": 8.462,
"eval_steps_per_second": 1.075,
"eval_wer": 0.6087997605507333,
"step": 560
},
{
"epoch": 70.9,
"eval_loss": 2.1360342502593994,
"eval_runtime": 7.4355,
"eval_samples_per_second": 8.473,
"eval_steps_per_second": 1.076,
"eval_wer": 0.6073032026339419,
"step": 568
},
{
"epoch": 71.23,
"learning_rate": 0.00026075949367088613,
"loss": 0.4682,
"step": 570
},
{
"epoch": 71.9,
"eval_loss": 2.128976583480835,
"eval_runtime": 7.3612,
"eval_samples_per_second": 8.558,
"eval_steps_per_second": 1.087,
"eval_wer": 0.6013169709667764,
"step": 576
},
{
"epoch": 72.45,
"learning_rate": 0.00025822784810126584,
"loss": 0.4472,
"step": 580
},
{
"epoch": 72.9,
"eval_loss": 1.9453884363174438,
"eval_runtime": 7.3992,
"eval_samples_per_second": 8.514,
"eval_steps_per_second": 1.081,
"eval_wer": 0.5989224782999102,
"step": 584
},
{
"epoch": 73.68,
"learning_rate": 0.00025569620253164556,
"loss": 0.4259,
"step": 590
},
{
"epoch": 73.9,
"eval_loss": 2.0936951637268066,
"eval_runtime": 7.4127,
"eval_samples_per_second": 8.499,
"eval_steps_per_second": 1.079,
"eval_wer": 0.6043100868003591,
"step": 592
},
{
"epoch": 74.9,
"learning_rate": 0.00025316455696202533,
"loss": 0.4464,
"step": 600
},
{
"epoch": 74.9,
"eval_loss": 2.0821897983551025,
"eval_runtime": 7.4228,
"eval_samples_per_second": 8.487,
"eval_steps_per_second": 1.078,
"eval_wer": 0.6058066447171505,
"step": 600
},
{
"epoch": 75.9,
"eval_loss": 2.0128111839294434,
"eval_runtime": 7.4657,
"eval_samples_per_second": 8.439,
"eval_steps_per_second": 1.072,
"eval_wer": 0.6058066447171505,
"step": 608
},
{
"epoch": 76.23,
"learning_rate": 0.0002506329113924051,
"loss": 0.4775,
"step": 610
},
{
"epoch": 76.9,
"eval_loss": 1.9743807315826416,
"eval_runtime": 7.4326,
"eval_samples_per_second": 8.476,
"eval_steps_per_second": 1.076,
"eval_wer": 0.6093983837174499,
"step": 616
},
{
"epoch": 77.45,
"learning_rate": 0.0002481012658227848,
"loss": 0.4394,
"step": 620
},
{
"epoch": 77.9,
"eval_loss": 1.9991949796676636,
"eval_runtime": 7.4315,
"eval_samples_per_second": 8.477,
"eval_steps_per_second": 1.076,
"eval_wer": 0.6010176593834181,
"step": 624
},
{
"epoch": 78.68,
"learning_rate": 0.0002455696202531646,
"loss": 0.418,
"step": 630
},
{
"epoch": 78.9,
"eval_loss": 2.169315814971924,
"eval_runtime": 7.4483,
"eval_samples_per_second": 8.458,
"eval_steps_per_second": 1.074,
"eval_wer": 0.5947321161328943,
"step": 632
},
{
"epoch": 79.9,
"learning_rate": 0.00024303797468354434,
"loss": 0.4384,
"step": 640
},
{
"epoch": 79.9,
"eval_loss": 2.132563829421997,
"eval_runtime": 7.3909,
"eval_samples_per_second": 8.524,
"eval_steps_per_second": 1.082,
"eval_wer": 0.5923376234660281,
"step": 640
},
{
"epoch": 80.9,
"eval_loss": 2.115138292312622,
"eval_runtime": 7.409,
"eval_samples_per_second": 8.503,
"eval_steps_per_second": 1.08,
"eval_wer": 0.5950314277162526,
"step": 648
},
{
"epoch": 81.23,
"learning_rate": 0.00024050632911392405,
"loss": 0.4971,
"step": 650
},
{
"epoch": 81.9,
"eval_loss": 2.1581170558929443,
"eval_runtime": 7.4413,
"eval_samples_per_second": 8.466,
"eval_steps_per_second": 1.075,
"eval_wer": 0.5923376234660281,
"step": 656
},
{
"epoch": 82.45,
"learning_rate": 0.0002379746835443038,
"loss": 0.4176,
"step": 660
},
{
"epoch": 82.9,
"eval_loss": 2.087625741958618,
"eval_runtime": 7.4281,
"eval_samples_per_second": 8.481,
"eval_steps_per_second": 1.077,
"eval_wer": 0.6013169709667764,
"step": 664
},
{
"epoch": 83.68,
"learning_rate": 0.00023544303797468357,
"loss": 0.4312,
"step": 670
},
{
"epoch": 83.9,
"eval_loss": 2.1316428184509277,
"eval_runtime": 7.4214,
"eval_samples_per_second": 8.489,
"eval_steps_per_second": 1.078,
"eval_wer": 0.5935348697994612,
"step": 672
},
{
"epoch": 84.9,
"learning_rate": 0.0002329113924050633,
"loss": 0.4408,
"step": 680
},
{
"epoch": 84.9,
"eval_loss": 2.2627344131469727,
"eval_runtime": 7.4182,
"eval_samples_per_second": 8.493,
"eval_steps_per_second": 1.078,
"eval_wer": 0.5971266087997605,
"step": 680
},
{
"epoch": 85.9,
"eval_loss": 2.279871702194214,
"eval_runtime": 7.385,
"eval_samples_per_second": 8.531,
"eval_steps_per_second": 1.083,
"eval_wer": 0.6111942532175996,
"step": 688
},
{
"epoch": 86.23,
"learning_rate": 0.00023037974683544303,
"loss": 0.4678,
"step": 690
},
{
"epoch": 86.9,
"eval_loss": 2.1239001750946045,
"eval_runtime": 7.4279,
"eval_samples_per_second": 8.482,
"eval_steps_per_second": 1.077,
"eval_wer": 0.5989224782999102,
"step": 696
},
{
"epoch": 87.45,
"learning_rate": 0.0002278481012658228,
"loss": 0.4288,
"step": 700
},
{
"epoch": 87.9,
"eval_loss": 2.157447576522827,
"eval_runtime": 7.401,
"eval_samples_per_second": 8.512,
"eval_steps_per_second": 1.081,
"eval_wer": 0.5983238551331936,
"step": 704
},
{
"epoch": 88.68,
"learning_rate": 0.00022531645569620254,
"loss": 0.4157,
"step": 710
},
{
"epoch": 88.9,
"eval_loss": 2.2124781608581543,
"eval_runtime": 7.411,
"eval_samples_per_second": 8.501,
"eval_steps_per_second": 1.079,
"eval_wer": 0.5908410655492368,
"step": 712
},
{
"epoch": 89.9,
"learning_rate": 0.0002227848101265823,
"loss": 0.444,
"step": 720
},
{
"epoch": 89.9,
"eval_loss": 2.054173469543457,
"eval_runtime": 7.3891,
"eval_samples_per_second": 8.526,
"eval_steps_per_second": 1.083,
"eval_wer": 0.5986231667165519,
"step": 720
},
{
"epoch": 90.9,
"eval_loss": 2.0898985862731934,
"eval_runtime": 7.4515,
"eval_samples_per_second": 8.455,
"eval_steps_per_second": 1.074,
"eval_wer": 0.5920383118826699,
"step": 728
},
{
"epoch": 91.23,
"learning_rate": 0.00022025316455696206,
"loss": 0.4694,
"step": 730
},
{
"epoch": 91.9,
"eval_loss": 2.11220645904541,
"eval_runtime": 7.3648,
"eval_samples_per_second": 8.554,
"eval_steps_per_second": 1.086,
"eval_wer": 0.6076025142173002,
"step": 736
},
{
"epoch": 92.45,
"learning_rate": 0.00021772151898734177,
"loss": 0.4314,
"step": 740
},
{
"epoch": 92.9,
"eval_loss": 2.0633835792541504,
"eval_runtime": 7.4479,
"eval_samples_per_second": 8.459,
"eval_steps_per_second": 1.074,
"eval_wer": 0.5950314277162526,
"step": 744
},
{
"epoch": 93.68,
"learning_rate": 0.00021518987341772152,
"loss": 0.4348,
"step": 750
},
{
"epoch": 93.9,
"eval_loss": 2.033348321914673,
"eval_runtime": 7.4247,
"eval_samples_per_second": 8.485,
"eval_steps_per_second": 1.077,
"eval_wer": 0.6046093983837174,
"step": 752
},
{
"epoch": 94.9,
"learning_rate": 0.00021265822784810126,
"loss": 0.4558,
"step": 760
},
{
"epoch": 94.9,
"eval_loss": 2.118844509124756,
"eval_runtime": 7.3971,
"eval_samples_per_second": 8.517,
"eval_steps_per_second": 1.082,
"eval_wer": 0.5956300508829692,
"step": 760
},
{
"epoch": 95.9,
"eval_loss": 2.060605764389038,
"eval_runtime": 7.4121,
"eval_samples_per_second": 8.5,
"eval_steps_per_second": 1.079,
"eval_wer": 0.5995211014666267,
"step": 768
},
{
"epoch": 96.23,
"learning_rate": 0.00021012658227848103,
"loss": 0.461,
"step": 770
},
{
"epoch": 96.9,
"eval_loss": 2.0599749088287354,
"eval_runtime": 7.378,
"eval_samples_per_second": 8.539,
"eval_steps_per_second": 1.084,
"eval_wer": 0.5971266087997605,
"step": 776
},
{
"epoch": 97.45,
"learning_rate": 0.00020759493670886078,
"loss": 0.4258,
"step": 780
},
{
"epoch": 97.9,
"eval_loss": 2.0478837490081787,
"eval_runtime": 7.4178,
"eval_samples_per_second": 8.493,
"eval_steps_per_second": 1.078,
"eval_wer": 0.6040107752170009,
"step": 784
},
{
"epoch": 98.68,
"learning_rate": 0.0002050632911392405,
"loss": 0.4395,
"step": 790
},
{
"epoch": 98.9,
"eval_loss": 2.128241539001465,
"eval_runtime": 7.3865,
"eval_samples_per_second": 8.529,
"eval_steps_per_second": 1.083,
"eval_wer": 0.6055073331337922,
"step": 792
},
{
"epoch": 99.9,
"learning_rate": 0.00020253164556962027,
"loss": 0.4282,
"step": 800
},
{
"epoch": 99.9,
"eval_loss": 2.0592732429504395,
"eval_runtime": 7.4314,
"eval_samples_per_second": 8.478,
"eval_steps_per_second": 1.077,
"eval_wer": 0.6043100868003591,
"step": 800
},
{
"epoch": 100.9,
"eval_loss": 2.0591721534729004,
"eval_runtime": 7.3516,
"eval_samples_per_second": 8.57,
"eval_steps_per_second": 1.088,
"eval_wer": 0.5920383118826699,
"step": 808
},
{
"epoch": 101.23,
"learning_rate": 0.0002,
"loss": 0.4623,
"step": 810
},
{
"epoch": 101.9,
"eval_loss": 2.0852437019348145,
"eval_runtime": 7.4242,
"eval_samples_per_second": 8.486,
"eval_steps_per_second": 1.078,
"eval_wer": 0.5944328045495361,
"step": 816
},
{
"epoch": 102.45,
"learning_rate": 0.00019746835443037975,
"loss": 0.4392,
"step": 820
},
{
"epoch": 102.9,
"eval_loss": 2.202364206314087,
"eval_runtime": 7.4726,
"eval_samples_per_second": 8.431,
"eval_steps_per_second": 1.071,
"eval_wer": 0.5920383118826699,
"step": 824
},
{
"epoch": 103.68,
"learning_rate": 0.0001949367088607595,
"loss": 0.4308,
"step": 830
},
{
"epoch": 103.9,
"eval_loss": 2.178584337234497,
"eval_runtime": 7.4755,
"eval_samples_per_second": 8.427,
"eval_steps_per_second": 1.07,
"eval_wer": 0.5935348697994612,
"step": 832
},
{
"epoch": 104.9,
"learning_rate": 0.00019240506329113924,
"loss": 0.4375,
"step": 840
},
{
"epoch": 104.9,
"eval_loss": 2.108534574508667,
"eval_runtime": 7.495,
"eval_samples_per_second": 8.406,
"eval_steps_per_second": 1.067,
"eval_wer": 0.591140377132595,
"step": 840
},
{
"epoch": 105.9,
"eval_loss": 2.072387218475342,
"eval_runtime": 7.5191,
"eval_samples_per_second": 8.379,
"eval_steps_per_second": 1.064,
"eval_wer": 0.5974259203831188,
"step": 848
},
{
"epoch": 106.23,
"learning_rate": 0.00018987341772151899,
"loss": 0.4501,
"step": 850
},
{
"epoch": 106.9,
"eval_loss": 2.13057804107666,
"eval_runtime": 7.3849,
"eval_samples_per_second": 8.531,
"eval_steps_per_second": 1.083,
"eval_wer": 0.5881472612990123,
"step": 856
},
{
"epoch": 107.45,
"learning_rate": 0.00018734177215189873,
"loss": 0.4273,
"step": 860
},
{
"epoch": 107.9,
"eval_loss": 2.134038209915161,
"eval_runtime": 7.4115,
"eval_samples_per_second": 8.5,
"eval_steps_per_second": 1.079,
"eval_wer": 0.5899431307991619,
"step": 864
},
{
"epoch": 108.68,
"learning_rate": 0.0001848101265822785,
"loss": 0.4234,
"step": 870
},
{
"epoch": 108.9,
"eval_loss": 2.1124684810638428,
"eval_runtime": 7.4267,
"eval_samples_per_second": 8.483,
"eval_steps_per_second": 1.077,
"eval_wer": 0.5980245435498354,
"step": 872
},
{
"epoch": 109.9,
"learning_rate": 0.00018227848101265824,
"loss": 0.4289,
"step": 880
},
{
"epoch": 109.9,
"eval_loss": 2.052570104598999,
"eval_runtime": 7.4264,
"eval_samples_per_second": 8.483,
"eval_steps_per_second": 1.077,
"eval_wer": 0.6007183478000598,
"step": 880
},
{
"epoch": 110.9,
"eval_loss": 2.095505714416504,
"eval_runtime": 7.4204,
"eval_samples_per_second": 8.49,
"eval_steps_per_second": 1.078,
"eval_wer": 0.5884465728823706,
"step": 888
},
{
"epoch": 111.23,
"learning_rate": 0.000179746835443038,
"loss": 0.478,
"step": 890
},
{
"epoch": 111.9,
"eval_loss": 2.1146061420440674,
"eval_runtime": 7.4324,
"eval_samples_per_second": 8.476,
"eval_steps_per_second": 1.076,
"eval_wer": 0.5872493265489375,
"step": 896
},
{
"epoch": 112.45,
"learning_rate": 0.00017721518987341773,
"loss": 0.4143,
"step": 900
},
{
"epoch": 112.9,
"eval_loss": 2.230980396270752,
"eval_runtime": 7.4614,
"eval_samples_per_second": 8.443,
"eval_steps_per_second": 1.072,
"eval_wer": 0.5899431307991619,
"step": 904
},
{
"epoch": 113.68,
"learning_rate": 0.00017468354430379748,
"loss": 0.4193,
"step": 910
},
{
"epoch": 113.9,
"eval_loss": 2.2165205478668213,
"eval_runtime": 7.4217,
"eval_samples_per_second": 8.489,
"eval_steps_per_second": 1.078,
"eval_wer": 0.5899431307991619,
"step": 912
},
{
"epoch": 114.9,
"learning_rate": 0.00017215189873417722,
"loss": 0.4159,
"step": 920
},
{
"epoch": 114.9,
"eval_loss": 2.163135528564453,
"eval_runtime": 7.3968,
"eval_samples_per_second": 8.517,
"eval_steps_per_second": 1.082,
"eval_wer": 0.5941334929661778,
"step": 920
},
{
"epoch": 115.9,
"eval_loss": 2.1370790004730225,
"eval_runtime": 7.4829,
"eval_samples_per_second": 8.419,
"eval_steps_per_second": 1.069,
"eval_wer": 0.5938341813828195,
"step": 928
},
{
"epoch": 116.23,
"learning_rate": 0.00016962025316455696,
"loss": 0.4776,
"step": 930
},
{
"epoch": 116.9,
"eval_loss": 2.0972321033477783,
"eval_runtime": 7.416,
"eval_samples_per_second": 8.495,
"eval_steps_per_second": 1.079,
"eval_wer": 0.5935348697994612,
"step": 936
},
{
"epoch": 117.45,
"learning_rate": 0.0001670886075949367,
"loss": 0.4143,
"step": 940
},
{
"epoch": 117.9,
"eval_loss": 2.1247801780700684,
"eval_runtime": 7.4939,
"eval_samples_per_second": 8.407,
"eval_steps_per_second": 1.068,
"eval_wer": 0.5917390002993116,
"step": 944
},
{
"epoch": 118.68,
"learning_rate": 0.00016455696202531648,
"loss": 0.4022,
"step": 950
},
{
"epoch": 118.9,
"eval_loss": 2.1317126750946045,
"eval_runtime": 7.4457,
"eval_samples_per_second": 8.461,
"eval_steps_per_second": 1.074,
"eval_wer": 0.5956300508829692,
"step": 952
},
{
"epoch": 119.9,
"learning_rate": 0.0001620253164556962,
"loss": 0.4346,
"step": 960
},
{
"epoch": 119.9,
"eval_loss": 2.123711347579956,
"eval_runtime": 7.4822,
"eval_samples_per_second": 8.42,
"eval_steps_per_second": 1.069,
"eval_wer": 0.5992217898832685,
"step": 960
},
{
"epoch": 120.9,
"eval_loss": 2.068420648574829,
"eval_runtime": 7.4345,
"eval_samples_per_second": 8.474,
"eval_steps_per_second": 1.076,
"eval_wer": 0.5935348697994612,
"step": 968
},
{
"epoch": 121.23,
"learning_rate": 0.00015949367088607597,
"loss": 0.4564,
"step": 970
},
{
"epoch": 121.9,
"eval_loss": 2.0721840858459473,
"eval_runtime": 7.5192,
"eval_samples_per_second": 8.379,
"eval_steps_per_second": 1.064,
"eval_wer": 0.5947321161328943,
"step": 976
},
{
"epoch": 122.45,
"learning_rate": 0.00015696202531645568,
"loss": 0.4243,
"step": 980
},
{
"epoch": 122.9,
"eval_loss": 2.1361429691314697,
"eval_runtime": 7.41,
"eval_samples_per_second": 8.502,
"eval_steps_per_second": 1.08,
"eval_wer": 0.5884465728823706,
"step": 984
},
{
"epoch": 123.68,
"learning_rate": 0.00015443037974683546,
"loss": 0.413,
"step": 990
},
{
"epoch": 123.9,
"eval_loss": 2.120671510696411,
"eval_runtime": 7.446,
"eval_samples_per_second": 8.461,
"eval_steps_per_second": 1.074,
"eval_wer": 0.5893445076324454,
"step": 992
},
{
"epoch": 124.9,
"learning_rate": 0.0001518987341772152,
"loss": 0.4113,
"step": 1000
},
{
"epoch": 124.9,
"eval_loss": 2.0697362422943115,
"eval_runtime": 7.3738,
"eval_samples_per_second": 8.544,
"eval_steps_per_second": 1.085,
"eval_wer": 0.5836575875486382,
"step": 1000
},
{
"epoch": 125.9,
"eval_loss": 2.1004655361175537,
"eval_runtime": 7.4731,
"eval_samples_per_second": 8.43,
"eval_steps_per_second": 1.071,
"eval_wer": 0.5875486381322957,
"step": 1008
},
{
"epoch": 126.23,
"learning_rate": 0.00014936708860759494,
"loss": 0.4426,
"step": 1010
},
{
"epoch": 126.9,
"eval_loss": 2.082164764404297,
"eval_runtime": 7.3929,
"eval_samples_per_second": 8.522,
"eval_steps_per_second": 1.082,
"eval_wer": 0.5869500149655792,
"step": 1016
},
{
"epoch": 127.45,
"learning_rate": 0.0001468354430379747,
"loss": 0.4255,
"step": 1020
},
{
"epoch": 127.9,
"eval_loss": 2.057152032852173,
"eval_runtime": 7.3561,
"eval_samples_per_second": 8.564,
"eval_steps_per_second": 1.088,
"eval_wer": 0.5959293624663274,
"step": 1024
},
{
"epoch": 128.68,
"learning_rate": 0.00014430379746835443,
"loss": 0.4214,
"step": 1030
},
{
"epoch": 128.9,
"eval_loss": 2.0343050956726074,
"eval_runtime": 7.3751,
"eval_samples_per_second": 8.542,
"eval_steps_per_second": 1.085,
"eval_wer": 0.5935348697994612,
"step": 1032
},
{
"epoch": 129.9,
"learning_rate": 0.00014177215189873418,
"loss": 0.4042,
"step": 1040
},
{
"epoch": 129.9,
"eval_loss": 2.028167486190796,
"eval_runtime": 7.4579,
"eval_samples_per_second": 8.447,
"eval_steps_per_second": 1.073,
"eval_wer": 0.5902424423825202,
"step": 1040
},
{
"epoch": 130.9,
"eval_loss": 2.0313541889190674,
"eval_runtime": 7.451,
"eval_samples_per_second": 8.455,
"eval_steps_per_second": 1.074,
"eval_wer": 0.584555522298713,
"step": 1048
},
{
"epoch": 131.23,
"learning_rate": 0.00013924050632911395,
"loss": 0.4515,
"step": 1050
},
{
"epoch": 131.9,
"eval_loss": 2.0620908737182617,
"eval_runtime": 7.3689,
"eval_samples_per_second": 8.549,
"eval_steps_per_second": 1.086,
"eval_wer": 0.5869500149655792,
"step": 1056
},
{
"epoch": 132.45,
"learning_rate": 0.00013670886075949366,
"loss": 0.4138,
"step": 1060
},
{
"epoch": 132.9,
"eval_loss": 2.0703771114349365,
"eval_runtime": 7.4244,
"eval_samples_per_second": 8.486,
"eval_steps_per_second": 1.078,
"eval_wer": 0.5938341813828195,
"step": 1064
},
{
"epoch": 133.68,
"learning_rate": 0.00013417721518987343,
"loss": 0.4289,
"step": 1070
},
{
"epoch": 133.9,
"eval_loss": 2.0221784114837646,
"eval_runtime": 7.3955,
"eval_samples_per_second": 8.519,
"eval_steps_per_second": 1.082,
"eval_wer": 0.5896438192158037,
"step": 1072
},
{
"epoch": 134.9,
"learning_rate": 0.00013164556962025315,
"loss": 0.3908,
"step": 1080
},
{
"epoch": 134.9,
"eval_loss": 2.087918281555176,
"eval_runtime": 7.4644,
"eval_samples_per_second": 8.44,
"eval_steps_per_second": 1.072,
"eval_wer": 0.5854534570487878,
"step": 1080
},
{
"epoch": 135.9,
"eval_loss": 2.1067752838134766,
"eval_runtime": 7.4189,
"eval_samples_per_second": 8.492,
"eval_steps_per_second": 1.078,
"eval_wer": 0.5821610296318468,
"step": 1088
},
{
"epoch": 136.23,
"learning_rate": 0.00012911392405063292,
"loss": 0.4489,
"step": 1090
},
{
"epoch": 136.9,
"eval_loss": 2.0702497959136963,
"eval_runtime": 7.407,
"eval_samples_per_second": 8.506,
"eval_steps_per_second": 1.08,
"eval_wer": 0.5836575875486382,
"step": 1096
},
{
"epoch": 137.45,
"learning_rate": 0.00012658227848101267,
"loss": 0.4191,
"step": 1100
},
{
"epoch": 137.9,
"eval_loss": 2.1092591285705566,
"eval_runtime": 7.3713,
"eval_samples_per_second": 8.547,
"eval_steps_per_second": 1.085,
"eval_wer": 0.5881472612990123,
"step": 1104
},
{
"epoch": 138.68,
"learning_rate": 0.0001240506329113924,
"loss": 0.4149,
"step": 1110
},
{
"epoch": 138.9,
"eval_loss": 2.1046438217163086,
"eval_runtime": 7.4579,
"eval_samples_per_second": 8.447,
"eval_steps_per_second": 1.073,
"eval_wer": 0.5818617180484885,
"step": 1112
},
{
"epoch": 139.9,
"learning_rate": 0.00012151898734177217,
"loss": 0.4127,
"step": 1120
},
{
"epoch": 139.9,
"eval_loss": 2.1728851795196533,
"eval_runtime": 7.4678,
"eval_samples_per_second": 8.436,
"eval_steps_per_second": 1.071,
"eval_wer": 0.5776713558814726,
"step": 1120
},
{
"epoch": 140.9,
"eval_loss": 2.163623809814453,
"eval_runtime": 7.3779,
"eval_samples_per_second": 8.539,
"eval_steps_per_second": 1.084,
"eval_wer": 0.5809637832984137,
"step": 1128
},
{
"epoch": 141.23,
"learning_rate": 0.0001189873417721519,
"loss": 0.4449,
"step": 1130
},
{
"epoch": 141.9,
"eval_loss": 2.1514804363250732,
"eval_runtime": 7.4355,
"eval_samples_per_second": 8.473,
"eval_steps_per_second": 1.076,
"eval_wer": 0.5785692906315475,
"step": 1136
},
{
"epoch": 142.45,
"learning_rate": 0.00011645569620253166,
"loss": 0.3977,
"step": 1140
},
{
"epoch": 142.9,
"eval_loss": 2.153089761734009,
"eval_runtime": 7.4012,
"eval_samples_per_second": 8.512,
"eval_steps_per_second": 1.081,
"eval_wer": 0.5773720442981143,
"step": 1144
},
{
"epoch": 143.68,
"learning_rate": 0.0001139240506329114,
"loss": 0.4121,
"step": 1150
},
{
"epoch": 143.9,
"eval_loss": 2.0857479572296143,
"eval_runtime": 7.4307,
"eval_samples_per_second": 8.478,
"eval_steps_per_second": 1.077,
"eval_wer": 0.5815624064651302,
"step": 1152
},
{
"epoch": 144.9,
"learning_rate": 0.00011139240506329114,
"loss": 0.4363,
"step": 1160
},
{
"epoch": 144.9,
"eval_loss": 2.137199878692627,
"eval_runtime": 7.4589,
"eval_samples_per_second": 8.446,
"eval_steps_per_second": 1.073,
"eval_wer": 0.5821610296318468,
"step": 1160
},
{
"epoch": 145.9,
"eval_loss": 2.1901986598968506,
"eval_runtime": 7.401,
"eval_samples_per_second": 8.512,
"eval_steps_per_second": 1.081,
"eval_wer": 0.5827596527985633,
"step": 1168
},
{
"epoch": 146.23,
"learning_rate": 0.00010886075949367089,
"loss": 0.4318,
"step": 1170
},
{
"epoch": 146.9,
"eval_loss": 2.1464831829071045,
"eval_runtime": 7.3966,
"eval_samples_per_second": 8.517,
"eval_steps_per_second": 1.082,
"eval_wer": 0.5830589643819216,
"step": 1176
},
{
"epoch": 147.45,
"learning_rate": 0.00010632911392405063,
"loss": 0.4112,
"step": 1180
},
{
"epoch": 147.9,
"eval_loss": 2.0696558952331543,
"eval_runtime": 7.4385,
"eval_samples_per_second": 8.469,
"eval_steps_per_second": 1.075,
"eval_wer": 0.5857527686321461,
"step": 1184
},
{
"epoch": 148.68,
"learning_rate": 0.00010379746835443039,
"loss": 0.4292,
"step": 1190
},
{
"epoch": 148.9,
"eval_loss": 2.084959030151367,
"eval_runtime": 7.5078,
"eval_samples_per_second": 8.391,
"eval_steps_per_second": 1.066,
"eval_wer": 0.5836575875486382,
"step": 1192
},
{
"epoch": 149.9,
"learning_rate": 0.00010126582278481013,
"loss": 0.4182,
"step": 1200
},
{
"epoch": 149.9,
"eval_loss": 2.1171438694000244,
"eval_runtime": 7.4243,
"eval_samples_per_second": 8.486,
"eval_steps_per_second": 1.078,
"eval_wer": 0.584555522298713,
"step": 1200
},
{
"epoch": 150.9,
"eval_loss": 2.1019790172576904,
"eval_runtime": 7.4383,
"eval_samples_per_second": 8.47,
"eval_steps_per_second": 1.076,
"eval_wer": 0.5866507033822209,
"step": 1208
},
{
"epoch": 151.23,
"learning_rate": 9.873417721518988e-05,
"loss": 0.4381,
"step": 1210
},
{
"epoch": 151.9,
"eval_loss": 2.105226516723633,
"eval_runtime": 7.4571,
"eval_samples_per_second": 8.448,
"eval_steps_per_second": 1.073,
"eval_wer": 0.5848548338820713,
"step": 1216
},
{
"epoch": 152.45,
"learning_rate": 9.620253164556962e-05,
"loss": 0.4235,
"step": 1220
},
{
"epoch": 152.9,
"eval_loss": 2.1429975032806396,
"eval_runtime": 7.4629,
"eval_samples_per_second": 8.442,
"eval_steps_per_second": 1.072,
"eval_wer": 0.5863513917988626,
"step": 1224
},
{
"epoch": 153.68,
"learning_rate": 9.367088607594936e-05,
"loss": 0.4173,
"step": 1230
},
{
"epoch": 153.9,
"eval_loss": 2.1130850315093994,
"eval_runtime": 7.4382,
"eval_samples_per_second": 8.47,
"eval_steps_per_second": 1.076,
"eval_wer": 0.5833582759652799,
"step": 1232
},
{
"epoch": 154.9,
"learning_rate": 9.113924050632912e-05,
"loss": 0.3927,
"step": 1240
},
{
"epoch": 154.9,
"eval_loss": 2.113377571105957,
"eval_runtime": 7.4677,
"eval_samples_per_second": 8.436,
"eval_steps_per_second": 1.071,
"eval_wer": 0.584555522298713,
"step": 1240
},
{
"epoch": 155.9,
"eval_loss": 2.117252826690674,
"eval_runtime": 7.4474,
"eval_samples_per_second": 8.459,
"eval_steps_per_second": 1.074,
"eval_wer": 0.584555522298713,
"step": 1248
},
{
"epoch": 156.23,
"learning_rate": 8.860759493670887e-05,
"loss": 0.4492,
"step": 1250
},
{
"epoch": 156.9,
"eval_loss": 2.077221393585205,
"eval_runtime": 7.4748,
"eval_samples_per_second": 8.428,
"eval_steps_per_second": 1.07,
"eval_wer": 0.5800658485483389,
"step": 1256
},
{
"epoch": 157.45,
"learning_rate": 8.607594936708861e-05,
"loss": 0.4313,
"step": 1260
},
{
"epoch": 157.9,
"eval_loss": 2.030902862548828,
"eval_runtime": 7.3649,
"eval_samples_per_second": 8.554,
"eval_steps_per_second": 1.086,
"eval_wer": 0.5860520802155044,
"step": 1264
},
{
"epoch": 158.68,
"learning_rate": 8.354430379746835e-05,
"loss": 0.4015,
"step": 1270
},
{
"epoch": 158.9,
"eval_loss": 2.088667154312134,
"eval_runtime": 7.4182,
"eval_samples_per_second": 8.493,
"eval_steps_per_second": 1.078,
"eval_wer": 0.5818617180484885,
"step": 1272
},
{
"epoch": 159.9,
"learning_rate": 8.10126582278481e-05,
"loss": 0.4268,
"step": 1280
},
{
"epoch": 159.9,
"eval_loss": 2.1811771392822266,
"eval_runtime": 7.3167,
"eval_samples_per_second": 8.61,
"eval_steps_per_second": 1.093,
"eval_wer": 0.5848548338820713,
"step": 1280
},
{
"epoch": 160.9,
"eval_loss": 2.1568429470062256,
"eval_runtime": 7.4406,
"eval_samples_per_second": 8.467,
"eval_steps_per_second": 1.075,
"eval_wer": 0.5881472612990123,
"step": 1288
},
{
"epoch": 161.23,
"learning_rate": 7.848101265822784e-05,
"loss": 0.4496,
"step": 1290
},
{
"epoch": 161.9,
"eval_loss": 2.080479860305786,
"eval_runtime": 7.4143,
"eval_samples_per_second": 8.497,
"eval_steps_per_second": 1.079,
"eval_wer": 0.5800658485483389,
"step": 1296
},
{
"epoch": 162.45,
"learning_rate": 7.59493670886076e-05,
"loss": 0.4121,
"step": 1300
},
{
"epoch": 162.9,
"eval_loss": 2.046131134033203,
"eval_runtime": 7.4233,
"eval_samples_per_second": 8.487,
"eval_steps_per_second": 1.078,
"eval_wer": 0.5872493265489375,
"step": 1304
},
{
"epoch": 163.68,
"learning_rate": 7.341772151898734e-05,
"loss": 0.401,
"step": 1310
},
{
"epoch": 163.9,
"eval_loss": 2.037684202194214,
"eval_runtime": 7.3482,
"eval_samples_per_second": 8.574,
"eval_steps_per_second": 1.089,
"eval_wer": 0.5863513917988626,
"step": 1312
},
{
"epoch": 164.9,
"learning_rate": 7.088607594936709e-05,
"loss": 0.4192,
"step": 1320
},
{
"epoch": 164.9,
"eval_loss": 2.0183184146881104,
"eval_runtime": 7.3373,
"eval_samples_per_second": 8.586,
"eval_steps_per_second": 1.09,
"eval_wer": 0.5872493265489375,
"step": 1320
},
{
"epoch": 165.9,
"eval_loss": 2.0107128620147705,
"eval_runtime": 7.443,
"eval_samples_per_second": 8.464,
"eval_steps_per_second": 1.075,
"eval_wer": 0.5854534570487878,
"step": 1328
},
{
"epoch": 166.23,
"learning_rate": 6.835443037974683e-05,
"loss": 0.4466,
"step": 1330
},
{
"epoch": 166.9,
"eval_loss": 2.052823781967163,
"eval_runtime": 7.4214,
"eval_samples_per_second": 8.489,
"eval_steps_per_second": 1.078,
"eval_wer": 0.5881472612990123,
"step": 1336
},
{
"epoch": 167.45,
"learning_rate": 6.582278481012658e-05,
"loss": 0.3981,
"step": 1340
},
{
"epoch": 167.9,
"eval_loss": 2.05106258392334,
"eval_runtime": 7.4774,
"eval_samples_per_second": 8.425,
"eval_steps_per_second": 1.07,
"eval_wer": 0.587847949715654,
"step": 1344
},
{
"epoch": 168.68,
"learning_rate": 6.329113924050633e-05,
"loss": 0.3967,
"step": 1350
},
{
"epoch": 168.9,
"eval_loss": 2.0374269485473633,
"eval_runtime": 7.4229,
"eval_samples_per_second": 8.487,
"eval_steps_per_second": 1.078,
"eval_wer": 0.5866507033822209,
"step": 1352
},
{
"epoch": 169.9,
"learning_rate": 6.0759493670886084e-05,
"loss": 0.4072,
"step": 1360
},
{
"epoch": 169.9,
"eval_loss": 2.0553550720214844,
"eval_runtime": 7.3678,
"eval_samples_per_second": 8.551,
"eval_steps_per_second": 1.086,
"eval_wer": 0.5866507033822209,
"step": 1360
},
{
"epoch": 170.9,
"eval_loss": 2.0388166904449463,
"eval_runtime": 7.4353,
"eval_samples_per_second": 8.473,
"eval_steps_per_second": 1.076,
"eval_wer": 0.5857527686321461,
"step": 1368
},
{
"epoch": 171.23,
"learning_rate": 5.822784810126583e-05,
"loss": 0.4581,
"step": 1370
},
{
"epoch": 171.9,
"eval_loss": 2.0188472270965576,
"eval_runtime": 7.467,
"eval_samples_per_second": 8.437,
"eval_steps_per_second": 1.071,
"eval_wer": 0.5914396887159533,
"step": 1376
},
{
"epoch": 172.45,
"learning_rate": 5.569620253164557e-05,
"loss": 0.3937,
"step": 1380
},
{
"epoch": 172.9,
"eval_loss": 1.9998791217803955,
"eval_runtime": 7.4081,
"eval_samples_per_second": 8.504,
"eval_steps_per_second": 1.08,
"eval_wer": 0.5851541454654295,
"step": 1384
},
{
"epoch": 173.68,
"learning_rate": 5.3164556962025316e-05,
"loss": 0.4074,
"step": 1390
},
{
"epoch": 173.9,
"eval_loss": 1.9738383293151855,
"eval_runtime": 7.4171,
"eval_samples_per_second": 8.494,
"eval_steps_per_second": 1.079,
"eval_wer": 0.5839568991319964,
"step": 1392
},
{
"epoch": 174.9,
"learning_rate": 5.0632911392405066e-05,
"loss": 0.4085,
"step": 1400
},
{
"epoch": 174.9,
"eval_loss": 2.009026050567627,
"eval_runtime": 7.412,
"eval_samples_per_second": 8.5,
"eval_steps_per_second": 1.079,
"eval_wer": 0.5842562107153547,
"step": 1400
},
{
"epoch": 175.9,
"eval_loss": 1.999009370803833,
"eval_runtime": 7.341,
"eval_samples_per_second": 8.582,
"eval_steps_per_second": 1.09,
"eval_wer": 0.5863513917988626,
"step": 1408
},
{
"epoch": 176.23,
"learning_rate": 4.810126582278481e-05,
"loss": 0.4224,
"step": 1410
},
{
"epoch": 176.9,
"eval_loss": 2.03910756111145,
"eval_runtime": 7.4284,
"eval_samples_per_second": 8.481,
"eval_steps_per_second": 1.077,
"eval_wer": 0.5851541454654295,
"step": 1416
},
{
"epoch": 177.45,
"learning_rate": 4.556962025316456e-05,
"loss": 0.4471,
"step": 1420
},
{
"epoch": 177.9,
"eval_loss": 2.026160955429077,
"eval_runtime": 7.4109,
"eval_samples_per_second": 8.501,
"eval_steps_per_second": 1.079,
"eval_wer": 0.5854534570487878,
"step": 1424
},
{
"epoch": 178.68,
"learning_rate": 4.3037974683544305e-05,
"loss": 0.4233,
"step": 1430
},
{
"epoch": 178.9,
"eval_loss": 2.0620737075805664,
"eval_runtime": 7.4368,
"eval_samples_per_second": 8.471,
"eval_steps_per_second": 1.076,
"eval_wer": 0.5800658485483389,
"step": 1432
},
{
"epoch": 179.9,
"learning_rate": 4.050632911392405e-05,
"loss": 0.409,
"step": 1440
},
{
"epoch": 179.9,
"eval_loss": 2.048555612564087,
"eval_runtime": 7.408,
"eval_samples_per_second": 8.504,
"eval_steps_per_second": 1.08,
"eval_wer": 0.584555522298713,
"step": 1440
},
{
"epoch": 180.9,
"eval_loss": 2.050809383392334,
"eval_runtime": 7.4021,
"eval_samples_per_second": 8.511,
"eval_steps_per_second": 1.081,
"eval_wer": 0.5806644717150554,
"step": 1448
},
{
"epoch": 181.23,
"learning_rate": 3.79746835443038e-05,
"loss": 0.4518,
"step": 1450
},
{
"epoch": 181.9,
"eval_loss": 2.024106979370117,
"eval_runtime": 7.3365,
"eval_samples_per_second": 8.587,
"eval_steps_per_second": 1.09,
"eval_wer": 0.5887458844657288,
"step": 1456
},
{
"epoch": 182.45,
"learning_rate": 3.5443037974683544e-05,
"loss": 0.4077,
"step": 1460
},
{
"epoch": 182.9,
"eval_loss": 2.0168745517730713,
"eval_runtime": 7.4996,
"eval_samples_per_second": 8.4,
"eval_steps_per_second": 1.067,
"eval_wer": 0.5842562107153547,
"step": 1464
},
{
"epoch": 183.68,
"learning_rate": 3.291139240506329e-05,
"loss": 0.4197,
"step": 1470
},
{
"epoch": 183.9,
"eval_loss": 2.001417636871338,
"eval_runtime": 7.4742,
"eval_samples_per_second": 8.429,
"eval_steps_per_second": 1.07,
"eval_wer": 0.5896438192158037,
"step": 1472
},
{
"epoch": 184.9,
"learning_rate": 3.0379746835443042e-05,
"loss": 0.4237,
"step": 1480
},
{
"epoch": 184.9,
"eval_loss": 2.018913507461548,
"eval_runtime": 7.5256,
"eval_samples_per_second": 8.371,
"eval_steps_per_second": 1.063,
"eval_wer": 0.5842562107153547,
"step": 1480
},
{
"epoch": 185.9,
"eval_loss": 2.0095009803771973,
"eval_runtime": 7.4628,
"eval_samples_per_second": 8.442,
"eval_steps_per_second": 1.072,
"eval_wer": 0.5866507033822209,
"step": 1488
},
{
"epoch": 186.23,
"learning_rate": 2.7848101265822786e-05,
"loss": 0.4394,
"step": 1490
},
{
"epoch": 186.9,
"eval_loss": 1.9993491172790527,
"eval_runtime": 7.4937,
"eval_samples_per_second": 8.407,
"eval_steps_per_second": 1.068,
"eval_wer": 0.5884465728823706,
"step": 1496
},
{
"epoch": 187.45,
"learning_rate": 2.5316455696202533e-05,
"loss": 0.4299,
"step": 1500
},
{
"epoch": 187.9,
"eval_loss": 2.009735345840454,
"eval_runtime": 7.4524,
"eval_samples_per_second": 8.454,
"eval_steps_per_second": 1.073,
"eval_wer": 0.5899431307991619,
"step": 1504
},
{
"epoch": 188.68,
"learning_rate": 2.278481012658228e-05,
"loss": 0.4198,
"step": 1510
},
{
"epoch": 188.9,
"eval_loss": 2.004906177520752,
"eval_runtime": 7.476,
"eval_samples_per_second": 8.427,
"eval_steps_per_second": 1.07,
"eval_wer": 0.5869500149655792,
"step": 1512
},
{
"epoch": 189.9,
"learning_rate": 2.0253164556962025e-05,
"loss": 0.4116,
"step": 1520
},
{
"epoch": 189.9,
"eval_loss": 1.989935040473938,
"eval_runtime": 7.5052,
"eval_samples_per_second": 8.394,
"eval_steps_per_second": 1.066,
"eval_wer": 0.5875486381322957,
"step": 1520
},
{
"epoch": 190.9,
"eval_loss": 1.9814202785491943,
"eval_runtime": 7.5147,
"eval_samples_per_second": 8.384,
"eval_steps_per_second": 1.065,
"eval_wer": 0.5881472612990123,
"step": 1528
},
{
"epoch": 191.23,
"learning_rate": 1.7721518987341772e-05,
"loss": 0.445,
"step": 1530
},
{
"epoch": 191.9,
"eval_loss": 1.9819977283477783,
"eval_runtime": 7.4909,
"eval_samples_per_second": 8.41,
"eval_steps_per_second": 1.068,
"eval_wer": 0.5887458844657288,
"step": 1536
},
{
"epoch": 192.45,
"learning_rate": 1.5189873417721521e-05,
"loss": 0.4198,
"step": 1540
},
{
"epoch": 192.9,
"eval_loss": 1.9838072061538696,
"eval_runtime": 7.5105,
"eval_samples_per_second": 8.388,
"eval_steps_per_second": 1.065,
"eval_wer": 0.5881472612990123,
"step": 1544
},
{
"epoch": 193.68,
"learning_rate": 1.2658227848101267e-05,
"loss": 0.4065,
"step": 1550
},
{
"epoch": 193.9,
"eval_loss": 1.984854817390442,
"eval_runtime": 7.4309,
"eval_samples_per_second": 8.478,
"eval_steps_per_second": 1.077,
"eval_wer": 0.5884465728823706,
"step": 1552
},
{
"epoch": 194.9,
"learning_rate": 1.0126582278481012e-05,
"loss": 0.3917,
"step": 1560
},
{
"epoch": 194.9,
"eval_loss": 1.980286717414856,
"eval_runtime": 7.5285,
"eval_samples_per_second": 8.368,
"eval_steps_per_second": 1.063,
"eval_wer": 0.5866507033822209,
"step": 1560
},
{
"epoch": 195.9,
"eval_loss": 1.9776644706726074,
"eval_runtime": 7.4846,
"eval_samples_per_second": 8.417,
"eval_steps_per_second": 1.069,
"eval_wer": 0.5881472612990123,
"step": 1568
},
{
"epoch": 196.23,
"learning_rate": 7.5949367088607605e-06,
"loss": 0.4239,
"step": 1570
},
{
"epoch": 196.9,
"eval_loss": 1.9751547574996948,
"eval_runtime": 7.4451,
"eval_samples_per_second": 8.462,
"eval_steps_per_second": 1.075,
"eval_wer": 0.5875486381322957,
"step": 1576
},
{
"epoch": 197.45,
"learning_rate": 5.063291139240506e-06,
"loss": 0.4183,
"step": 1580
},
{
"epoch": 197.9,
"eval_loss": 1.9765574932098389,
"eval_runtime": 7.4708,
"eval_samples_per_second": 8.433,
"eval_steps_per_second": 1.071,
"eval_wer": 0.5872493265489375,
"step": 1584
},
{
"epoch": 198.68,
"learning_rate": 2.531645569620253e-06,
"loss": 0.3965,
"step": 1590
},
{
"epoch": 198.9,
"eval_loss": 1.9772560596466064,
"eval_runtime": 7.4376,
"eval_samples_per_second": 8.471,
"eval_steps_per_second": 1.076,
"eval_wer": 0.5872493265489375,
"step": 1592
},
{
"epoch": 199.9,
"learning_rate": 0.0,
"loss": 0.4144,
"step": 1600
},
{
"epoch": 199.9,
"eval_loss": 1.9781134128570557,
"eval_runtime": 7.3567,
"eval_samples_per_second": 8.564,
"eval_steps_per_second": 1.087,
"eval_wer": 0.5872493265489375,
"step": 1600
},
{
"epoch": 199.9,
"step": 1600,
"total_flos": 1.1848602213269387e+19,
"train_loss": 0.4494818127155304,
"train_runtime": 18323.7781,
"train_samples_per_second": 6.145,
"train_steps_per_second": 0.087
}
],
"max_steps": 1600,
"num_train_epochs": 200,
"total_flos": 1.1848602213269387e+19,
"trial_name": null,
"trial_params": null
}