gary109's picture
End of training
642e48b
raw
history blame
67.5 kB
{
"best_metric": 1.9551260471343994,
"best_model_checkpoint": "ai-light-dance_drums_ft_pretrain_wav2vec2-base/checkpoint-1408",
"epoch": 199.90140845070422,
"global_step": 1600,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.9,
"eval_loss": 2.037254571914673,
"eval_runtime": 7.6198,
"eval_samples_per_second": 8.268,
"eval_steps_per_second": 1.05,
"eval_wer": 0.6779407363064951,
"step": 8
},
{
"epoch": 1.23,
"learning_rate": 0.0002,
"loss": 0.6674,
"step": 10
},
{
"epoch": 1.9,
"eval_loss": 2.2592625617980957,
"eval_runtime": 7.6185,
"eval_samples_per_second": 8.269,
"eval_steps_per_second": 1.05,
"eval_wer": 0.6749476204729123,
"step": 16
},
{
"epoch": 2.45,
"learning_rate": 0.0004,
"loss": 0.6653,
"step": 20
},
{
"epoch": 2.9,
"eval_loss": 2.043417453765869,
"eval_runtime": 7.6392,
"eval_samples_per_second": 8.247,
"eval_steps_per_second": 1.047,
"eval_wer": 0.6668662077222388,
"step": 24
},
{
"epoch": 3.68,
"learning_rate": 0.00039746835443037974,
"loss": 0.7249,
"step": 30
},
{
"epoch": 3.9,
"eval_loss": 2.1789791584014893,
"eval_runtime": 7.6684,
"eval_samples_per_second": 8.216,
"eval_steps_per_second": 1.043,
"eval_wer": 0.6935049386411254,
"step": 32
},
{
"epoch": 4.9,
"learning_rate": 0.0003949367088607595,
"loss": 0.683,
"step": 40
},
{
"epoch": 4.9,
"eval_loss": 2.1209700107574463,
"eval_runtime": 7.7094,
"eval_samples_per_second": 8.172,
"eval_steps_per_second": 1.038,
"eval_wer": 0.6866207722238851,
"step": 40
},
{
"epoch": 5.9,
"eval_loss": 2.240757703781128,
"eval_runtime": 7.6326,
"eval_samples_per_second": 8.254,
"eval_steps_per_second": 1.048,
"eval_wer": 0.6803352289733613,
"step": 48
},
{
"epoch": 6.23,
"learning_rate": 0.0003924050632911393,
"loss": 0.7518,
"step": 50
},
{
"epoch": 6.9,
"eval_loss": 2.28826642036438,
"eval_runtime": 7.57,
"eval_samples_per_second": 8.322,
"eval_steps_per_second": 1.057,
"eval_wer": 0.6902125112241844,
"step": 56
},
{
"epoch": 7.45,
"learning_rate": 0.000389873417721519,
"loss": 0.686,
"step": 60
},
{
"epoch": 7.9,
"eval_loss": 2.1073131561279297,
"eval_runtime": 7.7427,
"eval_samples_per_second": 8.137,
"eval_steps_per_second": 1.033,
"eval_wer": 0.6818317868901527,
"step": 64
},
{
"epoch": 8.68,
"learning_rate": 0.00038734177215189877,
"loss": 0.6771,
"step": 70
},
{
"epoch": 8.9,
"eval_loss": 2.340881109237671,
"eval_runtime": 7.6198,
"eval_samples_per_second": 8.268,
"eval_steps_per_second": 1.05,
"eval_wer": 0.6689613888057467,
"step": 72
},
{
"epoch": 9.9,
"learning_rate": 0.0003848101265822785,
"loss": 0.6593,
"step": 80
},
{
"epoch": 9.9,
"eval_loss": 2.4714651107788086,
"eval_runtime": 7.6918,
"eval_samples_per_second": 8.191,
"eval_steps_per_second": 1.04,
"eval_wer": 0.6602813528883568,
"step": 80
},
{
"epoch": 10.9,
"eval_loss": 2.097456455230713,
"eval_runtime": 7.666,
"eval_samples_per_second": 8.218,
"eval_steps_per_second": 1.044,
"eval_wer": 0.6722538162226879,
"step": 88
},
{
"epoch": 11.23,
"learning_rate": 0.00038227848101265825,
"loss": 0.7433,
"step": 90
},
{
"epoch": 11.9,
"eval_loss": 2.033815860748291,
"eval_runtime": 7.6612,
"eval_samples_per_second": 8.223,
"eval_steps_per_second": 1.044,
"eval_wer": 0.6728524393894044,
"step": 96
},
{
"epoch": 12.45,
"learning_rate": 0.00037974683544303797,
"loss": 0.6497,
"step": 100
},
{
"epoch": 12.9,
"eval_loss": 2.141453266143799,
"eval_runtime": 7.6044,
"eval_samples_per_second": 8.285,
"eval_steps_per_second": 1.052,
"eval_wer": 0.6824304100568692,
"step": 104
},
{
"epoch": 13.68,
"learning_rate": 0.00037721518987341774,
"loss": 0.6497,
"step": 110
},
{
"epoch": 13.9,
"eval_loss": 2.181793689727783,
"eval_runtime": 7.6888,
"eval_samples_per_second": 8.194,
"eval_steps_per_second": 1.04,
"eval_wer": 0.6653696498054474,
"step": 112
},
{
"epoch": 14.9,
"learning_rate": 0.00037468354430379746,
"loss": 0.6799,
"step": 120
},
{
"epoch": 14.9,
"eval_loss": 2.0863850116729736,
"eval_runtime": 7.6642,
"eval_samples_per_second": 8.22,
"eval_steps_per_second": 1.044,
"eval_wer": 0.6755462436396289,
"step": 120
},
{
"epoch": 15.9,
"eval_loss": 2.4925379753112793,
"eval_runtime": 7.6569,
"eval_samples_per_second": 8.228,
"eval_steps_per_second": 1.045,
"eval_wer": 0.6797366058066447,
"step": 128
},
{
"epoch": 16.23,
"learning_rate": 0.00037215189873417723,
"loss": 0.7459,
"step": 130
},
{
"epoch": 16.9,
"eval_loss": 2.335496425628662,
"eval_runtime": 7.6286,
"eval_samples_per_second": 8.258,
"eval_steps_per_second": 1.049,
"eval_wer": 0.6860221490571685,
"step": 136
},
{
"epoch": 17.45,
"learning_rate": 0.000369620253164557,
"loss": 0.6576,
"step": 140
},
{
"epoch": 17.9,
"eval_loss": 2.234079360961914,
"eval_runtime": 7.6403,
"eval_samples_per_second": 8.246,
"eval_steps_per_second": 1.047,
"eval_wer": 0.6704579467225381,
"step": 144
},
{
"epoch": 18.68,
"learning_rate": 0.0003670886075949367,
"loss": 0.6798,
"step": 150
},
{
"epoch": 18.9,
"eval_loss": 2.142047643661499,
"eval_runtime": 7.5893,
"eval_samples_per_second": 8.301,
"eval_steps_per_second": 1.054,
"eval_wer": 0.6614785992217899,
"step": 152
},
{
"epoch": 19.9,
"learning_rate": 0.0003645569620253165,
"loss": 0.6479,
"step": 160
},
{
"epoch": 19.9,
"eval_loss": 2.4265201091766357,
"eval_runtime": 7.5945,
"eval_samples_per_second": 8.296,
"eval_steps_per_second": 1.053,
"eval_wer": 0.6755462436396289,
"step": 160
},
{
"epoch": 20.9,
"eval_loss": 2.300034523010254,
"eval_runtime": 7.6736,
"eval_samples_per_second": 8.21,
"eval_steps_per_second": 1.043,
"eval_wer": 0.6944028733912002,
"step": 168
},
{
"epoch": 21.23,
"learning_rate": 0.00036202531645569626,
"loss": 0.708,
"step": 170
},
{
"epoch": 21.9,
"eval_loss": 2.246602773666382,
"eval_runtime": 7.6898,
"eval_samples_per_second": 8.193,
"eval_steps_per_second": 1.04,
"eval_wer": 0.6731517509727627,
"step": 176
},
{
"epoch": 22.45,
"learning_rate": 0.000359493670886076,
"loss": 0.6596,
"step": 180
},
{
"epoch": 22.9,
"eval_loss": 2.4366281032562256,
"eval_runtime": 7.6554,
"eval_samples_per_second": 8.23,
"eval_steps_per_second": 1.045,
"eval_wer": 0.6776414247231368,
"step": 184
},
{
"epoch": 23.68,
"learning_rate": 0.0003569620253164557,
"loss": 0.643,
"step": 190
},
{
"epoch": 23.9,
"eval_loss": 2.091036081314087,
"eval_runtime": 7.7242,
"eval_samples_per_second": 8.156,
"eval_steps_per_second": 1.036,
"eval_wer": 0.6513020053876085,
"step": 192
},
{
"epoch": 24.9,
"learning_rate": 0.00035443037974683546,
"loss": 0.6644,
"step": 200
},
{
"epoch": 24.9,
"eval_loss": 2.265995740890503,
"eval_runtime": 7.6041,
"eval_samples_per_second": 8.285,
"eval_steps_per_second": 1.052,
"eval_wer": 0.6644717150553726,
"step": 200
},
{
"epoch": 25.9,
"eval_loss": 2.1543314456939697,
"eval_runtime": 7.6598,
"eval_samples_per_second": 8.225,
"eval_steps_per_second": 1.044,
"eval_wer": 0.6764441783897037,
"step": 208
},
{
"epoch": 26.23,
"learning_rate": 0.00035189873417721524,
"loss": 0.6936,
"step": 210
},
{
"epoch": 26.9,
"eval_loss": 2.150484561920166,
"eval_runtime": 7.5916,
"eval_samples_per_second": 8.299,
"eval_steps_per_second": 1.054,
"eval_wer": 0.6698593235558216,
"step": 216
},
{
"epoch": 27.45,
"learning_rate": 0.00034936708860759495,
"loss": 0.6338,
"step": 220
},
{
"epoch": 27.9,
"eval_loss": 2.2812647819519043,
"eval_runtime": 7.6091,
"eval_samples_per_second": 8.28,
"eval_steps_per_second": 1.051,
"eval_wer": 0.6707572583058964,
"step": 224
},
{
"epoch": 28.68,
"learning_rate": 0.00034683544303797467,
"loss": 0.6393,
"step": 230
},
{
"epoch": 28.9,
"eval_loss": 2.103980779647827,
"eval_runtime": 7.6072,
"eval_samples_per_second": 8.282,
"eval_steps_per_second": 1.052,
"eval_wer": 0.6596827297216402,
"step": 232
},
{
"epoch": 29.9,
"learning_rate": 0.00034430379746835444,
"loss": 0.6378,
"step": 240
},
{
"epoch": 29.9,
"eval_loss": 2.2749102115631104,
"eval_runtime": 7.6923,
"eval_samples_per_second": 8.19,
"eval_steps_per_second": 1.04,
"eval_wer": 0.6740496857228375,
"step": 240
},
{
"epoch": 30.9,
"eval_loss": 2.109790802001953,
"eval_runtime": 7.5197,
"eval_samples_per_second": 8.378,
"eval_steps_per_second": 1.064,
"eval_wer": 0.6611792876384316,
"step": 248
},
{
"epoch": 31.23,
"learning_rate": 0.0003417721518987342,
"loss": 0.6829,
"step": 250
},
{
"epoch": 31.9,
"eval_loss": 2.1962344646453857,
"eval_runtime": 7.7439,
"eval_samples_per_second": 8.135,
"eval_steps_per_second": 1.033,
"eval_wer": 0.6513020053876085,
"step": 256
},
{
"epoch": 32.45,
"learning_rate": 0.00033924050632911393,
"loss": 0.6002,
"step": 260
},
{
"epoch": 32.9,
"eval_loss": 2.131077289581299,
"eval_runtime": 7.5878,
"eval_samples_per_second": 8.303,
"eval_steps_per_second": 1.054,
"eval_wer": 0.6617779108051481,
"step": 264
},
{
"epoch": 33.68,
"learning_rate": 0.0003367088607594937,
"loss": 0.6656,
"step": 270
},
{
"epoch": 33.9,
"eval_loss": 2.2650504112243652,
"eval_runtime": 7.6783,
"eval_samples_per_second": 8.205,
"eval_steps_per_second": 1.042,
"eval_wer": 0.6510026938042502,
"step": 272
},
{
"epoch": 34.9,
"learning_rate": 0.0003341772151898734,
"loss": 0.633,
"step": 280
},
{
"epoch": 34.9,
"eval_loss": 2.2622334957122803,
"eval_runtime": 7.6997,
"eval_samples_per_second": 8.182,
"eval_steps_per_second": 1.039,
"eval_wer": 0.6513020053876085,
"step": 280
},
{
"epoch": 35.9,
"eval_loss": 2.2585790157318115,
"eval_runtime": 7.6561,
"eval_samples_per_second": 8.229,
"eval_steps_per_second": 1.045,
"eval_wer": 0.6620772223885064,
"step": 288
},
{
"epoch": 36.23,
"learning_rate": 0.0003316455696202532,
"loss": 0.6644,
"step": 290
},
{
"epoch": 36.9,
"eval_loss": 2.4157793521881104,
"eval_runtime": 7.6013,
"eval_samples_per_second": 8.288,
"eval_steps_per_second": 1.052,
"eval_wer": 0.6593834181382819,
"step": 296
},
{
"epoch": 37.45,
"learning_rate": 0.00032911392405063296,
"loss": 0.6235,
"step": 300
},
{
"epoch": 37.9,
"eval_loss": 2.425449848175049,
"eval_runtime": 7.5997,
"eval_samples_per_second": 8.29,
"eval_steps_per_second": 1.053,
"eval_wer": 0.6477102663873092,
"step": 304
},
{
"epoch": 38.68,
"learning_rate": 0.0003265822784810127,
"loss": 0.6041,
"step": 310
},
{
"epoch": 38.9,
"eval_loss": 2.308098793029785,
"eval_runtime": 7.8174,
"eval_samples_per_second": 8.059,
"eval_steps_per_second": 1.023,
"eval_wer": 0.6632744687219395,
"step": 312
},
{
"epoch": 39.9,
"learning_rate": 0.0003240506329113924,
"loss": 0.6215,
"step": 320
},
{
"epoch": 39.9,
"eval_loss": 2.425708532333374,
"eval_runtime": 7.5701,
"eval_samples_per_second": 8.322,
"eval_steps_per_second": 1.057,
"eval_wer": 0.6498054474708171,
"step": 320
},
{
"epoch": 40.9,
"eval_loss": 2.301248550415039,
"eval_runtime": 7.574,
"eval_samples_per_second": 8.318,
"eval_steps_per_second": 1.056,
"eval_wer": 0.6366357378030529,
"step": 328
},
{
"epoch": 41.23,
"learning_rate": 0.00032151898734177216,
"loss": 0.6684,
"step": 330
},
{
"epoch": 41.9,
"eval_loss": 2.2059545516967773,
"eval_runtime": 7.5863,
"eval_samples_per_second": 8.304,
"eval_steps_per_second": 1.055,
"eval_wer": 0.6584854833882071,
"step": 336
},
{
"epoch": 42.45,
"learning_rate": 0.00031898734177215193,
"loss": 0.6201,
"step": 340
},
{
"epoch": 42.9,
"eval_loss": 2.030762195587158,
"eval_runtime": 7.5021,
"eval_samples_per_second": 8.398,
"eval_steps_per_second": 1.066,
"eval_wer": 0.6680634540556719,
"step": 344
},
{
"epoch": 43.68,
"learning_rate": 0.00031645569620253165,
"loss": 0.5957,
"step": 350
},
{
"epoch": 43.9,
"eval_loss": 2.137511730194092,
"eval_runtime": 7.6442,
"eval_samples_per_second": 8.242,
"eval_steps_per_second": 1.047,
"eval_wer": 0.6575875486381323,
"step": 352
},
{
"epoch": 44.9,
"learning_rate": 0.00031392405063291137,
"loss": 0.6158,
"step": 360
},
{
"epoch": 44.9,
"eval_loss": 2.0826189517974854,
"eval_runtime": 7.5707,
"eval_samples_per_second": 8.322,
"eval_steps_per_second": 1.057,
"eval_wer": 0.6671655193055971,
"step": 360
},
{
"epoch": 45.9,
"eval_loss": 2.198957681655884,
"eval_runtime": 7.6122,
"eval_samples_per_second": 8.276,
"eval_steps_per_second": 1.051,
"eval_wer": 0.6584854833882071,
"step": 368
},
{
"epoch": 46.23,
"learning_rate": 0.0003113924050632912,
"loss": 0.6291,
"step": 370
},
{
"epoch": 46.9,
"eval_loss": 2.054161787033081,
"eval_runtime": 7.6382,
"eval_samples_per_second": 8.248,
"eval_steps_per_second": 1.047,
"eval_wer": 0.6650703382220892,
"step": 376
},
{
"epoch": 47.45,
"learning_rate": 0.0003088607594936709,
"loss": 0.5924,
"step": 380
},
{
"epoch": 47.9,
"eval_loss": 2.057255983352661,
"eval_runtime": 7.5837,
"eval_samples_per_second": 8.307,
"eval_steps_per_second": 1.055,
"eval_wer": 0.653995809637833,
"step": 384
},
{
"epoch": 48.68,
"learning_rate": 0.00030632911392405063,
"loss": 0.6063,
"step": 390
},
{
"epoch": 48.9,
"eval_loss": 2.248441457748413,
"eval_runtime": 7.5574,
"eval_samples_per_second": 8.336,
"eval_steps_per_second": 1.059,
"eval_wer": 0.6530978748877582,
"step": 392
},
{
"epoch": 49.9,
"learning_rate": 0.0003037974683544304,
"loss": 0.5984,
"step": 400
},
{
"epoch": 49.9,
"eval_loss": 2.0361733436584473,
"eval_runtime": 7.6951,
"eval_samples_per_second": 8.187,
"eval_steps_per_second": 1.04,
"eval_wer": 0.660580664471715,
"step": 400
},
{
"epoch": 50.9,
"eval_loss": 2.1027872562408447,
"eval_runtime": 7.6986,
"eval_samples_per_second": 8.183,
"eval_steps_per_second": 1.039,
"eval_wer": 0.6554923675546244,
"step": 408
},
{
"epoch": 51.23,
"learning_rate": 0.00030126582278481017,
"loss": 0.6309,
"step": 410
},
{
"epoch": 51.9,
"eval_loss": 2.2151310443878174,
"eval_runtime": 7.7336,
"eval_samples_per_second": 8.146,
"eval_steps_per_second": 1.034,
"eval_wer": 0.6590841065549237,
"step": 416
},
{
"epoch": 52.45,
"learning_rate": 0.0002987341772151899,
"loss": 0.5979,
"step": 420
},
{
"epoch": 52.9,
"eval_loss": 2.0955023765563965,
"eval_runtime": 7.7001,
"eval_samples_per_second": 8.182,
"eval_steps_per_second": 1.039,
"eval_wer": 0.6608799760550733,
"step": 424
},
{
"epoch": 53.68,
"learning_rate": 0.0002962025316455696,
"loss": 0.5941,
"step": 430
},
{
"epoch": 53.9,
"eval_loss": 2.2526333332061768,
"eval_runtime": 7.6578,
"eval_samples_per_second": 8.227,
"eval_steps_per_second": 1.045,
"eval_wer": 0.6731517509727627,
"step": 432
},
{
"epoch": 54.9,
"learning_rate": 0.0002936708860759494,
"loss": 0.5897,
"step": 440
},
{
"epoch": 54.9,
"eval_loss": 2.385159492492676,
"eval_runtime": 7.7372,
"eval_samples_per_second": 8.143,
"eval_steps_per_second": 1.034,
"eval_wer": 0.6542951212211913,
"step": 440
},
{
"epoch": 55.9,
"eval_loss": 2.080392837524414,
"eval_runtime": 7.6943,
"eval_samples_per_second": 8.188,
"eval_steps_per_second": 1.04,
"eval_wer": 0.6563903023046992,
"step": 448
},
{
"epoch": 56.23,
"learning_rate": 0.00029113924050632915,
"loss": 0.6443,
"step": 450
},
{
"epoch": 56.9,
"eval_loss": 2.002680778503418,
"eval_runtime": 7.6599,
"eval_samples_per_second": 8.225,
"eval_steps_per_second": 1.044,
"eval_wer": 0.6569889254714157,
"step": 456
},
{
"epoch": 57.45,
"learning_rate": 0.00028860759493670886,
"loss": 0.6055,
"step": 460
},
{
"epoch": 57.9,
"eval_loss": 2.1207001209259033,
"eval_runtime": 7.74,
"eval_samples_per_second": 8.14,
"eval_steps_per_second": 1.034,
"eval_wer": 0.6635737803052978,
"step": 464
},
{
"epoch": 58.68,
"learning_rate": 0.00028607594936708863,
"loss": 0.5422,
"step": 470
},
{
"epoch": 58.9,
"eval_loss": 2.2515547275543213,
"eval_runtime": 7.7005,
"eval_samples_per_second": 8.181,
"eval_steps_per_second": 1.039,
"eval_wer": 0.6617779108051481,
"step": 472
},
{
"epoch": 59.9,
"learning_rate": 0.00028354430379746835,
"loss": 0.5879,
"step": 480
},
{
"epoch": 59.9,
"eval_loss": 2.002816915512085,
"eval_runtime": 7.6055,
"eval_samples_per_second": 8.284,
"eval_steps_per_second": 1.052,
"eval_wer": 0.6548937443879078,
"step": 480
},
{
"epoch": 60.9,
"eval_loss": 2.3659348487854004,
"eval_runtime": 7.5632,
"eval_samples_per_second": 8.33,
"eval_steps_per_second": 1.058,
"eval_wer": 0.6575875486381323,
"step": 488
},
{
"epoch": 61.23,
"learning_rate": 0.0002810126582278481,
"loss": 0.638,
"step": 490
},
{
"epoch": 61.9,
"eval_loss": 2.499941825866699,
"eval_runtime": 7.5886,
"eval_samples_per_second": 8.302,
"eval_steps_per_second": 1.054,
"eval_wer": 0.6551930559712661,
"step": 496
},
{
"epoch": 62.45,
"learning_rate": 0.0002784810126582279,
"loss": 0.5874,
"step": 500
},
{
"epoch": 62.9,
"eval_loss": 2.3140323162078857,
"eval_runtime": 7.6729,
"eval_samples_per_second": 8.211,
"eval_steps_per_second": 1.043,
"eval_wer": 0.6483088895540258,
"step": 504
},
{
"epoch": 63.68,
"learning_rate": 0.0002759493670886076,
"loss": 0.5829,
"step": 510
},
{
"epoch": 63.9,
"eval_loss": 2.208669900894165,
"eval_runtime": 7.6542,
"eval_samples_per_second": 8.231,
"eval_steps_per_second": 1.045,
"eval_wer": 0.6408260999700689,
"step": 512
},
{
"epoch": 64.9,
"learning_rate": 0.0002734177215189873,
"loss": 0.5632,
"step": 520
},
{
"epoch": 64.9,
"eval_loss": 2.1988563537597656,
"eval_runtime": 7.7231,
"eval_samples_per_second": 8.157,
"eval_steps_per_second": 1.036,
"eval_wer": 0.6533971864711164,
"step": 520
},
{
"epoch": 65.9,
"eval_loss": 2.244645118713379,
"eval_runtime": 7.7705,
"eval_samples_per_second": 8.108,
"eval_steps_per_second": 1.03,
"eval_wer": 0.6623765339718647,
"step": 528
},
{
"epoch": 66.23,
"learning_rate": 0.0002708860759493671,
"loss": 0.6143,
"step": 530
},
{
"epoch": 66.9,
"eval_loss": 2.1098854541778564,
"eval_runtime": 7.5934,
"eval_samples_per_second": 8.297,
"eval_steps_per_second": 1.054,
"eval_wer": 0.642023346303502,
"step": 536
},
{
"epoch": 67.45,
"learning_rate": 0.00026835443037974687,
"loss": 0.5924,
"step": 540
},
{
"epoch": 67.9,
"eval_loss": 2.237240791320801,
"eval_runtime": 7.6205,
"eval_samples_per_second": 8.267,
"eval_steps_per_second": 1.05,
"eval_wer": 0.6423226578868603,
"step": 544
},
{
"epoch": 68.68,
"learning_rate": 0.0002658227848101266,
"loss": 0.5239,
"step": 550
},
{
"epoch": 68.9,
"eval_loss": 2.348794460296631,
"eval_runtime": 7.6413,
"eval_samples_per_second": 8.245,
"eval_steps_per_second": 1.047,
"eval_wer": 0.645315773720443,
"step": 552
},
{
"epoch": 69.9,
"learning_rate": 0.0002632911392405063,
"loss": 0.5883,
"step": 560
},
{
"epoch": 69.9,
"eval_loss": 2.196101427078247,
"eval_runtime": 7.6374,
"eval_samples_per_second": 8.249,
"eval_steps_per_second": 1.047,
"eval_wer": 0.6438192158036516,
"step": 560
},
{
"epoch": 70.9,
"eval_loss": 2.2004334926605225,
"eval_runtime": 7.62,
"eval_samples_per_second": 8.268,
"eval_steps_per_second": 1.05,
"eval_wer": 0.6309488177192457,
"step": 568
},
{
"epoch": 71.23,
"learning_rate": 0.00026075949367088613,
"loss": 0.5918,
"step": 570
},
{
"epoch": 71.9,
"eval_loss": 2.020232677459717,
"eval_runtime": 7.6799,
"eval_samples_per_second": 8.203,
"eval_steps_per_second": 1.042,
"eval_wer": 0.6336426219694702,
"step": 576
},
{
"epoch": 72.45,
"learning_rate": 0.00025822784810126584,
"loss": 0.5602,
"step": 580
},
{
"epoch": 72.9,
"eval_loss": 2.0783603191375732,
"eval_runtime": 7.6645,
"eval_samples_per_second": 8.22,
"eval_steps_per_second": 1.044,
"eval_wer": 0.6372343609697695,
"step": 584
},
{
"epoch": 73.68,
"learning_rate": 0.00025569620253164556,
"loss": 0.5323,
"step": 590
},
{
"epoch": 73.9,
"eval_loss": 2.1598377227783203,
"eval_runtime": 7.5941,
"eval_samples_per_second": 8.296,
"eval_steps_per_second": 1.053,
"eval_wer": 0.657288237054774,
"step": 592
},
{
"epoch": 74.9,
"learning_rate": 0.00025316455696202533,
"loss": 0.5584,
"step": 600
},
{
"epoch": 74.9,
"eval_loss": 2.1240878105163574,
"eval_runtime": 7.7267,
"eval_samples_per_second": 8.154,
"eval_steps_per_second": 1.035,
"eval_wer": 0.6351391798862616,
"step": 600
},
{
"epoch": 75.9,
"eval_loss": 2.113551616668701,
"eval_runtime": 7.6206,
"eval_samples_per_second": 8.267,
"eval_steps_per_second": 1.05,
"eval_wer": 0.6381322957198443,
"step": 608
},
{
"epoch": 76.23,
"learning_rate": 0.0002506329113924051,
"loss": 0.5979,
"step": 610
},
{
"epoch": 76.9,
"eval_loss": 2.1425106525421143,
"eval_runtime": 7.6456,
"eval_samples_per_second": 8.24,
"eval_steps_per_second": 1.046,
"eval_wer": 0.6330439988027536,
"step": 616
},
{
"epoch": 77.45,
"learning_rate": 0.0002481012658227848,
"loss": 0.5525,
"step": 620
},
{
"epoch": 77.9,
"eval_loss": 2.1255650520324707,
"eval_runtime": 7.6228,
"eval_samples_per_second": 8.265,
"eval_steps_per_second": 1.049,
"eval_wer": 0.6303501945525292,
"step": 624
},
{
"epoch": 78.68,
"learning_rate": 0.0002455696202531646,
"loss": 0.5197,
"step": 630
},
{
"epoch": 78.9,
"eval_loss": 2.0801608562469482,
"eval_runtime": 7.634,
"eval_samples_per_second": 8.253,
"eval_steps_per_second": 1.048,
"eval_wer": 0.631248129302604,
"step": 632
},
{
"epoch": 79.9,
"learning_rate": 0.00024303797468354434,
"loss": 0.5509,
"step": 640
},
{
"epoch": 79.9,
"eval_loss": 2.110111713409424,
"eval_runtime": 7.6969,
"eval_samples_per_second": 8.185,
"eval_steps_per_second": 1.039,
"eval_wer": 0.6369350493864112,
"step": 640
},
{
"epoch": 80.9,
"eval_loss": 2.078524112701416,
"eval_runtime": 7.7231,
"eval_samples_per_second": 8.157,
"eval_steps_per_second": 1.036,
"eval_wer": 0.6348398683029033,
"step": 648
},
{
"epoch": 81.23,
"learning_rate": 0.00024050632911392405,
"loss": 0.6176,
"step": 650
},
{
"epoch": 81.9,
"eval_loss": 2.0631349086761475,
"eval_runtime": 7.6229,
"eval_samples_per_second": 8.265,
"eval_steps_per_second": 1.049,
"eval_wer": 0.6270577671355881,
"step": 656
},
{
"epoch": 82.45,
"learning_rate": 0.0002379746835443038,
"loss": 0.5294,
"step": 660
},
{
"epoch": 82.9,
"eval_loss": 2.1448206901550293,
"eval_runtime": 7.5975,
"eval_samples_per_second": 8.292,
"eval_steps_per_second": 1.053,
"eval_wer": 0.6357378030529781,
"step": 664
},
{
"epoch": 83.68,
"learning_rate": 0.00023544303797468357,
"loss": 0.5399,
"step": 670
},
{
"epoch": 83.9,
"eval_loss": 2.2992684841156006,
"eval_runtime": 7.6959,
"eval_samples_per_second": 8.186,
"eval_steps_per_second": 1.04,
"eval_wer": 0.6423226578868603,
"step": 672
},
{
"epoch": 84.9,
"learning_rate": 0.0002329113924050633,
"loss": 0.5507,
"step": 680
},
{
"epoch": 84.9,
"eval_loss": 2.242187976837158,
"eval_runtime": 7.6929,
"eval_samples_per_second": 8.189,
"eval_steps_per_second": 1.04,
"eval_wer": 0.6441185273870099,
"step": 680
},
{
"epoch": 85.9,
"eval_loss": 2.1182749271392822,
"eval_runtime": 7.6056,
"eval_samples_per_second": 8.283,
"eval_steps_per_second": 1.052,
"eval_wer": 0.6429212810535768,
"step": 688
},
{
"epoch": 86.23,
"learning_rate": 0.00023037974683544303,
"loss": 0.5813,
"step": 690
},
{
"epoch": 86.9,
"eval_loss": 2.162194013595581,
"eval_runtime": 7.6302,
"eval_samples_per_second": 8.257,
"eval_steps_per_second": 1.048,
"eval_wer": 0.6408260999700689,
"step": 696
},
{
"epoch": 87.45,
"learning_rate": 0.0002278481012658228,
"loss": 0.5319,
"step": 700
},
{
"epoch": 87.9,
"eval_loss": 2.0702972412109375,
"eval_runtime": 7.6258,
"eval_samples_per_second": 8.261,
"eval_steps_per_second": 1.049,
"eval_wer": 0.6363364262196947,
"step": 704
},
{
"epoch": 88.68,
"learning_rate": 0.00022531645569620254,
"loss": 0.5247,
"step": 710
},
{
"epoch": 88.9,
"eval_loss": 2.1978485584259033,
"eval_runtime": 7.6643,
"eval_samples_per_second": 8.22,
"eval_steps_per_second": 1.044,
"eval_wer": 0.6411254115534272,
"step": 712
},
{
"epoch": 89.9,
"learning_rate": 0.0002227848101265823,
"loss": 0.5607,
"step": 720
},
{
"epoch": 89.9,
"eval_loss": 2.307122230529785,
"eval_runtime": 7.6348,
"eval_samples_per_second": 8.252,
"eval_steps_per_second": 1.048,
"eval_wer": 0.6411254115534272,
"step": 720
},
{
"epoch": 90.9,
"eval_loss": 2.2638070583343506,
"eval_runtime": 7.6046,
"eval_samples_per_second": 8.285,
"eval_steps_per_second": 1.052,
"eval_wer": 0.6303501945525292,
"step": 728
},
{
"epoch": 91.23,
"learning_rate": 0.00022025316455696206,
"loss": 0.5796,
"step": 730
},
{
"epoch": 91.9,
"eval_loss": 2.1073036193847656,
"eval_runtime": 7.6773,
"eval_samples_per_second": 8.206,
"eval_steps_per_second": 1.042,
"eval_wer": 0.6441185273870099,
"step": 736
},
{
"epoch": 92.45,
"learning_rate": 0.00021772151898734177,
"loss": 0.5521,
"step": 740
},
{
"epoch": 92.9,
"eval_loss": 2.057901620864868,
"eval_runtime": 7.5831,
"eval_samples_per_second": 8.308,
"eval_steps_per_second": 1.055,
"eval_wer": 0.6456150853038013,
"step": 744
},
{
"epoch": 93.68,
"learning_rate": 0.00021518987341772152,
"loss": 0.5625,
"step": 750
},
{
"epoch": 93.9,
"eval_loss": 2.0663516521453857,
"eval_runtime": 7.623,
"eval_samples_per_second": 8.264,
"eval_steps_per_second": 1.049,
"eval_wer": 0.6501047590541754,
"step": 752
},
{
"epoch": 94.9,
"learning_rate": 0.00021265822784810126,
"loss": 0.5901,
"step": 760
},
{
"epoch": 94.9,
"eval_loss": 2.0674116611480713,
"eval_runtime": 7.5478,
"eval_samples_per_second": 8.347,
"eval_steps_per_second": 1.06,
"eval_wer": 0.6327446872193954,
"step": 760
},
{
"epoch": 95.9,
"eval_loss": 2.185175895690918,
"eval_runtime": 7.6051,
"eval_samples_per_second": 8.284,
"eval_steps_per_second": 1.052,
"eval_wer": 0.6381322957198443,
"step": 768
},
{
"epoch": 96.23,
"learning_rate": 0.00021012658227848103,
"loss": 0.5974,
"step": 770
},
{
"epoch": 96.9,
"eval_loss": 2.2212321758270264,
"eval_runtime": 7.6016,
"eval_samples_per_second": 8.288,
"eval_steps_per_second": 1.052,
"eval_wer": 0.6387309188865609,
"step": 776
},
{
"epoch": 97.45,
"learning_rate": 0.00020759493670886078,
"loss": 0.5359,
"step": 780
},
{
"epoch": 97.9,
"eval_loss": 2.1027910709381104,
"eval_runtime": 7.6755,
"eval_samples_per_second": 8.208,
"eval_steps_per_second": 1.042,
"eval_wer": 0.6390302304699191,
"step": 784
},
{
"epoch": 98.68,
"learning_rate": 0.0002050632911392405,
"loss": 0.5643,
"step": 790
},
{
"epoch": 98.9,
"eval_loss": 2.1437582969665527,
"eval_runtime": 7.7627,
"eval_samples_per_second": 8.116,
"eval_steps_per_second": 1.031,
"eval_wer": 0.6516013169709668,
"step": 792
},
{
"epoch": 99.9,
"learning_rate": 0.00020253164556962027,
"loss": 0.5488,
"step": 800
},
{
"epoch": 99.9,
"eval_loss": 2.1104142665863037,
"eval_runtime": 7.5682,
"eval_samples_per_second": 8.324,
"eval_steps_per_second": 1.057,
"eval_wer": 0.6447171505537265,
"step": 800
},
{
"epoch": 100.9,
"eval_loss": 2.1389875411987305,
"eval_runtime": 7.6495,
"eval_samples_per_second": 8.236,
"eval_steps_per_second": 1.046,
"eval_wer": 0.639928165219994,
"step": 808
},
{
"epoch": 101.23,
"learning_rate": 0.0002,
"loss": 0.5906,
"step": 810
},
{
"epoch": 101.9,
"eval_loss": 2.3832998275756836,
"eval_runtime": 7.5968,
"eval_samples_per_second": 8.293,
"eval_steps_per_second": 1.053,
"eval_wer": 0.6387309188865609,
"step": 816
},
{
"epoch": 102.45,
"learning_rate": 0.00019746835443037975,
"loss": 0.5735,
"step": 820
},
{
"epoch": 102.9,
"eval_loss": 2.4907209873199463,
"eval_runtime": 7.6164,
"eval_samples_per_second": 8.272,
"eval_steps_per_second": 1.05,
"eval_wer": 0.6303501945525292,
"step": 824
},
{
"epoch": 103.68,
"learning_rate": 0.0001949367088607595,
"loss": 0.5617,
"step": 830
},
{
"epoch": 103.9,
"eval_loss": 2.117652416229248,
"eval_runtime": 7.5597,
"eval_samples_per_second": 8.334,
"eval_steps_per_second": 1.058,
"eval_wer": 0.6438192158036516,
"step": 832
},
{
"epoch": 104.9,
"learning_rate": 0.00019240506329113924,
"loss": 0.5547,
"step": 840
},
{
"epoch": 104.9,
"eval_loss": 2.0854134559631348,
"eval_runtime": 7.6526,
"eval_samples_per_second": 8.233,
"eval_steps_per_second": 1.045,
"eval_wer": 0.6366357378030529,
"step": 840
},
{
"epoch": 105.9,
"eval_loss": 2.1921279430389404,
"eval_runtime": 7.5438,
"eval_samples_per_second": 8.351,
"eval_steps_per_second": 1.06,
"eval_wer": 0.6411254115534272,
"step": 848
},
{
"epoch": 106.23,
"learning_rate": 0.00018987341772151899,
"loss": 0.5805,
"step": 850
},
{
"epoch": 106.9,
"eval_loss": 2.275364398956299,
"eval_runtime": 7.657,
"eval_samples_per_second": 8.228,
"eval_steps_per_second": 1.045,
"eval_wer": 0.631248129302604,
"step": 856
},
{
"epoch": 107.45,
"learning_rate": 0.00018734177215189873,
"loss": 0.5455,
"step": 860
},
{
"epoch": 107.9,
"eval_loss": 2.280198574066162,
"eval_runtime": 7.6544,
"eval_samples_per_second": 8.231,
"eval_steps_per_second": 1.045,
"eval_wer": 0.6348398683029033,
"step": 864
},
{
"epoch": 108.68,
"learning_rate": 0.0001848101265822785,
"loss": 0.5342,
"step": 870
},
{
"epoch": 108.9,
"eval_loss": 2.321939468383789,
"eval_runtime": 7.6518,
"eval_samples_per_second": 8.233,
"eval_steps_per_second": 1.045,
"eval_wer": 0.6324453756360371,
"step": 872
},
{
"epoch": 109.9,
"learning_rate": 0.00018227848101265824,
"loss": 0.5372,
"step": 880
},
{
"epoch": 109.9,
"eval_loss": 2.090009927749634,
"eval_runtime": 7.6209,
"eval_samples_per_second": 8.267,
"eval_steps_per_second": 1.05,
"eval_wer": 0.6423226578868603,
"step": 880
},
{
"epoch": 110.9,
"eval_loss": 1.9904694557189941,
"eval_runtime": 7.6862,
"eval_samples_per_second": 8.196,
"eval_steps_per_second": 1.041,
"eval_wer": 0.6351391798862616,
"step": 888
},
{
"epoch": 111.23,
"learning_rate": 0.000179746835443038,
"loss": 0.6146,
"step": 890
},
{
"epoch": 111.9,
"eval_loss": 2.2073147296905518,
"eval_runtime": 7.7334,
"eval_samples_per_second": 8.146,
"eval_steps_per_second": 1.034,
"eval_wer": 0.6294522598024543,
"step": 896
},
{
"epoch": 112.45,
"learning_rate": 0.00017721518987341773,
"loss": 0.5517,
"step": 900
},
{
"epoch": 112.9,
"eval_loss": 2.2817723751068115,
"eval_runtime": 7.6895,
"eval_samples_per_second": 8.193,
"eval_steps_per_second": 1.04,
"eval_wer": 0.6387309188865609,
"step": 904
},
{
"epoch": 113.68,
"learning_rate": 0.00017468354430379748,
"loss": 0.5501,
"step": 910
},
{
"epoch": 113.9,
"eval_loss": 2.4255876541137695,
"eval_runtime": 7.5778,
"eval_samples_per_second": 8.314,
"eval_steps_per_second": 1.056,
"eval_wer": 0.6318467524693205,
"step": 912
},
{
"epoch": 114.9,
"learning_rate": 0.00017215189873417722,
"loss": 0.5469,
"step": 920
},
{
"epoch": 114.9,
"eval_loss": 2.2073605060577393,
"eval_runtime": 7.6787,
"eval_samples_per_second": 8.205,
"eval_steps_per_second": 1.042,
"eval_wer": 0.6411254115534272,
"step": 920
},
{
"epoch": 115.9,
"eval_loss": 2.2370004653930664,
"eval_runtime": 7.5756,
"eval_samples_per_second": 8.316,
"eval_steps_per_second": 1.056,
"eval_wer": 0.6282550134690212,
"step": 928
},
{
"epoch": 116.23,
"learning_rate": 0.00016962025316455696,
"loss": 0.6065,
"step": 930
},
{
"epoch": 116.9,
"eval_loss": 2.2338502407073975,
"eval_runtime": 7.6802,
"eval_samples_per_second": 8.203,
"eval_steps_per_second": 1.042,
"eval_wer": 0.6267584555522299,
"step": 936
},
{
"epoch": 117.45,
"learning_rate": 0.0001670886075949367,
"loss": 0.5265,
"step": 940
},
{
"epoch": 117.9,
"eval_loss": 2.2717647552490234,
"eval_runtime": 7.6002,
"eval_samples_per_second": 8.289,
"eval_steps_per_second": 1.053,
"eval_wer": 0.6234660281352888,
"step": 944
},
{
"epoch": 118.68,
"learning_rate": 0.00016455696202531648,
"loss": 0.512,
"step": 950
},
{
"epoch": 118.9,
"eval_loss": 2.1963329315185547,
"eval_runtime": 7.6507,
"eval_samples_per_second": 8.235,
"eval_steps_per_second": 1.046,
"eval_wer": 0.6333433103861119,
"step": 952
},
{
"epoch": 119.9,
"learning_rate": 0.0001620253164556962,
"loss": 0.5571,
"step": 960
},
{
"epoch": 119.9,
"eval_loss": 2.2201318740844727,
"eval_runtime": 7.6307,
"eval_samples_per_second": 8.256,
"eval_steps_per_second": 1.048,
"eval_wer": 0.6348398683029033,
"step": 960
},
{
"epoch": 120.9,
"eval_loss": 2.110605478286743,
"eval_runtime": 7.6664,
"eval_samples_per_second": 8.218,
"eval_steps_per_second": 1.044,
"eval_wer": 0.6330439988027536,
"step": 968
},
{
"epoch": 121.23,
"learning_rate": 0.00015949367088607597,
"loss": 0.5778,
"step": 970
},
{
"epoch": 121.9,
"eval_loss": 2.3301584720611572,
"eval_runtime": 7.7674,
"eval_samples_per_second": 8.111,
"eval_steps_per_second": 1.03,
"eval_wer": 0.6306495061358874,
"step": 976
},
{
"epoch": 122.45,
"learning_rate": 0.00015696202531645568,
"loss": 0.539,
"step": 980
},
{
"epoch": 122.9,
"eval_loss": 2.371450662612915,
"eval_runtime": 7.6444,
"eval_samples_per_second": 8.241,
"eval_steps_per_second": 1.047,
"eval_wer": 0.6273570787189464,
"step": 984
},
{
"epoch": 123.68,
"learning_rate": 0.00015443037974683546,
"loss": 0.5306,
"step": 990
},
{
"epoch": 123.9,
"eval_loss": 2.241682529449463,
"eval_runtime": 7.5759,
"eval_samples_per_second": 8.316,
"eval_steps_per_second": 1.056,
"eval_wer": 0.6351391798862616,
"step": 992
},
{
"epoch": 124.9,
"learning_rate": 0.0001518987341772152,
"loss": 0.5271,
"step": 1000
},
{
"epoch": 124.9,
"eval_loss": 2.169471502304077,
"eval_runtime": 7.5614,
"eval_samples_per_second": 8.332,
"eval_steps_per_second": 1.058,
"eval_wer": 0.6249625860520802,
"step": 1000
},
{
"epoch": 125.9,
"eval_loss": 2.1912169456481934,
"eval_runtime": 7.6883,
"eval_samples_per_second": 8.194,
"eval_steps_per_second": 1.041,
"eval_wer": 0.627955701885663,
"step": 1008
},
{
"epoch": 126.23,
"learning_rate": 0.00014936708860759494,
"loss": 0.5766,
"step": 1010
},
{
"epoch": 126.9,
"eval_loss": 2.1122422218322754,
"eval_runtime": 7.6874,
"eval_samples_per_second": 8.195,
"eval_steps_per_second": 1.041,
"eval_wer": 0.6339419335528285,
"step": 1016
},
{
"epoch": 127.45,
"learning_rate": 0.0001468354430379747,
"loss": 0.5483,
"step": 1020
},
{
"epoch": 127.9,
"eval_loss": 2.0696394443511963,
"eval_runtime": 7.6797,
"eval_samples_per_second": 8.203,
"eval_steps_per_second": 1.042,
"eval_wer": 0.6321460640526788,
"step": 1024
},
{
"epoch": 128.68,
"learning_rate": 0.00014430379746835443,
"loss": 0.5414,
"step": 1030
},
{
"epoch": 128.9,
"eval_loss": 2.093480348587036,
"eval_runtime": 7.6571,
"eval_samples_per_second": 8.228,
"eval_steps_per_second": 1.045,
"eval_wer": 0.6315474408859623,
"step": 1032
},
{
"epoch": 129.9,
"learning_rate": 0.00014177215189873418,
"loss": 0.5125,
"step": 1040
},
{
"epoch": 129.9,
"eval_loss": 2.1692750453948975,
"eval_runtime": 7.609,
"eval_samples_per_second": 8.28,
"eval_steps_per_second": 1.051,
"eval_wer": 0.6336426219694702,
"step": 1040
},
{
"epoch": 130.9,
"eval_loss": 2.135119915008545,
"eval_runtime": 7.7121,
"eval_samples_per_second": 8.169,
"eval_steps_per_second": 1.037,
"eval_wer": 0.6315474408859623,
"step": 1048
},
{
"epoch": 131.23,
"learning_rate": 0.00013924050632911395,
"loss": 0.5733,
"step": 1050
},
{
"epoch": 131.9,
"eval_loss": 2.1570212841033936,
"eval_runtime": 7.6856,
"eval_samples_per_second": 8.197,
"eval_steps_per_second": 1.041,
"eval_wer": 0.6405267883867105,
"step": 1056
},
{
"epoch": 132.45,
"learning_rate": 0.00013670886075949366,
"loss": 0.5285,
"step": 1060
},
{
"epoch": 132.9,
"eval_loss": 2.1996734142303467,
"eval_runtime": 7.7021,
"eval_samples_per_second": 8.18,
"eval_steps_per_second": 1.039,
"eval_wer": 0.6309488177192457,
"step": 1064
},
{
"epoch": 133.68,
"learning_rate": 0.00013417721518987343,
"loss": 0.5426,
"step": 1070
},
{
"epoch": 133.9,
"eval_loss": 2.1216108798980713,
"eval_runtime": 7.7071,
"eval_samples_per_second": 8.174,
"eval_steps_per_second": 1.038,
"eval_wer": 0.6321460640526788,
"step": 1072
},
{
"epoch": 134.9,
"learning_rate": 0.00013164556962025315,
"loss": 0.5018,
"step": 1080
},
{
"epoch": 134.9,
"eval_loss": 2.174179792404175,
"eval_runtime": 7.6539,
"eval_samples_per_second": 8.231,
"eval_steps_per_second": 1.045,
"eval_wer": 0.6246632744687219,
"step": 1080
},
{
"epoch": 135.9,
"eval_loss": 2.120788335800171,
"eval_runtime": 7.6772,
"eval_samples_per_second": 8.206,
"eval_steps_per_second": 1.042,
"eval_wer": 0.6303501945525292,
"step": 1088
},
{
"epoch": 136.23,
"learning_rate": 0.00012911392405063292,
"loss": 0.5611,
"step": 1090
},
{
"epoch": 136.9,
"eval_loss": 2.122828483581543,
"eval_runtime": 7.6522,
"eval_samples_per_second": 8.233,
"eval_steps_per_second": 1.045,
"eval_wer": 0.6303501945525292,
"step": 1096
},
{
"epoch": 137.45,
"learning_rate": 0.00012658227848101267,
"loss": 0.5258,
"step": 1100
},
{
"epoch": 137.9,
"eval_loss": 2.225569248199463,
"eval_runtime": 7.692,
"eval_samples_per_second": 8.19,
"eval_steps_per_second": 1.04,
"eval_wer": 0.6309488177192457,
"step": 1104
},
{
"epoch": 138.68,
"learning_rate": 0.0001240506329113924,
"loss": 0.5364,
"step": 1110
},
{
"epoch": 138.9,
"eval_loss": 2.162257432937622,
"eval_runtime": 7.6234,
"eval_samples_per_second": 8.264,
"eval_steps_per_second": 1.049,
"eval_wer": 0.6306495061358874,
"step": 1112
},
{
"epoch": 139.9,
"learning_rate": 0.00012151898734177217,
"loss": 0.528,
"step": 1120
},
{
"epoch": 139.9,
"eval_loss": 2.0063600540161133,
"eval_runtime": 7.6673,
"eval_samples_per_second": 8.217,
"eval_steps_per_second": 1.043,
"eval_wer": 0.6288536366357378,
"step": 1120
},
{
"epoch": 140.9,
"eval_loss": 2.0472218990325928,
"eval_runtime": 7.572,
"eval_samples_per_second": 8.32,
"eval_steps_per_second": 1.057,
"eval_wer": 0.6297515713858126,
"step": 1128
},
{
"epoch": 141.23,
"learning_rate": 0.0001189873417721519,
"loss": 0.5637,
"step": 1130
},
{
"epoch": 141.9,
"eval_loss": 2.190746307373047,
"eval_runtime": 7.6599,
"eval_samples_per_second": 8.225,
"eval_steps_per_second": 1.044,
"eval_wer": 0.6318467524693205,
"step": 1136
},
{
"epoch": 142.45,
"learning_rate": 0.00011645569620253166,
"loss": 0.5051,
"step": 1140
},
{
"epoch": 142.9,
"eval_loss": 2.156960964202881,
"eval_runtime": 7.648,
"eval_samples_per_second": 8.237,
"eval_steps_per_second": 1.046,
"eval_wer": 0.6291529482190961,
"step": 1144
},
{
"epoch": 143.68,
"learning_rate": 0.0001139240506329114,
"loss": 0.523,
"step": 1150
},
{
"epoch": 143.9,
"eval_loss": 2.049663782119751,
"eval_runtime": 7.6935,
"eval_samples_per_second": 8.189,
"eval_steps_per_second": 1.04,
"eval_wer": 0.6423226578868603,
"step": 1152
},
{
"epoch": 144.9,
"learning_rate": 0.00011139240506329114,
"loss": 0.5516,
"step": 1160
},
{
"epoch": 144.9,
"eval_loss": 2.090688467025757,
"eval_runtime": 7.6869,
"eval_samples_per_second": 8.196,
"eval_steps_per_second": 1.041,
"eval_wer": 0.6324453756360371,
"step": 1160
},
{
"epoch": 145.9,
"eval_loss": 2.147946357727051,
"eval_runtime": 7.6864,
"eval_samples_per_second": 8.196,
"eval_steps_per_second": 1.041,
"eval_wer": 0.6309488177192457,
"step": 1168
},
{
"epoch": 146.23,
"learning_rate": 0.00010886075949367089,
"loss": 0.5524,
"step": 1170
},
{
"epoch": 146.9,
"eval_loss": 2.0570223331451416,
"eval_runtime": 7.5902,
"eval_samples_per_second": 8.3,
"eval_steps_per_second": 1.054,
"eval_wer": 0.6273570787189464,
"step": 1176
},
{
"epoch": 147.45,
"learning_rate": 0.00010632911392405063,
"loss": 0.5215,
"step": 1180
},
{
"epoch": 147.9,
"eval_loss": 2.137968063354492,
"eval_runtime": 7.6003,
"eval_samples_per_second": 8.289,
"eval_steps_per_second": 1.053,
"eval_wer": 0.6339419335528285,
"step": 1184
},
{
"epoch": 148.68,
"learning_rate": 0.00010379746835443039,
"loss": 0.5447,
"step": 1190
},
{
"epoch": 148.9,
"eval_loss": 2.2314438819885254,
"eval_runtime": 7.671,
"eval_samples_per_second": 8.213,
"eval_steps_per_second": 1.043,
"eval_wer": 0.6303501945525292,
"step": 1192
},
{
"epoch": 149.9,
"learning_rate": 0.00010126582278481013,
"loss": 0.521,
"step": 1200
},
{
"epoch": 149.9,
"eval_loss": 2.147305727005005,
"eval_runtime": 7.6063,
"eval_samples_per_second": 8.283,
"eval_steps_per_second": 1.052,
"eval_wer": 0.6333433103861119,
"step": 1200
},
{
"epoch": 150.9,
"eval_loss": 2.1240322589874268,
"eval_runtime": 7.5902,
"eval_samples_per_second": 8.3,
"eval_steps_per_second": 1.054,
"eval_wer": 0.6291529482190961,
"step": 1208
},
{
"epoch": 151.23,
"learning_rate": 9.873417721518988e-05,
"loss": 0.5501,
"step": 1210
},
{
"epoch": 151.9,
"eval_loss": 2.1305501461029053,
"eval_runtime": 7.5935,
"eval_samples_per_second": 8.297,
"eval_steps_per_second": 1.054,
"eval_wer": 0.6216701586351392,
"step": 1216
},
{
"epoch": 152.45,
"learning_rate": 9.620253164556962e-05,
"loss": 0.5309,
"step": 1220
},
{
"epoch": 152.9,
"eval_loss": 2.1293582916259766,
"eval_runtime": 7.5958,
"eval_samples_per_second": 8.294,
"eval_steps_per_second": 1.053,
"eval_wer": 0.6315474408859623,
"step": 1224
},
{
"epoch": 153.68,
"learning_rate": 9.367088607594936e-05,
"loss": 0.5293,
"step": 1230
},
{
"epoch": 153.9,
"eval_loss": 2.2012763023376465,
"eval_runtime": 7.6851,
"eval_samples_per_second": 8.198,
"eval_steps_per_second": 1.041,
"eval_wer": 0.6285543250523795,
"step": 1232
},
{
"epoch": 154.9,
"learning_rate": 9.113924050632912e-05,
"loss": 0.4898,
"step": 1240
},
{
"epoch": 154.9,
"eval_loss": 2.216932773590088,
"eval_runtime": 7.6132,
"eval_samples_per_second": 8.275,
"eval_steps_per_second": 1.051,
"eval_wer": 0.6291529482190961,
"step": 1240
},
{
"epoch": 155.9,
"eval_loss": 2.2271268367767334,
"eval_runtime": 7.5691,
"eval_samples_per_second": 8.323,
"eval_steps_per_second": 1.057,
"eval_wer": 0.6237653397186471,
"step": 1248
},
{
"epoch": 156.23,
"learning_rate": 8.860759493670887e-05,
"loss": 0.559,
"step": 1250
},
{
"epoch": 156.9,
"eval_loss": 2.1803646087646484,
"eval_runtime": 7.6189,
"eval_samples_per_second": 8.269,
"eval_steps_per_second": 1.05,
"eval_wer": 0.6276563903023047,
"step": 1256
},
{
"epoch": 157.45,
"learning_rate": 8.607594936708861e-05,
"loss": 0.5451,
"step": 1260
},
{
"epoch": 157.9,
"eval_loss": 2.1884472370147705,
"eval_runtime": 7.7078,
"eval_samples_per_second": 8.174,
"eval_steps_per_second": 1.038,
"eval_wer": 0.6303501945525292,
"step": 1264
},
{
"epoch": 158.68,
"learning_rate": 8.354430379746835e-05,
"loss": 0.5072,
"step": 1270
},
{
"epoch": 158.9,
"eval_loss": 2.229902505874634,
"eval_runtime": 7.6574,
"eval_samples_per_second": 8.227,
"eval_steps_per_second": 1.045,
"eval_wer": 0.6309488177192457,
"step": 1272
},
{
"epoch": 159.9,
"learning_rate": 8.10126582278481e-05,
"loss": 0.5259,
"step": 1280
},
{
"epoch": 159.9,
"eval_loss": 2.16611909866333,
"eval_runtime": 7.6474,
"eval_samples_per_second": 8.238,
"eval_steps_per_second": 1.046,
"eval_wer": 0.625860520802155,
"step": 1280
},
{
"epoch": 160.9,
"eval_loss": 2.157914638519287,
"eval_runtime": 7.699,
"eval_samples_per_second": 8.183,
"eval_steps_per_second": 1.039,
"eval_wer": 0.6264591439688716,
"step": 1288
},
{
"epoch": 161.23,
"learning_rate": 7.848101265822784e-05,
"loss": 0.5609,
"step": 1290
},
{
"epoch": 161.9,
"eval_loss": 2.2085673809051514,
"eval_runtime": 7.6653,
"eval_samples_per_second": 8.219,
"eval_steps_per_second": 1.044,
"eval_wer": 0.6168811733014068,
"step": 1296
},
{
"epoch": 162.45,
"learning_rate": 7.59493670886076e-05,
"loss": 0.5168,
"step": 1300
},
{
"epoch": 162.9,
"eval_loss": 2.146618366241455,
"eval_runtime": 7.6769,
"eval_samples_per_second": 8.206,
"eval_steps_per_second": 1.042,
"eval_wer": 0.6222687818018557,
"step": 1304
},
{
"epoch": 163.68,
"learning_rate": 7.341772151898734e-05,
"loss": 0.4984,
"step": 1310
},
{
"epoch": 163.9,
"eval_loss": 2.141826868057251,
"eval_runtime": 7.6477,
"eval_samples_per_second": 8.238,
"eval_steps_per_second": 1.046,
"eval_wer": 0.625860520802155,
"step": 1312
},
{
"epoch": 164.9,
"learning_rate": 7.088607594936709e-05,
"loss": 0.5254,
"step": 1320
},
{
"epoch": 164.9,
"eval_loss": 2.117159605026245,
"eval_runtime": 7.6915,
"eval_samples_per_second": 8.191,
"eval_steps_per_second": 1.04,
"eval_wer": 0.6282550134690212,
"step": 1320
},
{
"epoch": 165.9,
"eval_loss": 2.091912031173706,
"eval_runtime": 7.6372,
"eval_samples_per_second": 8.249,
"eval_steps_per_second": 1.048,
"eval_wer": 0.6246632744687219,
"step": 1328
},
{
"epoch": 166.23,
"learning_rate": 6.835443037974683e-05,
"loss": 0.5685,
"step": 1330
},
{
"epoch": 166.9,
"eval_loss": 2.1054956912994385,
"eval_runtime": 7.6658,
"eval_samples_per_second": 8.218,
"eval_steps_per_second": 1.044,
"eval_wer": 0.6261598323855133,
"step": 1336
},
{
"epoch": 167.45,
"learning_rate": 6.582278481012658e-05,
"loss": 0.4952,
"step": 1340
},
{
"epoch": 167.9,
"eval_loss": 2.083932638168335,
"eval_runtime": 7.6404,
"eval_samples_per_second": 8.246,
"eval_steps_per_second": 1.047,
"eval_wer": 0.6252618976354385,
"step": 1344
},
{
"epoch": 168.68,
"learning_rate": 6.329113924050633e-05,
"loss": 0.5024,
"step": 1350
},
{
"epoch": 168.9,
"eval_loss": 2.0244107246398926,
"eval_runtime": 7.6196,
"eval_samples_per_second": 8.268,
"eval_steps_per_second": 1.05,
"eval_wer": 0.6255612092187968,
"step": 1352
},
{
"epoch": 169.9,
"learning_rate": 6.0759493670886084e-05,
"loss": 0.5028,
"step": 1360
},
{
"epoch": 169.9,
"eval_loss": 2.0157837867736816,
"eval_runtime": 7.7009,
"eval_samples_per_second": 8.181,
"eval_steps_per_second": 1.039,
"eval_wer": 0.6240646513020054,
"step": 1360
},
{
"epoch": 170.9,
"eval_loss": 2.009673833847046,
"eval_runtime": 7.6823,
"eval_samples_per_second": 8.201,
"eval_steps_per_second": 1.041,
"eval_wer": 0.6240646513020054,
"step": 1368
},
{
"epoch": 171.23,
"learning_rate": 5.822784810126583e-05,
"loss": 0.5731,
"step": 1370
},
{
"epoch": 171.9,
"eval_loss": 1.988526463508606,
"eval_runtime": 7.6305,
"eval_samples_per_second": 8.256,
"eval_steps_per_second": 1.048,
"eval_wer": 0.6216701586351392,
"step": 1376
},
{
"epoch": 172.45,
"learning_rate": 5.569620253164557e-05,
"loss": 0.4829,
"step": 1380
},
{
"epoch": 172.9,
"eval_loss": 1.9991979598999023,
"eval_runtime": 7.591,
"eval_samples_per_second": 8.299,
"eval_steps_per_second": 1.054,
"eval_wer": 0.6237653397186471,
"step": 1384
},
{
"epoch": 173.68,
"learning_rate": 5.3164556962025316e-05,
"loss": 0.5101,
"step": 1390
},
{
"epoch": 173.9,
"eval_loss": 1.9918380975723267,
"eval_runtime": 7.7023,
"eval_samples_per_second": 8.179,
"eval_steps_per_second": 1.039,
"eval_wer": 0.6210715354684226,
"step": 1392
},
{
"epoch": 174.9,
"learning_rate": 5.0632911392405066e-05,
"loss": 0.5058,
"step": 1400
},
{
"epoch": 174.9,
"eval_loss": 1.9633089303970337,
"eval_runtime": 7.6237,
"eval_samples_per_second": 8.264,
"eval_steps_per_second": 1.049,
"eval_wer": 0.6282550134690212,
"step": 1400
},
{
"epoch": 175.9,
"eval_loss": 1.9551260471343994,
"eval_runtime": 7.6939,
"eval_samples_per_second": 8.188,
"eval_steps_per_second": 1.04,
"eval_wer": 0.6228674049685723,
"step": 1408
},
{
"epoch": 176.23,
"learning_rate": 4.810126582278481e-05,
"loss": 0.5182,
"step": 1410
},
{
"epoch": 176.9,
"eval_loss": 2.016941785812378,
"eval_runtime": 7.658,
"eval_samples_per_second": 8.227,
"eval_steps_per_second": 1.045,
"eval_wer": 0.6162825501346902,
"step": 1416
},
{
"epoch": 177.45,
"learning_rate": 4.556962025316456e-05,
"loss": 0.5443,
"step": 1420
},
{
"epoch": 177.9,
"eval_loss": 2.016011953353882,
"eval_runtime": 7.599,
"eval_samples_per_second": 8.291,
"eval_steps_per_second": 1.053,
"eval_wer": 0.6186770428015564,
"step": 1424
},
{
"epoch": 178.68,
"learning_rate": 4.3037974683544305e-05,
"loss": 0.522,
"step": 1430
},
{
"epoch": 178.9,
"eval_loss": 2.060013771057129,
"eval_runtime": 7.6526,
"eval_samples_per_second": 8.232,
"eval_steps_per_second": 1.045,
"eval_wer": 0.6177791080514816,
"step": 1432
},
{
"epoch": 179.9,
"learning_rate": 4.050632911392405e-05,
"loss": 0.5042,
"step": 1440
},
{
"epoch": 179.9,
"eval_loss": 2.036672353744507,
"eval_runtime": 7.6364,
"eval_samples_per_second": 8.25,
"eval_steps_per_second": 1.048,
"eval_wer": 0.625860520802155,
"step": 1440
},
{
"epoch": 180.9,
"eval_loss": 2.071685314178467,
"eval_runtime": 7.672,
"eval_samples_per_second": 8.212,
"eval_steps_per_second": 1.043,
"eval_wer": 0.6186770428015564,
"step": 1448
},
{
"epoch": 181.23,
"learning_rate": 3.79746835443038e-05,
"loss": 0.5486,
"step": 1450
},
{
"epoch": 181.9,
"eval_loss": 2.058335304260254,
"eval_runtime": 7.6269,
"eval_samples_per_second": 8.26,
"eval_steps_per_second": 1.049,
"eval_wer": 0.6252618976354385,
"step": 1456
},
{
"epoch": 182.45,
"learning_rate": 3.5443037974683544e-05,
"loss": 0.4946,
"step": 1460
},
{
"epoch": 182.9,
"eval_loss": 2.067958116531372,
"eval_runtime": 7.6539,
"eval_samples_per_second": 8.231,
"eval_steps_per_second": 1.045,
"eval_wer": 0.6261598323855133,
"step": 1464
},
{
"epoch": 183.68,
"learning_rate": 3.291139240506329e-05,
"loss": 0.5056,
"step": 1470
},
{
"epoch": 183.9,
"eval_loss": 2.0846917629241943,
"eval_runtime": 7.6222,
"eval_samples_per_second": 8.265,
"eval_steps_per_second": 1.05,
"eval_wer": 0.6219694702184975,
"step": 1472
},
{
"epoch": 184.9,
"learning_rate": 3.0379746835443042e-05,
"loss": 0.513,
"step": 1480
},
{
"epoch": 184.9,
"eval_loss": 2.0797383785247803,
"eval_runtime": 7.7548,
"eval_samples_per_second": 8.124,
"eval_steps_per_second": 1.032,
"eval_wer": 0.6231667165519306,
"step": 1480
},
{
"epoch": 185.9,
"eval_loss": 2.056018590927124,
"eval_runtime": 7.6669,
"eval_samples_per_second": 8.217,
"eval_steps_per_second": 1.043,
"eval_wer": 0.622568093385214,
"step": 1488
},
{
"epoch": 186.23,
"learning_rate": 2.7848101265822786e-05,
"loss": 0.5334,
"step": 1490
},
{
"epoch": 186.9,
"eval_loss": 2.0349366664886475,
"eval_runtime": 7.6484,
"eval_samples_per_second": 8.237,
"eval_steps_per_second": 1.046,
"eval_wer": 0.6288536366357378,
"step": 1496
},
{
"epoch": 187.45,
"learning_rate": 2.5316455696202533e-05,
"loss": 0.5265,
"step": 1500
},
{
"epoch": 187.9,
"eval_loss": 2.0137064456939697,
"eval_runtime": 7.7543,
"eval_samples_per_second": 8.125,
"eval_steps_per_second": 1.032,
"eval_wer": 0.6276563903023047,
"step": 1504
},
{
"epoch": 188.68,
"learning_rate": 2.278481012658228e-05,
"loss": 0.5135,
"step": 1510
},
{
"epoch": 188.9,
"eval_loss": 2.022761106491089,
"eval_runtime": 7.6517,
"eval_samples_per_second": 8.233,
"eval_steps_per_second": 1.046,
"eval_wer": 0.625860520802155,
"step": 1512
},
{
"epoch": 189.9,
"learning_rate": 2.0253164556962025e-05,
"loss": 0.5062,
"step": 1520
},
{
"epoch": 189.9,
"eval_loss": 2.0344340801239014,
"eval_runtime": 7.6532,
"eval_samples_per_second": 8.232,
"eval_steps_per_second": 1.045,
"eval_wer": 0.6243639628853637,
"step": 1520
},
{
"epoch": 190.9,
"eval_loss": 2.02585768699646,
"eval_runtime": 7.6933,
"eval_samples_per_second": 8.189,
"eval_steps_per_second": 1.04,
"eval_wer": 0.6252618976354385,
"step": 1528
},
{
"epoch": 191.23,
"learning_rate": 1.7721518987341772e-05,
"loss": 0.5459,
"step": 1530
},
{
"epoch": 191.9,
"eval_loss": 2.019090175628662,
"eval_runtime": 7.6526,
"eval_samples_per_second": 8.233,
"eval_steps_per_second": 1.045,
"eval_wer": 0.6261598323855133,
"step": 1536
},
{
"epoch": 192.45,
"learning_rate": 1.5189873417721521e-05,
"loss": 0.4993,
"step": 1540
},
{
"epoch": 192.9,
"eval_loss": 2.0223634243011475,
"eval_runtime": 7.635,
"eval_samples_per_second": 8.251,
"eval_steps_per_second": 1.048,
"eval_wer": 0.6249625860520802,
"step": 1544
},
{
"epoch": 193.68,
"learning_rate": 1.2658227848101267e-05,
"loss": 0.4965,
"step": 1550
},
{
"epoch": 193.9,
"eval_loss": 2.0135087966918945,
"eval_runtime": 7.6082,
"eval_samples_per_second": 8.281,
"eval_steps_per_second": 1.051,
"eval_wer": 0.6273570787189464,
"step": 1552
},
{
"epoch": 194.9,
"learning_rate": 1.0126582278481012e-05,
"loss": 0.4827,
"step": 1560
},
{
"epoch": 194.9,
"eval_loss": 2.0026562213897705,
"eval_runtime": 7.6658,
"eval_samples_per_second": 8.218,
"eval_steps_per_second": 1.044,
"eval_wer": 0.6288536366357378,
"step": 1560
},
{
"epoch": 195.9,
"eval_loss": 2.006549119949341,
"eval_runtime": 7.6324,
"eval_samples_per_second": 8.254,
"eval_steps_per_second": 1.048,
"eval_wer": 0.6264591439688716,
"step": 1568
},
{
"epoch": 196.23,
"learning_rate": 7.5949367088607605e-06,
"loss": 0.5181,
"step": 1570
},
{
"epoch": 196.9,
"eval_loss": 2.0064003467559814,
"eval_runtime": 7.653,
"eval_samples_per_second": 8.232,
"eval_steps_per_second": 1.045,
"eval_wer": 0.6270577671355881,
"step": 1576
},
{
"epoch": 197.45,
"learning_rate": 5.063291139240506e-06,
"loss": 0.518,
"step": 1580
},
{
"epoch": 197.9,
"eval_loss": 2.007786750793457,
"eval_runtime": 7.6766,
"eval_samples_per_second": 8.207,
"eval_steps_per_second": 1.042,
"eval_wer": 0.6276563903023047,
"step": 1584
},
{
"epoch": 198.68,
"learning_rate": 2.531645569620253e-06,
"loss": 0.4807,
"step": 1590
},
{
"epoch": 198.9,
"eval_loss": 2.008424758911133,
"eval_runtime": 7.654,
"eval_samples_per_second": 8.231,
"eval_steps_per_second": 1.045,
"eval_wer": 0.6276563903023047,
"step": 1592
},
{
"epoch": 199.9,
"learning_rate": 0.0,
"loss": 0.5078,
"step": 1600
},
{
"epoch": 199.9,
"eval_loss": 2.008995532989502,
"eval_runtime": 7.6484,
"eval_samples_per_second": 8.237,
"eval_steps_per_second": 1.046,
"eval_wer": 0.6276563903023047,
"step": 1600
},
{
"epoch": 199.9,
"step": 1600,
"total_flos": 1.1848602213269387e+19,
"train_loss": 0.5738694608211518,
"train_runtime": 18463.351,
"train_samples_per_second": 6.099,
"train_steps_per_second": 0.087
}
],
"max_steps": 1600,
"num_train_epochs": 200,
"total_flos": 1.1848602213269387e+19,
"trial_name": null,
"trial_params": null
}