gary109's picture
End of training
d96475a
raw
history blame
67.5 kB
{
"best_metric": 2.074415922164917,
"best_model_checkpoint": "ai-light-dance_drums_ft_pretrain_wav2vec2-base/checkpoint-744",
"epoch": 199.90140845070422,
"global_step": 1600,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.9,
"eval_loss": 2.379915952682495,
"eval_runtime": 7.7959,
"eval_samples_per_second": 8.081,
"eval_steps_per_second": 1.026,
"eval_wer": 0.7797066746483089,
"step": 8
},
{
"epoch": 1.23,
"learning_rate": 0.0002,
"loss": 0.9677,
"step": 10
},
{
"epoch": 1.9,
"eval_loss": 2.4062252044677734,
"eval_runtime": 7.9931,
"eval_samples_per_second": 7.882,
"eval_steps_per_second": 1.001,
"eval_wer": 0.7913798263992816,
"step": 16
},
{
"epoch": 2.45,
"learning_rate": 0.0004,
"loss": 0.9433,
"step": 20
},
{
"epoch": 2.9,
"eval_loss": 2.6954824924468994,
"eval_runtime": 8.0202,
"eval_samples_per_second": 7.855,
"eval_steps_per_second": 0.997,
"eval_wer": 0.7683328344806944,
"step": 24
},
{
"epoch": 3.68,
"learning_rate": 0.00039746835443037974,
"loss": 1.0276,
"step": 30
},
{
"epoch": 3.9,
"eval_loss": 2.5257680416107178,
"eval_runtime": 8.0107,
"eval_samples_per_second": 7.864,
"eval_steps_per_second": 0.999,
"eval_wer": 0.7892846453157737,
"step": 32
},
{
"epoch": 4.9,
"learning_rate": 0.0003949367088607595,
"loss": 0.9923,
"step": 40
},
{
"epoch": 4.9,
"eval_loss": 2.417393445968628,
"eval_runtime": 8.1407,
"eval_samples_per_second": 7.739,
"eval_steps_per_second": 0.983,
"eval_wer": 0.7824004788985334,
"step": 40
},
{
"epoch": 5.9,
"eval_loss": 2.7146248817443848,
"eval_runtime": 8.0327,
"eval_samples_per_second": 7.843,
"eval_steps_per_second": 0.996,
"eval_wer": 0.7788087398982341,
"step": 48
},
{
"epoch": 6.23,
"learning_rate": 0.0003924050632911393,
"loss": 1.0927,
"step": 50
},
{
"epoch": 6.9,
"eval_loss": 2.9690921306610107,
"eval_runtime": 7.8332,
"eval_samples_per_second": 8.043,
"eval_steps_per_second": 1.021,
"eval_wer": 0.7883867105656989,
"step": 56
},
{
"epoch": 7.45,
"learning_rate": 0.000389873417721519,
"loss": 1.0133,
"step": 60
},
{
"epoch": 7.9,
"eval_loss": 3.11049485206604,
"eval_runtime": 8.0174,
"eval_samples_per_second": 7.858,
"eval_steps_per_second": 0.998,
"eval_wer": 0.7644417838970368,
"step": 64
},
{
"epoch": 8.68,
"learning_rate": 0.00038734177215189877,
"loss": 0.98,
"step": 70
},
{
"epoch": 8.9,
"eval_loss": 2.8638393878936768,
"eval_runtime": 8.0331,
"eval_samples_per_second": 7.843,
"eval_steps_per_second": 0.996,
"eval_wer": 0.7644417838970368,
"step": 72
},
{
"epoch": 9.9,
"learning_rate": 0.0003848101265822785,
"loss": 0.9688,
"step": 80
},
{
"epoch": 9.9,
"eval_loss": 2.7538065910339355,
"eval_runtime": 7.9304,
"eval_samples_per_second": 7.944,
"eval_steps_per_second": 1.009,
"eval_wer": 0.758156240646513,
"step": 80
},
{
"epoch": 10.9,
"eval_loss": 2.6010308265686035,
"eval_runtime": 8.0107,
"eval_samples_per_second": 7.865,
"eval_steps_per_second": 0.999,
"eval_wer": 0.7713259503142772,
"step": 88
},
{
"epoch": 11.23,
"learning_rate": 0.00038227848101265825,
"loss": 1.0453,
"step": 90
},
{
"epoch": 11.9,
"eval_loss": 2.6365110874176025,
"eval_runtime": 7.9124,
"eval_samples_per_second": 7.962,
"eval_steps_per_second": 1.011,
"eval_wer": 0.7482789583956899,
"step": 96
},
{
"epoch": 12.45,
"learning_rate": 0.00037974683544303797,
"loss": 0.9397,
"step": 100
},
{
"epoch": 12.9,
"eval_loss": 2.474029302597046,
"eval_runtime": 7.927,
"eval_samples_per_second": 7.948,
"eval_steps_per_second": 1.009,
"eval_wer": 0.7629452259802454,
"step": 104
},
{
"epoch": 13.68,
"learning_rate": 0.00037721518987341774,
"loss": 0.9466,
"step": 110
},
{
"epoch": 13.9,
"eval_loss": 2.6466243267059326,
"eval_runtime": 7.9192,
"eval_samples_per_second": 7.955,
"eval_steps_per_second": 1.01,
"eval_wer": 0.7617479796468123,
"step": 112
},
{
"epoch": 14.9,
"learning_rate": 0.00037468354430379746,
"loss": 0.9665,
"step": 120
},
{
"epoch": 14.9,
"eval_loss": 2.6643269062042236,
"eval_runtime": 7.9716,
"eval_samples_per_second": 7.903,
"eval_steps_per_second": 1.004,
"eval_wer": 0.7644417838970368,
"step": 120
},
{
"epoch": 15.9,
"eval_loss": 2.4003283977508545,
"eval_runtime": 7.9753,
"eval_samples_per_second": 7.899,
"eval_steps_per_second": 1.003,
"eval_wer": 0.740796168811733,
"step": 128
},
{
"epoch": 16.23,
"learning_rate": 0.00037215189873417723,
"loss": 1.0577,
"step": 130
},
{
"epoch": 16.9,
"eval_loss": 2.6306591033935547,
"eval_runtime": 7.9695,
"eval_samples_per_second": 7.905,
"eval_steps_per_second": 1.004,
"eval_wer": 0.7707273271475606,
"step": 136
},
{
"epoch": 17.45,
"learning_rate": 0.000369620253164557,
"loss": 0.9154,
"step": 140
},
{
"epoch": 17.9,
"eval_loss": 2.6734743118286133,
"eval_runtime": 7.957,
"eval_samples_per_second": 7.918,
"eval_steps_per_second": 1.005,
"eval_wer": 0.7491768931457647,
"step": 144
},
{
"epoch": 18.68,
"learning_rate": 0.0003670886075949367,
"loss": 0.9352,
"step": 150
},
{
"epoch": 18.9,
"eval_loss": 2.4403460025787354,
"eval_runtime": 7.9548,
"eval_samples_per_second": 7.92,
"eval_steps_per_second": 1.006,
"eval_wer": 0.7491768931457647,
"step": 152
},
{
"epoch": 19.9,
"learning_rate": 0.0003645569620253165,
"loss": 0.8999,
"step": 160
},
{
"epoch": 19.9,
"eval_loss": 2.71948504447937,
"eval_runtime": 7.9309,
"eval_samples_per_second": 7.944,
"eval_steps_per_second": 1.009,
"eval_wer": 0.7650404070637533,
"step": 160
},
{
"epoch": 20.9,
"eval_loss": 2.2872610092163086,
"eval_runtime": 7.9835,
"eval_samples_per_second": 7.891,
"eval_steps_per_second": 1.002,
"eval_wer": 0.7602514217300209,
"step": 168
},
{
"epoch": 21.23,
"learning_rate": 0.00036202531645569626,
"loss": 0.9935,
"step": 170
},
{
"epoch": 21.9,
"eval_loss": 2.844008207321167,
"eval_runtime": 7.9178,
"eval_samples_per_second": 7.957,
"eval_steps_per_second": 1.01,
"eval_wer": 0.7512720742292727,
"step": 176
},
{
"epoch": 22.45,
"learning_rate": 0.000359493670886076,
"loss": 0.885,
"step": 180
},
{
"epoch": 22.9,
"eval_loss": 2.7574303150177,
"eval_runtime": 7.9538,
"eval_samples_per_second": 7.921,
"eval_steps_per_second": 1.006,
"eval_wer": 0.7485782699790482,
"step": 184
},
{
"epoch": 23.68,
"learning_rate": 0.0003569620253164557,
"loss": 0.8979,
"step": 190
},
{
"epoch": 23.9,
"eval_loss": 3.1470837593078613,
"eval_runtime": 7.9957,
"eval_samples_per_second": 7.879,
"eval_steps_per_second": 1.001,
"eval_wer": 0.7536665668961389,
"step": 192
},
{
"epoch": 24.9,
"learning_rate": 0.00035443037974683546,
"loss": 0.9074,
"step": 200
},
{
"epoch": 24.9,
"eval_loss": 3.089177131652832,
"eval_runtime": 7.9191,
"eval_samples_per_second": 7.955,
"eval_steps_per_second": 1.01,
"eval_wer": 0.7288237054774019,
"step": 200
},
{
"epoch": 25.9,
"eval_loss": 2.8640966415405273,
"eval_runtime": 7.907,
"eval_samples_per_second": 7.968,
"eval_steps_per_second": 1.012,
"eval_wer": 0.7518706973959892,
"step": 208
},
{
"epoch": 26.23,
"learning_rate": 0.00035189873417721524,
"loss": 0.9498,
"step": 210
},
{
"epoch": 26.9,
"eval_loss": 2.879786729812622,
"eval_runtime": 7.8826,
"eval_samples_per_second": 7.992,
"eval_steps_per_second": 1.015,
"eval_wer": 0.7398982340616582,
"step": 216
},
{
"epoch": 27.45,
"learning_rate": 0.00034936708860759495,
"loss": 0.8821,
"step": 220
},
{
"epoch": 27.9,
"eval_loss": 2.8114750385284424,
"eval_runtime": 7.9479,
"eval_samples_per_second": 7.927,
"eval_steps_per_second": 1.007,
"eval_wer": 0.749476204729123,
"step": 224
},
{
"epoch": 28.68,
"learning_rate": 0.00034683544303797467,
"loss": 0.8968,
"step": 230
},
{
"epoch": 28.9,
"eval_loss": 2.922487735748291,
"eval_runtime": 7.8659,
"eval_samples_per_second": 8.009,
"eval_steps_per_second": 1.017,
"eval_wer": 0.7446872193953906,
"step": 232
},
{
"epoch": 29.9,
"learning_rate": 0.00034430379746835444,
"loss": 0.8783,
"step": 240
},
{
"epoch": 29.9,
"eval_loss": 2.541382074356079,
"eval_runtime": 8.0089,
"eval_samples_per_second": 7.866,
"eval_steps_per_second": 0.999,
"eval_wer": 0.7503741394791978,
"step": 240
},
{
"epoch": 30.9,
"eval_loss": 2.352771759033203,
"eval_runtime": 7.9156,
"eval_samples_per_second": 7.959,
"eval_steps_per_second": 1.011,
"eval_wer": 0.7378030529781503,
"step": 248
},
{
"epoch": 31.23,
"learning_rate": 0.0003417721518987342,
"loss": 0.9428,
"step": 250
},
{
"epoch": 31.9,
"eval_loss": 2.807304859161377,
"eval_runtime": 7.8598,
"eval_samples_per_second": 8.015,
"eval_steps_per_second": 1.018,
"eval_wer": 0.7141574378928465,
"step": 256
},
{
"epoch": 32.45,
"learning_rate": 0.00033924050632911393,
"loss": 0.8184,
"step": 260
},
{
"epoch": 32.9,
"eval_loss": 2.575679063796997,
"eval_runtime": 8.0158,
"eval_samples_per_second": 7.859,
"eval_steps_per_second": 0.998,
"eval_wer": 0.7192457348099371,
"step": 264
},
{
"epoch": 33.68,
"learning_rate": 0.0003367088607594937,
"loss": 0.9092,
"step": 270
},
{
"epoch": 33.9,
"eval_loss": 2.4403328895568848,
"eval_runtime": 7.9646,
"eval_samples_per_second": 7.91,
"eval_steps_per_second": 1.004,
"eval_wer": 0.7093684525591141,
"step": 272
},
{
"epoch": 34.9,
"learning_rate": 0.0003341772151898734,
"loss": 0.8749,
"step": 280
},
{
"epoch": 34.9,
"eval_loss": 2.691164493560791,
"eval_runtime": 7.9176,
"eval_samples_per_second": 7.957,
"eval_steps_per_second": 1.01,
"eval_wer": 0.7219395390601616,
"step": 280
},
{
"epoch": 35.9,
"eval_loss": 2.4073445796966553,
"eval_runtime": 8.0386,
"eval_samples_per_second": 7.837,
"eval_steps_per_second": 0.995,
"eval_wer": 0.7327147560610595,
"step": 288
},
{
"epoch": 36.23,
"learning_rate": 0.0003316455696202532,
"loss": 0.9235,
"step": 290
},
{
"epoch": 36.9,
"eval_loss": 2.444603681564331,
"eval_runtime": 7.9142,
"eval_samples_per_second": 7.96,
"eval_steps_per_second": 1.011,
"eval_wer": 0.726728524393894,
"step": 296
},
{
"epoch": 37.45,
"learning_rate": 0.00032911392405063296,
"loss": 0.8654,
"step": 300
},
{
"epoch": 37.9,
"eval_loss": 2.821065902709961,
"eval_runtime": 7.9214,
"eval_samples_per_second": 7.953,
"eval_steps_per_second": 1.01,
"eval_wer": 0.7360071834780006,
"step": 304
},
{
"epoch": 38.68,
"learning_rate": 0.0003265822784810127,
"loss": 0.8428,
"step": 310
},
{
"epoch": 38.9,
"eval_loss": 2.481106996536255,
"eval_runtime": 7.9459,
"eval_samples_per_second": 7.929,
"eval_steps_per_second": 1.007,
"eval_wer": 0.7243340317270278,
"step": 312
},
{
"epoch": 39.9,
"learning_rate": 0.0003240506329113924,
"loss": 0.8355,
"step": 320
},
{
"epoch": 39.9,
"eval_loss": 2.357530355453491,
"eval_runtime": 8.0775,
"eval_samples_per_second": 7.799,
"eval_steps_per_second": 0.99,
"eval_wer": 0.7192457348099371,
"step": 320
},
{
"epoch": 40.9,
"eval_loss": 2.3957395553588867,
"eval_runtime": 7.951,
"eval_samples_per_second": 7.924,
"eval_steps_per_second": 1.006,
"eval_wer": 0.7138581263094882,
"step": 328
},
{
"epoch": 41.23,
"learning_rate": 0.00032151898734177216,
"loss": 0.8992,
"step": 330
},
{
"epoch": 41.9,
"eval_loss": 2.4372870922088623,
"eval_runtime": 7.962,
"eval_samples_per_second": 7.913,
"eval_steps_per_second": 1.005,
"eval_wer": 0.7138581263094882,
"step": 336
},
{
"epoch": 42.45,
"learning_rate": 0.00031898734177215193,
"loss": 0.8221,
"step": 340
},
{
"epoch": 42.9,
"eval_loss": 2.4234611988067627,
"eval_runtime": 7.963,
"eval_samples_per_second": 7.912,
"eval_steps_per_second": 1.005,
"eval_wer": 0.7126608799760551,
"step": 344
},
{
"epoch": 43.68,
"learning_rate": 0.00031645569620253165,
"loss": 0.8305,
"step": 350
},
{
"epoch": 43.9,
"eval_loss": 2.3404624462127686,
"eval_runtime": 7.9486,
"eval_samples_per_second": 7.926,
"eval_steps_per_second": 1.006,
"eval_wer": 0.7111643220592637,
"step": 352
},
{
"epoch": 44.9,
"learning_rate": 0.00031392405063291137,
"loss": 0.8328,
"step": 360
},
{
"epoch": 44.9,
"eval_loss": 2.340630292892456,
"eval_runtime": 8.0091,
"eval_samples_per_second": 7.866,
"eval_steps_per_second": 0.999,
"eval_wer": 0.7216402274768033,
"step": 360
},
{
"epoch": 45.9,
"eval_loss": 2.4469380378723145,
"eval_runtime": 7.9319,
"eval_samples_per_second": 7.943,
"eval_steps_per_second": 1.009,
"eval_wer": 0.7165519305597127,
"step": 368
},
{
"epoch": 46.23,
"learning_rate": 0.0003113924050632912,
"loss": 0.8611,
"step": 370
},
{
"epoch": 46.9,
"eval_loss": 2.429659366607666,
"eval_runtime": 7.8903,
"eval_samples_per_second": 7.984,
"eval_steps_per_second": 1.014,
"eval_wer": 0.7156539958096378,
"step": 376
},
{
"epoch": 47.45,
"learning_rate": 0.0003088607594936709,
"loss": 0.8092,
"step": 380
},
{
"epoch": 47.9,
"eval_loss": 2.5867514610290527,
"eval_runtime": 8.0153,
"eval_samples_per_second": 7.86,
"eval_steps_per_second": 0.998,
"eval_wer": 0.7093684525591141,
"step": 384
},
{
"epoch": 48.68,
"learning_rate": 0.00030632911392405063,
"loss": 0.8173,
"step": 390
},
{
"epoch": 48.9,
"eval_loss": 2.2557618618011475,
"eval_runtime": 8.0103,
"eval_samples_per_second": 7.865,
"eval_steps_per_second": 0.999,
"eval_wer": 0.7003891050583657,
"step": 392
},
{
"epoch": 49.9,
"learning_rate": 0.0003037974683544304,
"loss": 0.7772,
"step": 400
},
{
"epoch": 49.9,
"eval_loss": 2.359837770462036,
"eval_runtime": 7.7486,
"eval_samples_per_second": 8.13,
"eval_steps_per_second": 1.032,
"eval_wer": 0.7003891050583657,
"step": 400
},
{
"epoch": 50.9,
"eval_loss": 2.308309316635132,
"eval_runtime": 7.7464,
"eval_samples_per_second": 8.133,
"eval_steps_per_second": 1.033,
"eval_wer": 0.6881173301406764,
"step": 408
},
{
"epoch": 51.23,
"learning_rate": 0.00030126582278481017,
"loss": 0.8494,
"step": 410
},
{
"epoch": 51.9,
"eval_loss": 2.4430971145629883,
"eval_runtime": 7.7316,
"eval_samples_per_second": 8.148,
"eval_steps_per_second": 1.035,
"eval_wer": 0.7012870398084405,
"step": 416
},
{
"epoch": 52.45,
"learning_rate": 0.0002987341772151899,
"loss": 0.7997,
"step": 420
},
{
"epoch": 52.9,
"eval_loss": 2.3005003929138184,
"eval_runtime": 7.7273,
"eval_samples_per_second": 8.153,
"eval_steps_per_second": 1.035,
"eval_wer": 0.7111643220592637,
"step": 424
},
{
"epoch": 53.68,
"learning_rate": 0.0002962025316455696,
"loss": 0.7879,
"step": 430
},
{
"epoch": 53.9,
"eval_loss": 2.1985087394714355,
"eval_runtime": 7.8272,
"eval_samples_per_second": 8.049,
"eval_steps_per_second": 1.022,
"eval_wer": 0.7297216402274768,
"step": 432
},
{
"epoch": 54.9,
"learning_rate": 0.0002936708860759494,
"loss": 0.7694,
"step": 440
},
{
"epoch": 54.9,
"eval_loss": 2.337602376937866,
"eval_runtime": 7.7096,
"eval_samples_per_second": 8.172,
"eval_steps_per_second": 1.038,
"eval_wer": 0.708171206225681,
"step": 440
},
{
"epoch": 55.9,
"eval_loss": 2.371609926223755,
"eval_runtime": 7.7243,
"eval_samples_per_second": 8.156,
"eval_steps_per_second": 1.036,
"eval_wer": 0.7012870398084405,
"step": 448
},
{
"epoch": 56.23,
"learning_rate": 0.00029113924050632915,
"loss": 0.8397,
"step": 450
},
{
"epoch": 56.9,
"eval_loss": 2.381723403930664,
"eval_runtime": 7.7601,
"eval_samples_per_second": 8.118,
"eval_steps_per_second": 1.031,
"eval_wer": 0.711463633642622,
"step": 456
},
{
"epoch": 57.45,
"learning_rate": 0.00028860759493670886,
"loss": 0.7868,
"step": 460
},
{
"epoch": 57.9,
"eval_loss": 2.257676601409912,
"eval_runtime": 7.7658,
"eval_samples_per_second": 8.112,
"eval_steps_per_second": 1.03,
"eval_wer": 0.7090691409757558,
"step": 464
},
{
"epoch": 58.68,
"learning_rate": 0.00028607594936708863,
"loss": 0.7311,
"step": 470
},
{
"epoch": 58.9,
"eval_loss": 2.3895084857940674,
"eval_runtime": 7.7486,
"eval_samples_per_second": 8.13,
"eval_steps_per_second": 1.032,
"eval_wer": 0.7126608799760551,
"step": 472
},
{
"epoch": 59.9,
"learning_rate": 0.00028354430379746835,
"loss": 0.7796,
"step": 480
},
{
"epoch": 59.9,
"eval_loss": 2.276035785675049,
"eval_runtime": 7.7565,
"eval_samples_per_second": 8.122,
"eval_steps_per_second": 1.031,
"eval_wer": 0.7099670757258306,
"step": 480
},
{
"epoch": 60.9,
"eval_loss": 2.5685431957244873,
"eval_runtime": 7.7725,
"eval_samples_per_second": 8.105,
"eval_steps_per_second": 1.029,
"eval_wer": 0.7072732714756061,
"step": 488
},
{
"epoch": 61.23,
"learning_rate": 0.0002810126582278481,
"loss": 0.8272,
"step": 490
},
{
"epoch": 61.9,
"eval_loss": 2.3881263732910156,
"eval_runtime": 7.7155,
"eval_samples_per_second": 8.165,
"eval_steps_per_second": 1.037,
"eval_wer": 0.7027835977252319,
"step": 496
},
{
"epoch": 62.45,
"learning_rate": 0.0002784810126582279,
"loss": 0.7639,
"step": 500
},
{
"epoch": 62.9,
"eval_loss": 2.3456814289093018,
"eval_runtime": 7.7642,
"eval_samples_per_second": 8.114,
"eval_steps_per_second": 1.03,
"eval_wer": 0.7084705178090392,
"step": 504
},
{
"epoch": 63.68,
"learning_rate": 0.0002759493670886076,
"loss": 0.789,
"step": 510
},
{
"epoch": 63.9,
"eval_loss": 2.3291287422180176,
"eval_runtime": 7.7437,
"eval_samples_per_second": 8.136,
"eval_steps_per_second": 1.033,
"eval_wer": 0.700688416641724,
"step": 512
},
{
"epoch": 64.9,
"learning_rate": 0.0002734177215189873,
"loss": 0.7472,
"step": 520
},
{
"epoch": 64.9,
"eval_loss": 2.5174083709716797,
"eval_runtime": 7.7856,
"eval_samples_per_second": 8.092,
"eval_steps_per_second": 1.028,
"eval_wer": 0.70487877880874,
"step": 520
},
{
"epoch": 65.9,
"eval_loss": 2.399650812149048,
"eval_runtime": 7.7605,
"eval_samples_per_second": 8.118,
"eval_steps_per_second": 1.031,
"eval_wer": 0.7153546842262796,
"step": 528
},
{
"epoch": 66.23,
"learning_rate": 0.0002708860759493671,
"loss": 0.8056,
"step": 530
},
{
"epoch": 66.9,
"eval_loss": 2.4573962688446045,
"eval_runtime": 7.7606,
"eval_samples_per_second": 8.118,
"eval_steps_per_second": 1.031,
"eval_wer": 0.7237354085603113,
"step": 536
},
{
"epoch": 67.45,
"learning_rate": 0.00026835443037974687,
"loss": 0.7752,
"step": 540
},
{
"epoch": 67.9,
"eval_loss": 2.4979681968688965,
"eval_runtime": 7.7515,
"eval_samples_per_second": 8.127,
"eval_steps_per_second": 1.032,
"eval_wer": 0.7003891050583657,
"step": 544
},
{
"epoch": 68.68,
"learning_rate": 0.0002658227848101266,
"loss": 0.7084,
"step": 550
},
{
"epoch": 68.9,
"eval_loss": 2.2370431423187256,
"eval_runtime": 7.792,
"eval_samples_per_second": 8.085,
"eval_steps_per_second": 1.027,
"eval_wer": 0.7084705178090392,
"step": 552
},
{
"epoch": 69.9,
"learning_rate": 0.0002632911392405063,
"loss": 0.7824,
"step": 560
},
{
"epoch": 69.9,
"eval_loss": 2.359494924545288,
"eval_runtime": 7.722,
"eval_samples_per_second": 8.159,
"eval_steps_per_second": 1.036,
"eval_wer": 0.6970966776414247,
"step": 560
},
{
"epoch": 70.9,
"eval_loss": 2.19962477684021,
"eval_runtime": 7.7269,
"eval_samples_per_second": 8.153,
"eval_steps_per_second": 1.035,
"eval_wer": 0.7003891050583657,
"step": 568
},
{
"epoch": 71.23,
"learning_rate": 0.00026075949367088613,
"loss": 0.7776,
"step": 570
},
{
"epoch": 71.9,
"eval_loss": 2.2957143783569336,
"eval_runtime": 7.7186,
"eval_samples_per_second": 8.162,
"eval_steps_per_second": 1.036,
"eval_wer": 0.6902125112241844,
"step": 576
},
{
"epoch": 72.45,
"learning_rate": 0.00025822784810126584,
"loss": 0.7205,
"step": 580
},
{
"epoch": 72.9,
"eval_loss": 2.2435786724090576,
"eval_runtime": 7.7517,
"eval_samples_per_second": 8.127,
"eval_steps_per_second": 1.032,
"eval_wer": 0.6908111343909009,
"step": 584
},
{
"epoch": 73.68,
"learning_rate": 0.00025569620253164556,
"loss": 0.7074,
"step": 590
},
{
"epoch": 73.9,
"eval_loss": 2.23608136177063,
"eval_runtime": 7.7615,
"eval_samples_per_second": 8.117,
"eval_steps_per_second": 1.031,
"eval_wer": 0.6932056270577671,
"step": 592
},
{
"epoch": 74.9,
"learning_rate": 0.00025316455696202533,
"loss": 0.7237,
"step": 600
},
{
"epoch": 74.9,
"eval_loss": 2.207817792892456,
"eval_runtime": 7.6966,
"eval_samples_per_second": 8.185,
"eval_steps_per_second": 1.039,
"eval_wer": 0.6857228374738102,
"step": 600
},
{
"epoch": 75.9,
"eval_loss": 2.233380079269409,
"eval_runtime": 7.7786,
"eval_samples_per_second": 8.099,
"eval_steps_per_second": 1.028,
"eval_wer": 0.6905118228075426,
"step": 608
},
{
"epoch": 76.23,
"learning_rate": 0.0002506329113924051,
"loss": 0.7862,
"step": 610
},
{
"epoch": 76.9,
"eval_loss": 2.3564865589141846,
"eval_runtime": 7.7597,
"eval_samples_per_second": 8.119,
"eval_steps_per_second": 1.031,
"eval_wer": 0.6976953008081412,
"step": 616
},
{
"epoch": 77.45,
"learning_rate": 0.0002481012658227848,
"loss": 0.7299,
"step": 620
},
{
"epoch": 77.9,
"eval_loss": 2.1293139457702637,
"eval_runtime": 7.6982,
"eval_samples_per_second": 8.184,
"eval_steps_per_second": 1.039,
"eval_wer": 0.6779407363064951,
"step": 624
},
{
"epoch": 78.68,
"learning_rate": 0.0002455696202531646,
"loss": 0.6755,
"step": 630
},
{
"epoch": 78.9,
"eval_loss": 2.2523531913757324,
"eval_runtime": 7.7601,
"eval_samples_per_second": 8.118,
"eval_steps_per_second": 1.031,
"eval_wer": 0.6860221490571685,
"step": 632
},
{
"epoch": 79.9,
"learning_rate": 0.00024303797468354434,
"loss": 0.724,
"step": 640
},
{
"epoch": 79.9,
"eval_loss": 2.206925630569458,
"eval_runtime": 7.7271,
"eval_samples_per_second": 8.153,
"eval_steps_per_second": 1.035,
"eval_wer": 0.688715953307393,
"step": 640
},
{
"epoch": 80.9,
"eval_loss": 2.5267446041107178,
"eval_runtime": 7.7853,
"eval_samples_per_second": 8.092,
"eval_steps_per_second": 1.028,
"eval_wer": 0.6785393594732116,
"step": 648
},
{
"epoch": 81.23,
"learning_rate": 0.00024050632911392405,
"loss": 0.7878,
"step": 650
},
{
"epoch": 81.9,
"eval_loss": 2.6393752098083496,
"eval_runtime": 7.709,
"eval_samples_per_second": 8.172,
"eval_steps_per_second": 1.038,
"eval_wer": 0.6824304100568692,
"step": 656
},
{
"epoch": 82.45,
"learning_rate": 0.0002379746835443038,
"loss": 0.6882,
"step": 660
},
{
"epoch": 82.9,
"eval_loss": 2.4647722244262695,
"eval_runtime": 7.8339,
"eval_samples_per_second": 8.042,
"eval_steps_per_second": 1.021,
"eval_wer": 0.6764441783897037,
"step": 664
},
{
"epoch": 83.68,
"learning_rate": 0.00023544303797468357,
"loss": 0.6996,
"step": 670
},
{
"epoch": 83.9,
"eval_loss": 2.4115612506866455,
"eval_runtime": 7.7276,
"eval_samples_per_second": 8.153,
"eval_steps_per_second": 1.035,
"eval_wer": 0.6890152648907513,
"step": 672
},
{
"epoch": 84.9,
"learning_rate": 0.0002329113924050633,
"loss": 0.7149,
"step": 680
},
{
"epoch": 84.9,
"eval_loss": 2.1044137477874756,
"eval_runtime": 7.7519,
"eval_samples_per_second": 8.127,
"eval_steps_per_second": 1.032,
"eval_wer": 0.6893145764741095,
"step": 680
},
{
"epoch": 85.9,
"eval_loss": 2.1447622776031494,
"eval_runtime": 7.7429,
"eval_samples_per_second": 8.136,
"eval_steps_per_second": 1.033,
"eval_wer": 0.6917090691409757,
"step": 688
},
{
"epoch": 86.23,
"learning_rate": 0.00023037974683544303,
"loss": 0.7499,
"step": 690
},
{
"epoch": 86.9,
"eval_loss": 2.2603471279144287,
"eval_runtime": 7.7748,
"eval_samples_per_second": 8.103,
"eval_steps_per_second": 1.029,
"eval_wer": 0.6875187069739599,
"step": 696
},
{
"epoch": 87.45,
"learning_rate": 0.0002278481012658228,
"loss": 0.6881,
"step": 700
},
{
"epoch": 87.9,
"eval_loss": 2.1306064128875732,
"eval_runtime": 7.7761,
"eval_samples_per_second": 8.102,
"eval_steps_per_second": 1.029,
"eval_wer": 0.6815324753067944,
"step": 704
},
{
"epoch": 88.68,
"learning_rate": 0.00022531645569620254,
"loss": 0.6652,
"step": 710
},
{
"epoch": 88.9,
"eval_loss": 2.195241689682007,
"eval_runtime": 7.7296,
"eval_samples_per_second": 8.151,
"eval_steps_per_second": 1.035,
"eval_wer": 0.6905118228075426,
"step": 712
},
{
"epoch": 89.9,
"learning_rate": 0.0002227848101265823,
"loss": 0.7093,
"step": 720
},
{
"epoch": 89.9,
"eval_loss": 2.3550162315368652,
"eval_runtime": 7.7395,
"eval_samples_per_second": 8.14,
"eval_steps_per_second": 1.034,
"eval_wer": 0.676743489973062,
"step": 720
},
{
"epoch": 90.9,
"eval_loss": 2.261043071746826,
"eval_runtime": 7.7396,
"eval_samples_per_second": 8.14,
"eval_steps_per_second": 1.034,
"eval_wer": 0.6749476204729123,
"step": 728
},
{
"epoch": 91.23,
"learning_rate": 0.00022025316455696206,
"loss": 0.7439,
"step": 730
},
{
"epoch": 91.9,
"eval_loss": 2.147209882736206,
"eval_runtime": 7.7312,
"eval_samples_per_second": 8.149,
"eval_steps_per_second": 1.035,
"eval_wer": 0.6857228374738102,
"step": 736
},
{
"epoch": 92.45,
"learning_rate": 0.00021772151898734177,
"loss": 0.6898,
"step": 740
},
{
"epoch": 92.9,
"eval_loss": 2.074415922164917,
"eval_runtime": 7.7637,
"eval_samples_per_second": 8.115,
"eval_steps_per_second": 1.03,
"eval_wer": 0.6881173301406764,
"step": 744
},
{
"epoch": 93.68,
"learning_rate": 0.00021518987341772152,
"loss": 0.6734,
"step": 750
},
{
"epoch": 93.9,
"eval_loss": 2.0897610187530518,
"eval_runtime": 7.7107,
"eval_samples_per_second": 8.17,
"eval_steps_per_second": 1.038,
"eval_wer": 0.6929063154744088,
"step": 752
},
{
"epoch": 94.9,
"learning_rate": 0.00021265822784810126,
"loss": 0.6926,
"step": 760
},
{
"epoch": 94.9,
"eval_loss": 2.089553117752075,
"eval_runtime": 7.721,
"eval_samples_per_second": 8.16,
"eval_steps_per_second": 1.036,
"eval_wer": 0.6683627656390302,
"step": 760
},
{
"epoch": 95.9,
"eval_loss": 2.1928741931915283,
"eval_runtime": 7.7808,
"eval_samples_per_second": 8.097,
"eval_steps_per_second": 1.028,
"eval_wer": 0.6812331637234361,
"step": 768
},
{
"epoch": 96.23,
"learning_rate": 0.00021012658227848103,
"loss": 0.7154,
"step": 770
},
{
"epoch": 96.9,
"eval_loss": 2.153787612915039,
"eval_runtime": 7.7478,
"eval_samples_per_second": 8.131,
"eval_steps_per_second": 1.033,
"eval_wer": 0.6860221490571685,
"step": 776
},
{
"epoch": 97.45,
"learning_rate": 0.00020759493670886078,
"loss": 0.6493,
"step": 780
},
{
"epoch": 97.9,
"eval_loss": 2.143815279006958,
"eval_runtime": 7.7358,
"eval_samples_per_second": 8.144,
"eval_steps_per_second": 1.034,
"eval_wer": 0.6815324753067944,
"step": 784
},
{
"epoch": 98.68,
"learning_rate": 0.0002050632911392405,
"loss": 0.6755,
"step": 790
},
{
"epoch": 98.9,
"eval_loss": 2.1560962200164795,
"eval_runtime": 7.7208,
"eval_samples_per_second": 8.16,
"eval_steps_per_second": 1.036,
"eval_wer": 0.6902125112241844,
"step": 792
},
{
"epoch": 99.9,
"learning_rate": 0.00020253164556962027,
"loss": 0.6667,
"step": 800
},
{
"epoch": 99.9,
"eval_loss": 2.076709032058716,
"eval_runtime": 7.7317,
"eval_samples_per_second": 8.148,
"eval_steps_per_second": 1.035,
"eval_wer": 0.6908111343909009,
"step": 800
},
{
"epoch": 100.9,
"eval_loss": 2.106370449066162,
"eval_runtime": 7.7472,
"eval_samples_per_second": 8.132,
"eval_steps_per_second": 1.033,
"eval_wer": 0.6785393594732116,
"step": 808
},
{
"epoch": 101.23,
"learning_rate": 0.0002,
"loss": 0.7016,
"step": 810
},
{
"epoch": 101.9,
"eval_loss": 2.227837085723877,
"eval_runtime": 8.0181,
"eval_samples_per_second": 7.857,
"eval_steps_per_second": 0.998,
"eval_wer": 0.676743489973062,
"step": 816
},
{
"epoch": 102.45,
"learning_rate": 0.00019746835443037975,
"loss": 0.6726,
"step": 820
},
{
"epoch": 102.9,
"eval_loss": 2.261566162109375,
"eval_runtime": 7.7943,
"eval_samples_per_second": 8.083,
"eval_steps_per_second": 1.026,
"eval_wer": 0.6689613888057467,
"step": 824
},
{
"epoch": 103.68,
"learning_rate": 0.0001949367088607595,
"loss": 0.6725,
"step": 830
},
{
"epoch": 103.9,
"eval_loss": 2.133070230484009,
"eval_runtime": 7.7265,
"eval_samples_per_second": 8.154,
"eval_steps_per_second": 1.035,
"eval_wer": 0.6878180185573182,
"step": 832
},
{
"epoch": 104.9,
"learning_rate": 0.00019240506329113924,
"loss": 0.6657,
"step": 840
},
{
"epoch": 104.9,
"eval_loss": 2.1497416496276855,
"eval_runtime": 7.7253,
"eval_samples_per_second": 8.155,
"eval_steps_per_second": 1.036,
"eval_wer": 0.6731517509727627,
"step": 840
},
{
"epoch": 105.9,
"eval_loss": 2.160142421722412,
"eval_runtime": 7.7477,
"eval_samples_per_second": 8.131,
"eval_steps_per_second": 1.033,
"eval_wer": 0.6737503741394792,
"step": 848
},
{
"epoch": 106.23,
"learning_rate": 0.00018987341772151899,
"loss": 0.6989,
"step": 850
},
{
"epoch": 106.9,
"eval_loss": 2.319141149520874,
"eval_runtime": 7.732,
"eval_samples_per_second": 8.148,
"eval_steps_per_second": 1.035,
"eval_wer": 0.6674648308889554,
"step": 856
},
{
"epoch": 107.45,
"learning_rate": 0.00018734177215189873,
"loss": 0.6658,
"step": 860
},
{
"epoch": 107.9,
"eval_loss": 2.354734420776367,
"eval_runtime": 7.7273,
"eval_samples_per_second": 8.153,
"eval_steps_per_second": 1.035,
"eval_wer": 0.6788386710565699,
"step": 864
},
{
"epoch": 108.68,
"learning_rate": 0.0001848101265822785,
"loss": 0.6398,
"step": 870
},
{
"epoch": 108.9,
"eval_loss": 2.3368043899536133,
"eval_runtime": 7.7551,
"eval_samples_per_second": 8.124,
"eval_steps_per_second": 1.032,
"eval_wer": 0.6740496857228375,
"step": 872
},
{
"epoch": 109.9,
"learning_rate": 0.00018227848101265824,
"loss": 0.6465,
"step": 880
},
{
"epoch": 109.9,
"eval_loss": 2.1896259784698486,
"eval_runtime": 7.7364,
"eval_samples_per_second": 8.143,
"eval_steps_per_second": 1.034,
"eval_wer": 0.6806345405567196,
"step": 880
},
{
"epoch": 110.9,
"eval_loss": 2.1210110187530518,
"eval_runtime": 7.7217,
"eval_samples_per_second": 8.159,
"eval_steps_per_second": 1.036,
"eval_wer": 0.6797366058066447,
"step": 888
},
{
"epoch": 111.23,
"learning_rate": 0.000179746835443038,
"loss": 0.727,
"step": 890
},
{
"epoch": 111.9,
"eval_loss": 2.3508195877075195,
"eval_runtime": 7.7774,
"eval_samples_per_second": 8.1,
"eval_steps_per_second": 1.029,
"eval_wer": 0.6686620772223885,
"step": 896
},
{
"epoch": 112.45,
"learning_rate": 0.00017721518987341773,
"loss": 0.6409,
"step": 900
},
{
"epoch": 112.9,
"eval_loss": 2.3439958095550537,
"eval_runtime": 7.7324,
"eval_samples_per_second": 8.148,
"eval_steps_per_second": 1.035,
"eval_wer": 0.6752469320562706,
"step": 904
},
{
"epoch": 113.68,
"learning_rate": 0.00017468354430379748,
"loss": 0.6573,
"step": 910
},
{
"epoch": 113.9,
"eval_loss": 2.269505500793457,
"eval_runtime": 7.7658,
"eval_samples_per_second": 8.112,
"eval_steps_per_second": 1.03,
"eval_wer": 0.6623765339718647,
"step": 912
},
{
"epoch": 114.9,
"learning_rate": 0.00017215189873417722,
"loss": 0.645,
"step": 920
},
{
"epoch": 114.9,
"eval_loss": 2.1471199989318848,
"eval_runtime": 7.7501,
"eval_samples_per_second": 8.129,
"eval_steps_per_second": 1.032,
"eval_wer": 0.6770428015564203,
"step": 920
},
{
"epoch": 115.9,
"eval_loss": 2.186685562133789,
"eval_runtime": 7.7952,
"eval_samples_per_second": 8.082,
"eval_steps_per_second": 1.026,
"eval_wer": 0.6743489973061958,
"step": 928
},
{
"epoch": 116.23,
"learning_rate": 0.00016962025316455696,
"loss": 0.7103,
"step": 930
},
{
"epoch": 116.9,
"eval_loss": 2.232990026473999,
"eval_runtime": 7.7463,
"eval_samples_per_second": 8.133,
"eval_steps_per_second": 1.033,
"eval_wer": 0.6701586351391798,
"step": 936
},
{
"epoch": 117.45,
"learning_rate": 0.0001670886075949367,
"loss": 0.6214,
"step": 940
},
{
"epoch": 117.9,
"eval_loss": 2.217428207397461,
"eval_runtime": 7.7992,
"eval_samples_per_second": 8.078,
"eval_steps_per_second": 1.026,
"eval_wer": 0.6686620772223885,
"step": 944
},
{
"epoch": 118.68,
"learning_rate": 0.00016455696202531648,
"loss": 0.6134,
"step": 950
},
{
"epoch": 118.9,
"eval_loss": 2.198005437850952,
"eval_runtime": 7.8436,
"eval_samples_per_second": 8.032,
"eval_steps_per_second": 1.02,
"eval_wer": 0.6620772223885064,
"step": 952
},
{
"epoch": 119.9,
"learning_rate": 0.0001620253164556962,
"loss": 0.6612,
"step": 960
},
{
"epoch": 119.9,
"eval_loss": 2.2890524864196777,
"eval_runtime": 7.8296,
"eval_samples_per_second": 8.046,
"eval_steps_per_second": 1.022,
"eval_wer": 0.6749476204729123,
"step": 960
},
{
"epoch": 120.9,
"eval_loss": 2.2862656116485596,
"eval_runtime": 7.7538,
"eval_samples_per_second": 8.125,
"eval_steps_per_second": 1.032,
"eval_wer": 0.6641724034720143,
"step": 968
},
{
"epoch": 121.23,
"learning_rate": 0.00015949367088607597,
"loss": 0.688,
"step": 970
},
{
"epoch": 121.9,
"eval_loss": 2.319775342941284,
"eval_runtime": 7.7964,
"eval_samples_per_second": 8.081,
"eval_steps_per_second": 1.026,
"eval_wer": 0.6668662077222388,
"step": 976
},
{
"epoch": 122.45,
"learning_rate": 0.00015696202531645568,
"loss": 0.6451,
"step": 980
},
{
"epoch": 122.9,
"eval_loss": 2.169647216796875,
"eval_runtime": 7.8494,
"eval_samples_per_second": 8.026,
"eval_steps_per_second": 1.019,
"eval_wer": 0.6668662077222388,
"step": 984
},
{
"epoch": 123.68,
"learning_rate": 0.00015443037974683546,
"loss": 0.6308,
"step": 990
},
{
"epoch": 123.9,
"eval_loss": 2.125494956970215,
"eval_runtime": 7.8606,
"eval_samples_per_second": 8.015,
"eval_steps_per_second": 1.018,
"eval_wer": 0.6596827297216402,
"step": 992
},
{
"epoch": 124.9,
"learning_rate": 0.0001518987341772152,
"loss": 0.6359,
"step": 1000
},
{
"epoch": 124.9,
"eval_loss": 2.2053353786468506,
"eval_runtime": 7.7903,
"eval_samples_per_second": 8.087,
"eval_steps_per_second": 1.027,
"eval_wer": 0.6569889254714157,
"step": 1000
},
{
"epoch": 125.9,
"eval_loss": 2.1914987564086914,
"eval_runtime": 7.7966,
"eval_samples_per_second": 8.08,
"eval_steps_per_second": 1.026,
"eval_wer": 0.6581861718048488,
"step": 1008
},
{
"epoch": 126.23,
"learning_rate": 0.00014936708860759494,
"loss": 0.6845,
"step": 1010
},
{
"epoch": 126.9,
"eval_loss": 2.1405885219573975,
"eval_runtime": 7.7604,
"eval_samples_per_second": 8.118,
"eval_steps_per_second": 1.031,
"eval_wer": 0.6656689613888057,
"step": 1016
},
{
"epoch": 127.45,
"learning_rate": 0.0001468354430379747,
"loss": 0.6609,
"step": 1020
},
{
"epoch": 127.9,
"eval_loss": 2.1851718425750732,
"eval_runtime": 7.745,
"eval_samples_per_second": 8.134,
"eval_steps_per_second": 1.033,
"eval_wer": 0.6752469320562706,
"step": 1024
},
{
"epoch": 128.68,
"learning_rate": 0.00014430379746835443,
"loss": 0.6345,
"step": 1030
},
{
"epoch": 128.9,
"eval_loss": 2.1838414669036865,
"eval_runtime": 7.7504,
"eval_samples_per_second": 8.129,
"eval_steps_per_second": 1.032,
"eval_wer": 0.6620772223885064,
"step": 1032
},
{
"epoch": 129.9,
"learning_rate": 0.00014177215189873418,
"loss": 0.6055,
"step": 1040
},
{
"epoch": 129.9,
"eval_loss": 2.158566474914551,
"eval_runtime": 7.7809,
"eval_samples_per_second": 8.097,
"eval_steps_per_second": 1.028,
"eval_wer": 0.6701586351391798,
"step": 1040
},
{
"epoch": 130.9,
"eval_loss": 2.1627261638641357,
"eval_runtime": 7.7707,
"eval_samples_per_second": 8.107,
"eval_steps_per_second": 1.03,
"eval_wer": 0.6680634540556719,
"step": 1048
},
{
"epoch": 131.23,
"learning_rate": 0.00013924050632911395,
"loss": 0.6737,
"step": 1050
},
{
"epoch": 131.9,
"eval_loss": 2.263141632080078,
"eval_runtime": 7.8874,
"eval_samples_per_second": 7.987,
"eval_steps_per_second": 1.014,
"eval_wer": 0.6761448668063454,
"step": 1056
},
{
"epoch": 132.45,
"learning_rate": 0.00013670886075949366,
"loss": 0.6237,
"step": 1060
},
{
"epoch": 132.9,
"eval_loss": 2.2553627490997314,
"eval_runtime": 7.755,
"eval_samples_per_second": 8.124,
"eval_steps_per_second": 1.032,
"eval_wer": 0.6620772223885064,
"step": 1064
},
{
"epoch": 133.68,
"learning_rate": 0.00013417721518987343,
"loss": 0.6468,
"step": 1070
},
{
"epoch": 133.9,
"eval_loss": 2.2538866996765137,
"eval_runtime": 7.7947,
"eval_samples_per_second": 8.082,
"eval_steps_per_second": 1.026,
"eval_wer": 0.6668662077222388,
"step": 1072
},
{
"epoch": 134.9,
"learning_rate": 0.00013164556962025315,
"loss": 0.5948,
"step": 1080
},
{
"epoch": 134.9,
"eval_loss": 2.2463722229003906,
"eval_runtime": 7.7617,
"eval_samples_per_second": 8.117,
"eval_steps_per_second": 1.031,
"eval_wer": 0.6516013169709668,
"step": 1080
},
{
"epoch": 135.9,
"eval_loss": 2.349128484725952,
"eval_runtime": 7.7593,
"eval_samples_per_second": 8.119,
"eval_steps_per_second": 1.031,
"eval_wer": 0.6620772223885064,
"step": 1088
},
{
"epoch": 136.23,
"learning_rate": 0.00012911392405063292,
"loss": 0.6645,
"step": 1090
},
{
"epoch": 136.9,
"eval_loss": 2.2536532878875732,
"eval_runtime": 7.8036,
"eval_samples_per_second": 8.073,
"eval_steps_per_second": 1.025,
"eval_wer": 0.6620772223885064,
"step": 1096
},
{
"epoch": 137.45,
"learning_rate": 0.00012658227848101267,
"loss": 0.6195,
"step": 1100
},
{
"epoch": 137.9,
"eval_loss": 2.371696710586548,
"eval_runtime": 7.7793,
"eval_samples_per_second": 8.098,
"eval_steps_per_second": 1.028,
"eval_wer": 0.6665668961388805,
"step": 1104
},
{
"epoch": 138.68,
"learning_rate": 0.0001240506329113924,
"loss": 0.6317,
"step": 1110
},
{
"epoch": 138.9,
"eval_loss": 2.2024903297424316,
"eval_runtime": 7.8765,
"eval_samples_per_second": 7.998,
"eval_steps_per_second": 1.016,
"eval_wer": 0.6551930559712661,
"step": 1112
},
{
"epoch": 139.9,
"learning_rate": 0.00012151898734177217,
"loss": 0.6336,
"step": 1120
},
{
"epoch": 139.9,
"eval_loss": 2.142206907272339,
"eval_runtime": 7.8378,
"eval_samples_per_second": 8.038,
"eval_steps_per_second": 1.021,
"eval_wer": 0.6623765339718647,
"step": 1120
},
{
"epoch": 140.9,
"eval_loss": 2.106228828430176,
"eval_runtime": 7.7968,
"eval_samples_per_second": 8.08,
"eval_steps_per_second": 1.026,
"eval_wer": 0.660580664471715,
"step": 1128
},
{
"epoch": 141.23,
"learning_rate": 0.0001189873417721519,
"loss": 0.664,
"step": 1130
},
{
"epoch": 141.9,
"eval_loss": 2.2253739833831787,
"eval_runtime": 7.7492,
"eval_samples_per_second": 8.13,
"eval_steps_per_second": 1.032,
"eval_wer": 0.6596827297216402,
"step": 1136
},
{
"epoch": 142.45,
"learning_rate": 0.00011645569620253166,
"loss": 0.6047,
"step": 1140
},
{
"epoch": 142.9,
"eval_loss": 2.322563886642456,
"eval_runtime": 7.7874,
"eval_samples_per_second": 8.09,
"eval_steps_per_second": 1.027,
"eval_wer": 0.653995809637833,
"step": 1144
},
{
"epoch": 143.68,
"learning_rate": 0.0001139240506329114,
"loss": 0.6173,
"step": 1150
},
{
"epoch": 143.9,
"eval_loss": 2.227854013442993,
"eval_runtime": 7.8279,
"eval_samples_per_second": 8.048,
"eval_steps_per_second": 1.022,
"eval_wer": 0.6683627656390302,
"step": 1152
},
{
"epoch": 144.9,
"learning_rate": 0.00011139240506329114,
"loss": 0.6466,
"step": 1160
},
{
"epoch": 144.9,
"eval_loss": 2.1866044998168945,
"eval_runtime": 7.7744,
"eval_samples_per_second": 8.104,
"eval_steps_per_second": 1.029,
"eval_wer": 0.657288237054774,
"step": 1160
},
{
"epoch": 145.9,
"eval_loss": 2.2489023208618164,
"eval_runtime": 7.7715,
"eval_samples_per_second": 8.107,
"eval_steps_per_second": 1.029,
"eval_wer": 0.6590841065549237,
"step": 1168
},
{
"epoch": 146.23,
"learning_rate": 0.00010886075949367089,
"loss": 0.6585,
"step": 1170
},
{
"epoch": 146.9,
"eval_loss": 2.2273900508880615,
"eval_runtime": 7.821,
"eval_samples_per_second": 8.055,
"eval_steps_per_second": 1.023,
"eval_wer": 0.6480095779706675,
"step": 1176
},
{
"epoch": 147.45,
"learning_rate": 0.00010632911392405063,
"loss": 0.6244,
"step": 1180
},
{
"epoch": 147.9,
"eval_loss": 2.1959400177001953,
"eval_runtime": 7.8697,
"eval_samples_per_second": 8.005,
"eval_steps_per_second": 1.017,
"eval_wer": 0.662675845555223,
"step": 1184
},
{
"epoch": 148.68,
"learning_rate": 0.00010379746835443039,
"loss": 0.6527,
"step": 1190
},
{
"epoch": 148.9,
"eval_loss": 2.2115025520324707,
"eval_runtime": 7.8828,
"eval_samples_per_second": 7.992,
"eval_steps_per_second": 1.015,
"eval_wer": 0.6593834181382819,
"step": 1192
},
{
"epoch": 149.9,
"learning_rate": 0.00010126582278481013,
"loss": 0.6247,
"step": 1200
},
{
"epoch": 149.9,
"eval_loss": 2.2804923057556152,
"eval_runtime": 7.7687,
"eval_samples_per_second": 8.109,
"eval_steps_per_second": 1.03,
"eval_wer": 0.6620772223885064,
"step": 1200
},
{
"epoch": 150.9,
"eval_loss": 2.2128920555114746,
"eval_runtime": 7.7584,
"eval_samples_per_second": 8.12,
"eval_steps_per_second": 1.031,
"eval_wer": 0.6578868602214906,
"step": 1208
},
{
"epoch": 151.23,
"learning_rate": 9.873417721518988e-05,
"loss": 0.6614,
"step": 1210
},
{
"epoch": 151.9,
"eval_loss": 2.23846697807312,
"eval_runtime": 7.7588,
"eval_samples_per_second": 8.12,
"eval_steps_per_second": 1.031,
"eval_wer": 0.6635737803052978,
"step": 1216
},
{
"epoch": 152.45,
"learning_rate": 9.620253164556962e-05,
"loss": 0.6309,
"step": 1220
},
{
"epoch": 152.9,
"eval_loss": 2.275683641433716,
"eval_runtime": 7.8149,
"eval_samples_per_second": 8.061,
"eval_steps_per_second": 1.024,
"eval_wer": 0.6614785992217899,
"step": 1224
},
{
"epoch": 153.68,
"learning_rate": 9.367088607594936e-05,
"loss": 0.6501,
"step": 1230
},
{
"epoch": 153.9,
"eval_loss": 2.3265960216522217,
"eval_runtime": 7.8195,
"eval_samples_per_second": 8.057,
"eval_steps_per_second": 1.023,
"eval_wer": 0.6647710266387309,
"step": 1232
},
{
"epoch": 154.9,
"learning_rate": 9.113924050632912e-05,
"loss": 0.5869,
"step": 1240
},
{
"epoch": 154.9,
"eval_loss": 2.336057662963867,
"eval_runtime": 7.8329,
"eval_samples_per_second": 8.043,
"eval_steps_per_second": 1.021,
"eval_wer": 0.6632744687219395,
"step": 1240
},
{
"epoch": 155.9,
"eval_loss": 2.345245838165283,
"eval_runtime": 7.7323,
"eval_samples_per_second": 8.148,
"eval_steps_per_second": 1.035,
"eval_wer": 0.653995809637833,
"step": 1248
},
{
"epoch": 156.23,
"learning_rate": 8.860759493670887e-05,
"loss": 0.6676,
"step": 1250
},
{
"epoch": 156.9,
"eval_loss": 2.280003070831299,
"eval_runtime": 7.8173,
"eval_samples_per_second": 8.059,
"eval_steps_per_second": 1.023,
"eval_wer": 0.6614785992217899,
"step": 1256
},
{
"epoch": 157.45,
"learning_rate": 8.607594936708861e-05,
"loss": 0.6494,
"step": 1260
},
{
"epoch": 157.9,
"eval_loss": 2.305755376815796,
"eval_runtime": 7.8527,
"eval_samples_per_second": 8.023,
"eval_steps_per_second": 1.019,
"eval_wer": 0.6662675845555223,
"step": 1264
},
{
"epoch": 158.68,
"learning_rate": 8.354430379746835e-05,
"loss": 0.6017,
"step": 1270
},
{
"epoch": 158.9,
"eval_loss": 2.2905781269073486,
"eval_runtime": 7.8309,
"eval_samples_per_second": 8.045,
"eval_steps_per_second": 1.022,
"eval_wer": 0.6662675845555223,
"step": 1272
},
{
"epoch": 159.9,
"learning_rate": 8.10126582278481e-05,
"loss": 0.6266,
"step": 1280
},
{
"epoch": 159.9,
"eval_loss": 2.2315995693206787,
"eval_runtime": 7.7807,
"eval_samples_per_second": 8.097,
"eval_steps_per_second": 1.028,
"eval_wer": 0.6596827297216402,
"step": 1280
},
{
"epoch": 160.9,
"eval_loss": 2.188622236251831,
"eval_runtime": 7.8175,
"eval_samples_per_second": 8.059,
"eval_steps_per_second": 1.023,
"eval_wer": 0.6710565698892547,
"step": 1288
},
{
"epoch": 161.23,
"learning_rate": 7.848101265822784e-05,
"loss": 0.6704,
"step": 1290
},
{
"epoch": 161.9,
"eval_loss": 2.3184380531311035,
"eval_runtime": 7.8037,
"eval_samples_per_second": 8.073,
"eval_steps_per_second": 1.025,
"eval_wer": 0.6590841065549237,
"step": 1296
},
{
"epoch": 162.45,
"learning_rate": 7.59493670886076e-05,
"loss": 0.6239,
"step": 1300
},
{
"epoch": 162.9,
"eval_loss": 2.3544297218322754,
"eval_runtime": 7.7214,
"eval_samples_per_second": 8.159,
"eval_steps_per_second": 1.036,
"eval_wer": 0.6617779108051481,
"step": 1304
},
{
"epoch": 163.68,
"learning_rate": 7.341772151898734e-05,
"loss": 0.5997,
"step": 1310
},
{
"epoch": 163.9,
"eval_loss": 2.298438310623169,
"eval_runtime": 7.7258,
"eval_samples_per_second": 8.155,
"eval_steps_per_second": 1.035,
"eval_wer": 0.6677641424723136,
"step": 1312
},
{
"epoch": 164.9,
"learning_rate": 7.088607594936709e-05,
"loss": 0.6228,
"step": 1320
},
{
"epoch": 164.9,
"eval_loss": 2.293006658554077,
"eval_runtime": 7.7223,
"eval_samples_per_second": 8.158,
"eval_steps_per_second": 1.036,
"eval_wer": 0.669260700389105,
"step": 1320
},
{
"epoch": 165.9,
"eval_loss": 2.3272392749786377,
"eval_runtime": 7.7917,
"eval_samples_per_second": 8.086,
"eval_steps_per_second": 1.027,
"eval_wer": 0.6584854833882071,
"step": 1328
},
{
"epoch": 166.23,
"learning_rate": 6.835443037974683e-05,
"loss": 0.6683,
"step": 1330
},
{
"epoch": 166.9,
"eval_loss": 2.3456509113311768,
"eval_runtime": 7.7579,
"eval_samples_per_second": 8.121,
"eval_steps_per_second": 1.031,
"eval_wer": 0.657288237054774,
"step": 1336
},
{
"epoch": 167.45,
"learning_rate": 6.582278481012658e-05,
"loss": 0.598,
"step": 1340
},
{
"epoch": 167.9,
"eval_loss": 2.2177622318267822,
"eval_runtime": 7.8139,
"eval_samples_per_second": 8.063,
"eval_steps_per_second": 1.024,
"eval_wer": 0.6638730918886561,
"step": 1344
},
{
"epoch": 168.68,
"learning_rate": 6.329113924050633e-05,
"loss": 0.6164,
"step": 1350
},
{
"epoch": 168.9,
"eval_loss": 2.1438896656036377,
"eval_runtime": 7.7254,
"eval_samples_per_second": 8.155,
"eval_steps_per_second": 1.036,
"eval_wer": 0.6542951212211913,
"step": 1352
},
{
"epoch": 169.9,
"learning_rate": 6.0759493670886084e-05,
"loss": 0.5963,
"step": 1360
},
{
"epoch": 169.9,
"eval_loss": 2.1238651275634766,
"eval_runtime": 7.8668,
"eval_samples_per_second": 8.008,
"eval_steps_per_second": 1.017,
"eval_wer": 0.6513020053876085,
"step": 1360
},
{
"epoch": 170.9,
"eval_loss": 2.1392319202423096,
"eval_runtime": 7.7989,
"eval_samples_per_second": 8.078,
"eval_steps_per_second": 1.026,
"eval_wer": 0.6593834181382819,
"step": 1368
},
{
"epoch": 171.23,
"learning_rate": 5.822784810126583e-05,
"loss": 0.6782,
"step": 1370
},
{
"epoch": 171.9,
"eval_loss": 2.129168748855591,
"eval_runtime": 7.8187,
"eval_samples_per_second": 8.058,
"eval_steps_per_second": 1.023,
"eval_wer": 0.6578868602214906,
"step": 1376
},
{
"epoch": 172.45,
"learning_rate": 5.569620253164557e-05,
"loss": 0.5783,
"step": 1380
},
{
"epoch": 172.9,
"eval_loss": 2.1256933212280273,
"eval_runtime": 7.8785,
"eval_samples_per_second": 7.996,
"eval_steps_per_second": 1.015,
"eval_wer": 0.6596827297216402,
"step": 1384
},
{
"epoch": 173.68,
"learning_rate": 5.3164556962025316e-05,
"loss": 0.6087,
"step": 1390
},
{
"epoch": 173.9,
"eval_loss": 2.125344753265381,
"eval_runtime": 7.7825,
"eval_samples_per_second": 8.095,
"eval_steps_per_second": 1.028,
"eval_wer": 0.6593834181382819,
"step": 1392
},
{
"epoch": 174.9,
"learning_rate": 5.0632911392405066e-05,
"loss": 0.6045,
"step": 1400
},
{
"epoch": 174.9,
"eval_loss": 2.133322238922119,
"eval_runtime": 7.8569,
"eval_samples_per_second": 8.018,
"eval_steps_per_second": 1.018,
"eval_wer": 0.6560909907213409,
"step": 1400
},
{
"epoch": 175.9,
"eval_loss": 2.1041812896728516,
"eval_runtime": 7.7837,
"eval_samples_per_second": 8.094,
"eval_steps_per_second": 1.028,
"eval_wer": 0.650703382220892,
"step": 1408
},
{
"epoch": 176.23,
"learning_rate": 4.810126582278481e-05,
"loss": 0.6299,
"step": 1410
},
{
"epoch": 176.9,
"eval_loss": 2.111027956008911,
"eval_runtime": 7.8074,
"eval_samples_per_second": 8.069,
"eval_steps_per_second": 1.025,
"eval_wer": 0.6569889254714157,
"step": 1416
},
{
"epoch": 177.45,
"learning_rate": 4.556962025316456e-05,
"loss": 0.6401,
"step": 1420
},
{
"epoch": 177.9,
"eval_loss": 2.116133451461792,
"eval_runtime": 7.7361,
"eval_samples_per_second": 8.144,
"eval_steps_per_second": 1.034,
"eval_wer": 0.6611792876384316,
"step": 1424
},
{
"epoch": 178.68,
"learning_rate": 4.3037974683544305e-05,
"loss": 0.622,
"step": 1430
},
{
"epoch": 178.9,
"eval_loss": 2.168447494506836,
"eval_runtime": 7.8421,
"eval_samples_per_second": 8.034,
"eval_steps_per_second": 1.02,
"eval_wer": 0.6483088895540258,
"step": 1432
},
{
"epoch": 179.9,
"learning_rate": 4.050632911392405e-05,
"loss": 0.599,
"step": 1440
},
{
"epoch": 179.9,
"eval_loss": 2.190560817718506,
"eval_runtime": 7.8024,
"eval_samples_per_second": 8.074,
"eval_steps_per_second": 1.025,
"eval_wer": 0.6551930559712661,
"step": 1440
},
{
"epoch": 180.9,
"eval_loss": 2.2257890701293945,
"eval_runtime": 7.7768,
"eval_samples_per_second": 8.101,
"eval_steps_per_second": 1.029,
"eval_wer": 0.6492068243041006,
"step": 1448
},
{
"epoch": 181.23,
"learning_rate": 3.79746835443038e-05,
"loss": 0.6516,
"step": 1450
},
{
"epoch": 181.9,
"eval_loss": 2.203824758529663,
"eval_runtime": 7.8475,
"eval_samples_per_second": 8.028,
"eval_steps_per_second": 1.019,
"eval_wer": 0.6536964980544747,
"step": 1456
},
{
"epoch": 182.45,
"learning_rate": 3.5443037974683544e-05,
"loss": 0.5907,
"step": 1460
},
{
"epoch": 182.9,
"eval_loss": 2.194875955581665,
"eval_runtime": 7.95,
"eval_samples_per_second": 7.925,
"eval_steps_per_second": 1.006,
"eval_wer": 0.6533971864711164,
"step": 1464
},
{
"epoch": 183.68,
"learning_rate": 3.291139240506329e-05,
"loss": 0.5979,
"step": 1470
},
{
"epoch": 183.9,
"eval_loss": 2.196150541305542,
"eval_runtime": 7.8608,
"eval_samples_per_second": 8.014,
"eval_steps_per_second": 1.018,
"eval_wer": 0.6530978748877582,
"step": 1472
},
{
"epoch": 184.9,
"learning_rate": 3.0379746835443042e-05,
"loss": 0.6064,
"step": 1480
},
{
"epoch": 184.9,
"eval_loss": 2.1942551136016846,
"eval_runtime": 7.781,
"eval_samples_per_second": 8.097,
"eval_steps_per_second": 1.028,
"eval_wer": 0.6498054474708171,
"step": 1480
},
{
"epoch": 185.9,
"eval_loss": 2.1707868576049805,
"eval_runtime": 7.9327,
"eval_samples_per_second": 7.942,
"eval_steps_per_second": 1.008,
"eval_wer": 0.6524992517210416,
"step": 1488
},
{
"epoch": 186.23,
"learning_rate": 2.7848101265822786e-05,
"loss": 0.6363,
"step": 1490
},
{
"epoch": 186.9,
"eval_loss": 2.1659958362579346,
"eval_runtime": 7.8392,
"eval_samples_per_second": 8.037,
"eval_steps_per_second": 1.021,
"eval_wer": 0.6560909907213409,
"step": 1496
},
{
"epoch": 187.45,
"learning_rate": 2.5316455696202533e-05,
"loss": 0.6257,
"step": 1500
},
{
"epoch": 187.9,
"eval_loss": 2.174118757247925,
"eval_runtime": 7.8051,
"eval_samples_per_second": 8.072,
"eval_steps_per_second": 1.025,
"eval_wer": 0.657288237054774,
"step": 1504
},
{
"epoch": 188.68,
"learning_rate": 2.278481012658228e-05,
"loss": 0.6128,
"step": 1510
},
{
"epoch": 188.9,
"eval_loss": 2.1725566387176514,
"eval_runtime": 7.7709,
"eval_samples_per_second": 8.107,
"eval_steps_per_second": 1.029,
"eval_wer": 0.6563903023046992,
"step": 1512
},
{
"epoch": 189.9,
"learning_rate": 2.0253164556962025e-05,
"loss": 0.602,
"step": 1520
},
{
"epoch": 189.9,
"eval_loss": 2.168877124786377,
"eval_runtime": 7.9172,
"eval_samples_per_second": 7.957,
"eval_steps_per_second": 1.01,
"eval_wer": 0.6554923675546244,
"step": 1520
},
{
"epoch": 190.9,
"eval_loss": 2.170177936553955,
"eval_runtime": 7.8092,
"eval_samples_per_second": 8.067,
"eval_steps_per_second": 1.024,
"eval_wer": 0.6566896138880575,
"step": 1528
},
{
"epoch": 191.23,
"learning_rate": 1.7721518987341772e-05,
"loss": 0.645,
"step": 1530
},
{
"epoch": 191.9,
"eval_loss": 2.1751959323883057,
"eval_runtime": 7.9351,
"eval_samples_per_second": 7.939,
"eval_steps_per_second": 1.008,
"eval_wer": 0.6590841065549237,
"step": 1536
},
{
"epoch": 192.45,
"learning_rate": 1.5189873417721521e-05,
"loss": 0.5916,
"step": 1540
},
{
"epoch": 192.9,
"eval_loss": 2.190694570541382,
"eval_runtime": 7.7664,
"eval_samples_per_second": 8.112,
"eval_steps_per_second": 1.03,
"eval_wer": 0.6560909907213409,
"step": 1544
},
{
"epoch": 193.68,
"learning_rate": 1.2658227848101267e-05,
"loss": 0.5853,
"step": 1550
},
{
"epoch": 193.9,
"eval_loss": 2.1865837574005127,
"eval_runtime": 7.7908,
"eval_samples_per_second": 8.086,
"eval_steps_per_second": 1.027,
"eval_wer": 0.6545944328045495,
"step": 1552
},
{
"epoch": 194.9,
"learning_rate": 1.0126582278481012e-05,
"loss": 0.5735,
"step": 1560
},
{
"epoch": 194.9,
"eval_loss": 2.1829705238342285,
"eval_runtime": 7.8222,
"eval_samples_per_second": 8.054,
"eval_steps_per_second": 1.023,
"eval_wer": 0.6554923675546244,
"step": 1560
},
{
"epoch": 195.9,
"eval_loss": 2.176032781600952,
"eval_runtime": 7.8048,
"eval_samples_per_second": 8.072,
"eval_steps_per_second": 1.025,
"eval_wer": 0.6563903023046992,
"step": 1568
},
{
"epoch": 196.23,
"learning_rate": 7.5949367088607605e-06,
"loss": 0.6294,
"step": 1570
},
{
"epoch": 196.9,
"eval_loss": 2.1679303646087646,
"eval_runtime": 7.925,
"eval_samples_per_second": 7.949,
"eval_steps_per_second": 1.009,
"eval_wer": 0.6578868602214906,
"step": 1576
},
{
"epoch": 197.45,
"learning_rate": 5.063291139240506e-06,
"loss": 0.6149,
"step": 1580
},
{
"epoch": 197.9,
"eval_loss": 2.1631834506988525,
"eval_runtime": 7.8984,
"eval_samples_per_second": 7.976,
"eval_steps_per_second": 1.013,
"eval_wer": 0.6575875486381323,
"step": 1584
},
{
"epoch": 198.68,
"learning_rate": 2.531645569620253e-06,
"loss": 0.5761,
"step": 1590
},
{
"epoch": 198.9,
"eval_loss": 2.1613857746124268,
"eval_runtime": 7.8089,
"eval_samples_per_second": 8.068,
"eval_steps_per_second": 1.024,
"eval_wer": 0.657288237054774,
"step": 1592
},
{
"epoch": 199.9,
"learning_rate": 0.0,
"loss": 0.6111,
"step": 1600
},
{
"epoch": 199.9,
"eval_loss": 2.1611926555633545,
"eval_runtime": 7.7531,
"eval_samples_per_second": 8.126,
"eval_steps_per_second": 1.032,
"eval_wer": 0.6575875486381323,
"step": 1600
},
{
"epoch": 199.9,
"step": 1600,
"total_flos": 1.1848602213269387e+19,
"train_loss": 0.7314322146773339,
"train_runtime": 18544.7872,
"train_samples_per_second": 6.072,
"train_steps_per_second": 0.086
}
],
"max_steps": 1600,
"num_train_epochs": 200,
"total_flos": 1.1848602213269387e+19,
"trial_name": null,
"trial_params": null
}