gary109's picture
End of training
25a3ff0
{
"best_metric": 0.5104931592941284,
"best_model_checkpoint": "ai-light-dance_singing3_ft_wav2vec2-large-xlsr-53-v2/checkpoint-1872",
"epoch": 49.996539792387544,
"global_step": 3600,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.14,
"learning_rate": 1.0000000000000002e-06,
"loss": 0.6213,
"step": 10
},
{
"epoch": 0.28,
"learning_rate": 1.9000000000000002e-06,
"loss": 0.639,
"step": 20
},
{
"epoch": 0.42,
"learning_rate": 2.9e-06,
"loss": 0.6243,
"step": 30
},
{
"epoch": 0.55,
"learning_rate": 3.900000000000001e-06,
"loss": 0.6178,
"step": 40
},
{
"epoch": 0.69,
"learning_rate": 4.9000000000000005e-06,
"loss": 0.5815,
"step": 50
},
{
"epoch": 0.83,
"learning_rate": 4.9887323943661975e-06,
"loss": 0.5894,
"step": 60
},
{
"epoch": 0.97,
"learning_rate": 4.974647887323944e-06,
"loss": 0.6154,
"step": 70
},
{
"epoch": 1.0,
"eval_loss": 0.526593804359436,
"eval_runtime": 128.5544,
"eval_samples_per_second": 4.138,
"eval_steps_per_second": 0.521,
"eval_wer": 0.2550620299543614,
"step": 72
},
{
"epoch": 1.11,
"learning_rate": 4.96056338028169e-06,
"loss": 0.6172,
"step": 80
},
{
"epoch": 1.25,
"learning_rate": 4.946478873239437e-06,
"loss": 0.6082,
"step": 90
},
{
"epoch": 1.39,
"learning_rate": 4.932394366197184e-06,
"loss": 0.5951,
"step": 100
},
{
"epoch": 1.53,
"learning_rate": 4.91830985915493e-06,
"loss": 0.6139,
"step": 110
},
{
"epoch": 1.66,
"learning_rate": 4.904225352112677e-06,
"loss": 0.5957,
"step": 120
},
{
"epoch": 1.8,
"learning_rate": 4.890140845070423e-06,
"loss": 0.6248,
"step": 130
},
{
"epoch": 1.94,
"learning_rate": 4.876056338028169e-06,
"loss": 0.5958,
"step": 140
},
{
"epoch": 2.0,
"eval_loss": 0.5272348523139954,
"eval_runtime": 129.1192,
"eval_samples_per_second": 4.12,
"eval_steps_per_second": 0.519,
"eval_wer": 0.2585974159542328,
"step": 144
},
{
"epoch": 2.08,
"learning_rate": 4.861971830985916e-06,
"loss": 0.6125,
"step": 150
},
{
"epoch": 2.22,
"learning_rate": 4.847887323943662e-06,
"loss": 0.6002,
"step": 160
},
{
"epoch": 2.36,
"learning_rate": 4.833802816901409e-06,
"loss": 0.5946,
"step": 170
},
{
"epoch": 2.5,
"learning_rate": 4.819718309859156e-06,
"loss": 0.586,
"step": 180
},
{
"epoch": 2.64,
"learning_rate": 4.805633802816902e-06,
"loss": 0.5792,
"step": 190
},
{
"epoch": 2.78,
"learning_rate": 4.7915492957746485e-06,
"loss": 0.5761,
"step": 200
},
{
"epoch": 2.91,
"learning_rate": 4.777464788732395e-06,
"loss": 0.5825,
"step": 210
},
{
"epoch": 3.0,
"eval_loss": 0.5249173641204834,
"eval_runtime": 127.7312,
"eval_samples_per_second": 4.165,
"eval_steps_per_second": 0.525,
"eval_wer": 0.25866169569968506,
"step": 216
},
{
"epoch": 3.06,
"learning_rate": 4.763380281690141e-06,
"loss": 0.5987,
"step": 220
},
{
"epoch": 3.19,
"learning_rate": 4.749295774647888e-06,
"loss": 0.5777,
"step": 230
},
{
"epoch": 3.33,
"learning_rate": 4.735211267605635e-06,
"loss": 0.61,
"step": 240
},
{
"epoch": 3.47,
"learning_rate": 4.721126760563381e-06,
"loss": 0.5833,
"step": 250
},
{
"epoch": 3.61,
"learning_rate": 4.707042253521127e-06,
"loss": 0.5848,
"step": 260
},
{
"epoch": 3.75,
"learning_rate": 4.692957746478873e-06,
"loss": 0.5808,
"step": 270
},
{
"epoch": 3.89,
"learning_rate": 4.6788732394366195e-06,
"loss": 0.5717,
"step": 280
},
{
"epoch": 4.0,
"eval_loss": 0.5236164927482605,
"eval_runtime": 127.5564,
"eval_samples_per_second": 4.171,
"eval_steps_per_second": 0.525,
"eval_wer": 0.2570547020633798,
"step": 288
},
{
"epoch": 4.03,
"learning_rate": 4.664788732394367e-06,
"loss": 0.6055,
"step": 290
},
{
"epoch": 4.17,
"learning_rate": 4.650704225352113e-06,
"loss": 0.5704,
"step": 300
},
{
"epoch": 4.3,
"learning_rate": 4.6366197183098594e-06,
"loss": 0.5835,
"step": 310
},
{
"epoch": 4.44,
"learning_rate": 4.622535211267606e-06,
"loss": 0.5677,
"step": 320
},
{
"epoch": 4.58,
"learning_rate": 4.608450704225352e-06,
"loss": 0.5799,
"step": 330
},
{
"epoch": 4.72,
"learning_rate": 4.5943661971830986e-06,
"loss": 0.576,
"step": 340
},
{
"epoch": 4.86,
"learning_rate": 4.580281690140845e-06,
"loss": 0.5975,
"step": 350
},
{
"epoch": 5.0,
"learning_rate": 4.566197183098592e-06,
"loss": 0.5831,
"step": 360
},
{
"epoch": 5.0,
"eval_loss": 0.5202789306640625,
"eval_runtime": 129.1161,
"eval_samples_per_second": 4.12,
"eval_steps_per_second": 0.519,
"eval_wer": 0.25898309442694606,
"step": 360
},
{
"epoch": 5.14,
"learning_rate": 4.5521126760563385e-06,
"loss": 0.58,
"step": 370
},
{
"epoch": 5.28,
"learning_rate": 4.538028169014085e-06,
"loss": 0.5869,
"step": 380
},
{
"epoch": 5.42,
"learning_rate": 4.523943661971831e-06,
"loss": 0.5603,
"step": 390
},
{
"epoch": 5.55,
"learning_rate": 4.509859154929578e-06,
"loss": 0.5657,
"step": 400
},
{
"epoch": 5.69,
"learning_rate": 4.495774647887324e-06,
"loss": 0.5846,
"step": 410
},
{
"epoch": 5.83,
"learning_rate": 4.48169014084507e-06,
"loss": 0.5951,
"step": 420
},
{
"epoch": 5.97,
"learning_rate": 4.467605633802818e-06,
"loss": 0.5652,
"step": 430
},
{
"epoch": 6.0,
"eval_loss": 0.5126761198043823,
"eval_runtime": 126.6507,
"eval_samples_per_second": 4.201,
"eval_steps_per_second": 0.529,
"eval_wer": 0.2575046602815453,
"step": 432
},
{
"epoch": 6.11,
"learning_rate": 4.453521126760564e-06,
"loss": 0.5965,
"step": 440
},
{
"epoch": 6.25,
"learning_rate": 4.43943661971831e-06,
"loss": 0.5641,
"step": 450
},
{
"epoch": 6.39,
"learning_rate": 4.425352112676057e-06,
"loss": 0.5547,
"step": 460
},
{
"epoch": 6.53,
"learning_rate": 4.411267605633803e-06,
"loss": 0.5849,
"step": 470
},
{
"epoch": 6.66,
"learning_rate": 4.3971830985915495e-06,
"loss": 0.5665,
"step": 480
},
{
"epoch": 6.8,
"learning_rate": 4.383098591549296e-06,
"loss": 0.5666,
"step": 490
},
{
"epoch": 6.94,
"learning_rate": 4.369014084507043e-06,
"loss": 0.5665,
"step": 500
},
{
"epoch": 7.0,
"eval_loss": 0.5228902101516724,
"eval_runtime": 126.6048,
"eval_samples_per_second": 4.202,
"eval_steps_per_second": 0.529,
"eval_wer": 0.25866169569968506,
"step": 504
},
{
"epoch": 7.08,
"learning_rate": 4.3549295774647895e-06,
"loss": 0.5989,
"step": 510
},
{
"epoch": 7.22,
"learning_rate": 4.340845070422536e-06,
"loss": 0.5625,
"step": 520
},
{
"epoch": 7.36,
"learning_rate": 4.326760563380282e-06,
"loss": 0.5827,
"step": 530
},
{
"epoch": 7.5,
"learning_rate": 4.312676056338029e-06,
"loss": 0.5864,
"step": 540
},
{
"epoch": 7.64,
"learning_rate": 4.298591549295775e-06,
"loss": 0.5555,
"step": 550
},
{
"epoch": 7.78,
"learning_rate": 4.284507042253521e-06,
"loss": 0.5606,
"step": 560
},
{
"epoch": 7.91,
"learning_rate": 4.270422535211268e-06,
"loss": 0.5625,
"step": 570
},
{
"epoch": 8.0,
"eval_loss": 0.5248023867607117,
"eval_runtime": 127.7741,
"eval_samples_per_second": 4.164,
"eval_steps_per_second": 0.524,
"eval_wer": 0.25474063122710033,
"step": 576
},
{
"epoch": 8.06,
"learning_rate": 4.256338028169014e-06,
"loss": 0.5798,
"step": 580
},
{
"epoch": 8.19,
"learning_rate": 4.2422535211267605e-06,
"loss": 0.5645,
"step": 590
},
{
"epoch": 8.33,
"learning_rate": 4.228169014084507e-06,
"loss": 0.5717,
"step": 600
},
{
"epoch": 8.47,
"learning_rate": 4.214084507042254e-06,
"loss": 0.5617,
"step": 610
},
{
"epoch": 8.61,
"learning_rate": 4.2000000000000004e-06,
"loss": 0.564,
"step": 620
},
{
"epoch": 8.75,
"learning_rate": 4.185915492957747e-06,
"loss": 0.5758,
"step": 630
},
{
"epoch": 8.89,
"learning_rate": 4.171830985915493e-06,
"loss": 0.5661,
"step": 640
},
{
"epoch": 9.0,
"eval_loss": 0.5213830471038818,
"eval_runtime": 127.0111,
"eval_samples_per_second": 4.189,
"eval_steps_per_second": 0.528,
"eval_wer": 0.25576910715433565,
"step": 648
},
{
"epoch": 9.03,
"learning_rate": 4.1577464788732396e-06,
"loss": 0.6023,
"step": 650
},
{
"epoch": 9.17,
"learning_rate": 4.143661971830986e-06,
"loss": 0.5642,
"step": 660
},
{
"epoch": 9.3,
"learning_rate": 4.129577464788732e-06,
"loss": 0.5741,
"step": 670
},
{
"epoch": 9.44,
"learning_rate": 4.1154929577464795e-06,
"loss": 0.5746,
"step": 680
},
{
"epoch": 9.58,
"learning_rate": 4.101408450704226e-06,
"loss": 0.5749,
"step": 690
},
{
"epoch": 9.72,
"learning_rate": 4.087323943661972e-06,
"loss": 0.5623,
"step": 700
},
{
"epoch": 9.86,
"learning_rate": 4.073239436619719e-06,
"loss": 0.5628,
"step": 710
},
{
"epoch": 10.0,
"learning_rate": 4.059154929577465e-06,
"loss": 0.5583,
"step": 720
},
{
"epoch": 10.0,
"eval_loss": 0.5196737051010132,
"eval_runtime": 128.0441,
"eval_samples_per_second": 4.155,
"eval_steps_per_second": 0.523,
"eval_wer": 0.2582117374815196,
"step": 720
},
{
"epoch": 10.14,
"learning_rate": 4.045070422535211e-06,
"loss": 0.5656,
"step": 730
},
{
"epoch": 10.28,
"learning_rate": 4.030985915492958e-06,
"loss": 0.5687,
"step": 740
},
{
"epoch": 10.42,
"learning_rate": 4.016901408450705e-06,
"loss": 0.5569,
"step": 750
},
{
"epoch": 10.55,
"learning_rate": 4.002816901408451e-06,
"loss": 0.5771,
"step": 760
},
{
"epoch": 10.69,
"learning_rate": 3.988732394366198e-06,
"loss": 0.568,
"step": 770
},
{
"epoch": 10.83,
"learning_rate": 3.974647887323944e-06,
"loss": 0.5699,
"step": 780
},
{
"epoch": 10.97,
"learning_rate": 3.9605633802816905e-06,
"loss": 0.5605,
"step": 790
},
{
"epoch": 11.0,
"eval_loss": 0.5212803483009338,
"eval_runtime": 127.3424,
"eval_samples_per_second": 4.178,
"eval_steps_per_second": 0.526,
"eval_wer": 0.26110432602686895,
"step": 792
},
{
"epoch": 11.11,
"learning_rate": 3.946478873239437e-06,
"loss": 0.5823,
"step": 800
},
{
"epoch": 11.25,
"learning_rate": 3.932394366197183e-06,
"loss": 0.5739,
"step": 810
},
{
"epoch": 11.39,
"learning_rate": 3.9183098591549305e-06,
"loss": 0.5539,
"step": 820
},
{
"epoch": 11.53,
"learning_rate": 3.904225352112677e-06,
"loss": 0.5672,
"step": 830
},
{
"epoch": 11.66,
"learning_rate": 3.890140845070423e-06,
"loss": 0.557,
"step": 840
},
{
"epoch": 11.8,
"learning_rate": 3.87605633802817e-06,
"loss": 0.5711,
"step": 850
},
{
"epoch": 11.94,
"learning_rate": 3.861971830985915e-06,
"loss": 0.5784,
"step": 860
},
{
"epoch": 12.0,
"eval_loss": 0.5327615141868591,
"eval_runtime": 128.9244,
"eval_samples_per_second": 4.126,
"eval_steps_per_second": 0.52,
"eval_wer": 0.258340296972424,
"step": 864
},
{
"epoch": 12.08,
"learning_rate": 3.847887323943662e-06,
"loss": 0.5593,
"step": 870
},
{
"epoch": 12.22,
"learning_rate": 3.833802816901409e-06,
"loss": 0.5503,
"step": 880
},
{
"epoch": 12.36,
"learning_rate": 3.819718309859155e-06,
"loss": 0.57,
"step": 890
},
{
"epoch": 12.5,
"learning_rate": 3.8056338028169015e-06,
"loss": 0.556,
"step": 900
},
{
"epoch": 12.64,
"learning_rate": 3.791549295774648e-06,
"loss": 0.5469,
"step": 910
},
{
"epoch": 12.78,
"learning_rate": 3.7774647887323947e-06,
"loss": 0.5575,
"step": 920
},
{
"epoch": 12.91,
"learning_rate": 3.763380281690141e-06,
"loss": 0.5636,
"step": 930
},
{
"epoch": 13.0,
"eval_loss": 0.5246398448944092,
"eval_runtime": 127.8438,
"eval_samples_per_second": 4.161,
"eval_steps_per_second": 0.524,
"eval_wer": 0.2585974159542328,
"step": 936
},
{
"epoch": 13.06,
"learning_rate": 3.7492957746478874e-06,
"loss": 0.5818,
"step": 940
},
{
"epoch": 13.19,
"learning_rate": 3.7352112676056342e-06,
"loss": 0.5387,
"step": 950
},
{
"epoch": 13.33,
"learning_rate": 3.7211267605633806e-06,
"loss": 0.5792,
"step": 960
},
{
"epoch": 13.47,
"learning_rate": 3.707042253521127e-06,
"loss": 0.5543,
"step": 970
},
{
"epoch": 13.61,
"learning_rate": 3.6929577464788733e-06,
"loss": 0.5429,
"step": 980
},
{
"epoch": 13.75,
"learning_rate": 3.67887323943662e-06,
"loss": 0.5571,
"step": 990
},
{
"epoch": 13.89,
"learning_rate": 3.6647887323943665e-06,
"loss": 0.5581,
"step": 1000
},
{
"epoch": 14.0,
"eval_loss": 0.522983968257904,
"eval_runtime": 128.2074,
"eval_samples_per_second": 4.15,
"eval_steps_per_second": 0.523,
"eval_wer": 0.25461207173619593,
"step": 1008
},
{
"epoch": 14.03,
"learning_rate": 3.650704225352113e-06,
"loss": 0.5776,
"step": 1010
},
{
"epoch": 14.17,
"learning_rate": 3.6366197183098597e-06,
"loss": 0.5523,
"step": 1020
},
{
"epoch": 14.3,
"learning_rate": 3.622535211267606e-06,
"loss": 0.5603,
"step": 1030
},
{
"epoch": 14.44,
"learning_rate": 3.6084507042253524e-06,
"loss": 0.5341,
"step": 1040
},
{
"epoch": 14.58,
"learning_rate": 3.594366197183099e-06,
"loss": 0.5589,
"step": 1050
},
{
"epoch": 14.72,
"learning_rate": 3.5802816901408456e-06,
"loss": 0.5508,
"step": 1060
},
{
"epoch": 14.86,
"learning_rate": 3.566197183098592e-06,
"loss": 0.5483,
"step": 1070
},
{
"epoch": 15.0,
"learning_rate": 3.5521126760563384e-06,
"loss": 0.567,
"step": 1080
},
{
"epoch": 15.0,
"eval_loss": 0.5205003619194031,
"eval_runtime": 128.349,
"eval_samples_per_second": 4.145,
"eval_steps_per_second": 0.522,
"eval_wer": 0.2571832615542842,
"step": 1080
},
{
"epoch": 15.14,
"learning_rate": 3.538028169014085e-06,
"loss": 0.5702,
"step": 1090
},
{
"epoch": 15.28,
"learning_rate": 3.5239436619718315e-06,
"loss": 0.5812,
"step": 1100
},
{
"epoch": 15.42,
"learning_rate": 3.509859154929578e-06,
"loss": 0.5577,
"step": 1110
},
{
"epoch": 15.55,
"learning_rate": 3.4957746478873243e-06,
"loss": 0.5728,
"step": 1120
},
{
"epoch": 15.69,
"learning_rate": 3.481690140845071e-06,
"loss": 0.5317,
"step": 1130
},
{
"epoch": 15.83,
"learning_rate": 3.4676056338028175e-06,
"loss": 0.5601,
"step": 1140
},
{
"epoch": 15.97,
"learning_rate": 3.4535211267605634e-06,
"loss": 0.5586,
"step": 1150
},
{
"epoch": 16.0,
"eval_loss": 0.5258896946907043,
"eval_runtime": 126.5534,
"eval_samples_per_second": 4.204,
"eval_steps_per_second": 0.529,
"eval_wer": 0.25564054766343125,
"step": 1152
},
{
"epoch": 16.11,
"learning_rate": 3.4394366197183098e-06,
"loss": 0.5722,
"step": 1160
},
{
"epoch": 16.25,
"learning_rate": 3.4253521126760566e-06,
"loss": 0.5569,
"step": 1170
},
{
"epoch": 16.39,
"learning_rate": 3.411267605633803e-06,
"loss": 0.5507,
"step": 1180
},
{
"epoch": 16.53,
"learning_rate": 3.3971830985915493e-06,
"loss": 0.57,
"step": 1190
},
{
"epoch": 16.66,
"learning_rate": 3.3830985915492957e-06,
"loss": 0.557,
"step": 1200
},
{
"epoch": 16.8,
"learning_rate": 3.3690140845070425e-06,
"loss": 0.5366,
"step": 1210
},
{
"epoch": 16.94,
"learning_rate": 3.354929577464789e-06,
"loss": 0.5358,
"step": 1220
},
{
"epoch": 17.0,
"eval_loss": 0.5334306359291077,
"eval_runtime": 128.1209,
"eval_samples_per_second": 4.152,
"eval_steps_per_second": 0.523,
"eval_wer": 0.26046152857234683,
"step": 1224
},
{
"epoch": 17.08,
"learning_rate": 3.3408450704225353e-06,
"loss": 0.5884,
"step": 1230
},
{
"epoch": 17.22,
"learning_rate": 3.326760563380282e-06,
"loss": 0.5394,
"step": 1240
},
{
"epoch": 17.36,
"learning_rate": 3.3126760563380284e-06,
"loss": 0.5633,
"step": 1250
},
{
"epoch": 17.5,
"learning_rate": 3.298591549295775e-06,
"loss": 0.5456,
"step": 1260
},
{
"epoch": 17.64,
"learning_rate": 3.284507042253521e-06,
"loss": 0.5509,
"step": 1270
},
{
"epoch": 17.78,
"learning_rate": 3.270422535211268e-06,
"loss": 0.5746,
"step": 1280
},
{
"epoch": 17.91,
"learning_rate": 3.2563380281690144e-06,
"loss": 0.5526,
"step": 1290
},
{
"epoch": 18.0,
"eval_loss": 0.5180938839912415,
"eval_runtime": 127.6299,
"eval_samples_per_second": 4.168,
"eval_steps_per_second": 0.525,
"eval_wer": 0.25557626791797905,
"step": 1296
},
{
"epoch": 18.06,
"learning_rate": 3.2422535211267607e-06,
"loss": 0.5768,
"step": 1300
},
{
"epoch": 18.19,
"learning_rate": 3.2281690140845075e-06,
"loss": 0.5491,
"step": 1310
},
{
"epoch": 18.33,
"learning_rate": 3.214084507042254e-06,
"loss": 0.5738,
"step": 1320
},
{
"epoch": 18.47,
"learning_rate": 3.2000000000000003e-06,
"loss": 0.5564,
"step": 1330
},
{
"epoch": 18.61,
"learning_rate": 3.1859154929577467e-06,
"loss": 0.5605,
"step": 1340
},
{
"epoch": 18.75,
"learning_rate": 3.1718309859154935e-06,
"loss": 0.5443,
"step": 1350
},
{
"epoch": 18.89,
"learning_rate": 3.15774647887324e-06,
"loss": 0.5483,
"step": 1360
},
{
"epoch": 19.0,
"eval_loss": 0.5131182074546814,
"eval_runtime": 127.3437,
"eval_samples_per_second": 4.178,
"eval_steps_per_second": 0.526,
"eval_wer": 0.2562190653725011,
"step": 1368
},
{
"epoch": 19.03,
"learning_rate": 3.143661971830986e-06,
"loss": 0.5656,
"step": 1370
},
{
"epoch": 19.17,
"learning_rate": 3.129577464788733e-06,
"loss": 0.5534,
"step": 1380
},
{
"epoch": 19.3,
"learning_rate": 3.1154929577464794e-06,
"loss": 0.5568,
"step": 1390
},
{
"epoch": 19.44,
"learning_rate": 3.1014084507042258e-06,
"loss": 0.5492,
"step": 1400
},
{
"epoch": 19.58,
"learning_rate": 3.087323943661972e-06,
"loss": 0.5537,
"step": 1410
},
{
"epoch": 19.72,
"learning_rate": 3.073239436619719e-06,
"loss": 0.5541,
"step": 1420
},
{
"epoch": 19.86,
"learning_rate": 3.0591549295774653e-06,
"loss": 0.5536,
"step": 1430
},
{
"epoch": 20.0,
"learning_rate": 3.0450704225352117e-06,
"loss": 0.5487,
"step": 1440
},
{
"epoch": 20.0,
"eval_loss": 0.5178970098495483,
"eval_runtime": 128.7396,
"eval_samples_per_second": 4.132,
"eval_steps_per_second": 0.52,
"eval_wer": 0.2560905058815967,
"step": 1440
},
{
"epoch": 20.14,
"learning_rate": 3.0309859154929576e-06,
"loss": 0.551,
"step": 1450
},
{
"epoch": 20.28,
"learning_rate": 3.0169014084507044e-06,
"loss": 0.554,
"step": 1460
},
{
"epoch": 20.42,
"learning_rate": 3.002816901408451e-06,
"loss": 0.5524,
"step": 1470
},
{
"epoch": 20.55,
"learning_rate": 2.988732394366197e-06,
"loss": 0.5676,
"step": 1480
},
{
"epoch": 20.69,
"learning_rate": 2.9746478873239436e-06,
"loss": 0.5488,
"step": 1490
},
{
"epoch": 20.83,
"learning_rate": 2.9605633802816903e-06,
"loss": 0.5691,
"step": 1500
},
{
"epoch": 20.97,
"learning_rate": 2.9464788732394367e-06,
"loss": 0.5489,
"step": 1510
},
{
"epoch": 21.0,
"eval_loss": 0.525915265083313,
"eval_runtime": 128.1257,
"eval_samples_per_second": 4.152,
"eval_steps_per_second": 0.523,
"eval_wer": 0.2596258918814682,
"step": 1512
},
{
"epoch": 21.11,
"learning_rate": 2.932394366197183e-06,
"loss": 0.5522,
"step": 1520
},
{
"epoch": 21.25,
"learning_rate": 2.91830985915493e-06,
"loss": 0.5544,
"step": 1530
},
{
"epoch": 21.39,
"learning_rate": 2.9042253521126763e-06,
"loss": 0.5715,
"step": 1540
},
{
"epoch": 21.53,
"learning_rate": 2.8901408450704226e-06,
"loss": 0.5547,
"step": 1550
},
{
"epoch": 21.66,
"learning_rate": 2.876056338028169e-06,
"loss": 0.5256,
"step": 1560
},
{
"epoch": 21.8,
"learning_rate": 2.861971830985916e-06,
"loss": 0.5507,
"step": 1570
},
{
"epoch": 21.94,
"learning_rate": 2.847887323943662e-06,
"loss": 0.5582,
"step": 1580
},
{
"epoch": 22.0,
"eval_loss": 0.5199052691459656,
"eval_runtime": 128.2296,
"eval_samples_per_second": 4.149,
"eval_steps_per_second": 0.523,
"eval_wer": 0.2550620299543614,
"step": 1584
},
{
"epoch": 22.08,
"learning_rate": 2.8338028169014086e-06,
"loss": 0.5706,
"step": 1590
},
{
"epoch": 22.22,
"learning_rate": 2.8197183098591554e-06,
"loss": 0.5487,
"step": 1600
},
{
"epoch": 22.36,
"learning_rate": 2.8056338028169017e-06,
"loss": 0.5494,
"step": 1610
},
{
"epoch": 22.5,
"learning_rate": 2.791549295774648e-06,
"loss": 0.5536,
"step": 1620
},
{
"epoch": 22.64,
"learning_rate": 2.7774647887323945e-06,
"loss": 0.5469,
"step": 1630
},
{
"epoch": 22.78,
"learning_rate": 2.7633802816901413e-06,
"loss": 0.556,
"step": 1640
},
{
"epoch": 22.91,
"learning_rate": 2.7492957746478877e-06,
"loss": 0.5351,
"step": 1650
},
{
"epoch": 23.0,
"eval_loss": 0.5282993316650391,
"eval_runtime": 129.7167,
"eval_samples_per_second": 4.101,
"eval_steps_per_second": 0.517,
"eval_wer": 0.25345503631805616,
"step": 1656
},
{
"epoch": 23.06,
"learning_rate": 2.735211267605634e-06,
"loss": 0.5505,
"step": 1660
},
{
"epoch": 23.19,
"learning_rate": 2.721126760563381e-06,
"loss": 0.5448,
"step": 1670
},
{
"epoch": 23.33,
"learning_rate": 2.7070422535211272e-06,
"loss": 0.5539,
"step": 1680
},
{
"epoch": 23.47,
"learning_rate": 2.6929577464788736e-06,
"loss": 0.5401,
"step": 1690
},
{
"epoch": 23.61,
"learning_rate": 2.67887323943662e-06,
"loss": 0.5626,
"step": 1700
},
{
"epoch": 23.75,
"learning_rate": 2.6647887323943668e-06,
"loss": 0.5588,
"step": 1710
},
{
"epoch": 23.89,
"learning_rate": 2.650704225352113e-06,
"loss": 0.5572,
"step": 1720
},
{
"epoch": 24.0,
"eval_loss": 0.5120282173156738,
"eval_runtime": 127.888,
"eval_samples_per_second": 4.16,
"eval_steps_per_second": 0.524,
"eval_wer": 0.25326219708169956,
"step": 1728
},
{
"epoch": 24.03,
"learning_rate": 2.6366197183098595e-06,
"loss": 0.5649,
"step": 1730
},
{
"epoch": 24.17,
"learning_rate": 2.6225352112676055e-06,
"loss": 0.5481,
"step": 1740
},
{
"epoch": 24.3,
"learning_rate": 2.6084507042253523e-06,
"loss": 0.5478,
"step": 1750
},
{
"epoch": 24.44,
"learning_rate": 2.5943661971830986e-06,
"loss": 0.5404,
"step": 1760
},
{
"epoch": 24.58,
"learning_rate": 2.580281690140845e-06,
"loss": 0.5593,
"step": 1770
},
{
"epoch": 24.72,
"learning_rate": 2.5661971830985914e-06,
"loss": 0.5302,
"step": 1780
},
{
"epoch": 24.86,
"learning_rate": 2.552112676056338e-06,
"loss": 0.5557,
"step": 1790
},
{
"epoch": 25.0,
"learning_rate": 2.5380281690140846e-06,
"loss": 0.5467,
"step": 1800
},
{
"epoch": 25.0,
"eval_loss": 0.5175544619560242,
"eval_runtime": 129.516,
"eval_samples_per_second": 4.108,
"eval_steps_per_second": 0.517,
"eval_wer": 0.25782605900880634,
"step": 1800
},
{
"epoch": 25.14,
"learning_rate": 2.523943661971831e-06,
"loss": 0.5543,
"step": 1810
},
{
"epoch": 25.28,
"learning_rate": 2.5098591549295777e-06,
"loss": 0.55,
"step": 1820
},
{
"epoch": 25.42,
"learning_rate": 2.495774647887324e-06,
"loss": 0.5348,
"step": 1830
},
{
"epoch": 25.55,
"learning_rate": 2.4816901408450705e-06,
"loss": 0.5401,
"step": 1840
},
{
"epoch": 25.69,
"learning_rate": 2.467605633802817e-06,
"loss": 0.5341,
"step": 1850
},
{
"epoch": 25.83,
"learning_rate": 2.4535211267605637e-06,
"loss": 0.552,
"step": 1860
},
{
"epoch": 25.97,
"learning_rate": 2.43943661971831e-06,
"loss": 0.5424,
"step": 1870
},
{
"epoch": 26.0,
"eval_loss": 0.5104931592941284,
"eval_runtime": 127.2359,
"eval_samples_per_second": 4.181,
"eval_steps_per_second": 0.527,
"eval_wer": 0.2551905894452658,
"step": 1872
},
{
"epoch": 26.11,
"learning_rate": 2.4253521126760564e-06,
"loss": 0.5556,
"step": 1880
},
{
"epoch": 26.25,
"learning_rate": 2.4112676056338032e-06,
"loss": 0.546,
"step": 1890
},
{
"epoch": 26.39,
"learning_rate": 2.3971830985915496e-06,
"loss": 0.5392,
"step": 1900
},
{
"epoch": 26.53,
"learning_rate": 2.383098591549296e-06,
"loss": 0.5465,
"step": 1910
},
{
"epoch": 26.66,
"learning_rate": 2.3690140845070423e-06,
"loss": 0.5393,
"step": 1920
},
{
"epoch": 26.8,
"learning_rate": 2.354929577464789e-06,
"loss": 0.5469,
"step": 1930
},
{
"epoch": 26.94,
"learning_rate": 2.3408450704225355e-06,
"loss": 0.5344,
"step": 1940
},
{
"epoch": 27.0,
"eval_loss": 0.5212472677230835,
"eval_runtime": 128.0249,
"eval_samples_per_second": 4.155,
"eval_steps_per_second": 0.523,
"eval_wer": 0.2540978337725783,
"step": 1944
},
{
"epoch": 27.08,
"learning_rate": 2.326760563380282e-06,
"loss": 0.5647,
"step": 1950
},
{
"epoch": 27.22,
"learning_rate": 2.3126760563380287e-06,
"loss": 0.5383,
"step": 1960
},
{
"epoch": 27.36,
"learning_rate": 2.2985915492957746e-06,
"loss": 0.5333,
"step": 1970
},
{
"epoch": 27.5,
"learning_rate": 2.284507042253521e-06,
"loss": 0.5551,
"step": 1980
},
{
"epoch": 27.64,
"learning_rate": 2.270422535211268e-06,
"loss": 0.5477,
"step": 1990
},
{
"epoch": 27.78,
"learning_rate": 2.256338028169014e-06,
"loss": 0.5594,
"step": 2000
},
{
"epoch": 27.91,
"learning_rate": 2.2422535211267606e-06,
"loss": 0.5444,
"step": 2010
},
{
"epoch": 28.0,
"eval_loss": 0.5154798626899719,
"eval_runtime": 128.0303,
"eval_samples_per_second": 4.155,
"eval_steps_per_second": 0.523,
"eval_wer": 0.25557626791797905,
"step": 2016
},
{
"epoch": 28.06,
"learning_rate": 2.2281690140845074e-06,
"loss": 0.569,
"step": 2020
},
{
"epoch": 28.19,
"learning_rate": 2.2140845070422537e-06,
"loss": 0.5493,
"step": 2030
},
{
"epoch": 28.33,
"learning_rate": 2.2e-06,
"loss": 0.5485,
"step": 2040
},
{
"epoch": 28.47,
"learning_rate": 2.1859154929577465e-06,
"loss": 0.5367,
"step": 2050
},
{
"epoch": 28.61,
"learning_rate": 2.1718309859154933e-06,
"loss": 0.5487,
"step": 2060
},
{
"epoch": 28.75,
"learning_rate": 2.1577464788732397e-06,
"loss": 0.5487,
"step": 2070
},
{
"epoch": 28.89,
"learning_rate": 2.143661971830986e-06,
"loss": 0.5276,
"step": 2080
},
{
"epoch": 29.0,
"eval_loss": 0.523108959197998,
"eval_runtime": 128.0146,
"eval_samples_per_second": 4.156,
"eval_steps_per_second": 0.523,
"eval_wer": 0.2551263096998136,
"step": 2088
},
{
"epoch": 29.03,
"learning_rate": 2.129577464788733e-06,
"loss": 0.546,
"step": 2090
},
{
"epoch": 29.17,
"learning_rate": 2.115492957746479e-06,
"loss": 0.5308,
"step": 2100
},
{
"epoch": 29.3,
"learning_rate": 2.1014084507042256e-06,
"loss": 0.5303,
"step": 2110
},
{
"epoch": 29.44,
"learning_rate": 2.087323943661972e-06,
"loss": 0.5453,
"step": 2120
},
{
"epoch": 29.58,
"learning_rate": 2.0732394366197183e-06,
"loss": 0.5396,
"step": 2130
},
{
"epoch": 29.72,
"learning_rate": 2.0591549295774647e-06,
"loss": 0.5352,
"step": 2140
},
{
"epoch": 29.86,
"learning_rate": 2.0450704225352115e-06,
"loss": 0.54,
"step": 2150
},
{
"epoch": 30.0,
"learning_rate": 2.030985915492958e-06,
"loss": 0.5501,
"step": 2160
},
{
"epoch": 30.0,
"eval_loss": 0.5224459171295166,
"eval_runtime": 128.6755,
"eval_samples_per_second": 4.134,
"eval_steps_per_second": 0.521,
"eval_wer": 0.25570482740888345,
"step": 2160
},
{
"epoch": 30.14,
"learning_rate": 2.0169014084507043e-06,
"loss": 0.554,
"step": 2170
},
{
"epoch": 30.28,
"learning_rate": 2.002816901408451e-06,
"loss": 0.555,
"step": 2180
},
{
"epoch": 30.42,
"learning_rate": 1.9887323943661974e-06,
"loss": 0.5414,
"step": 2190
},
{
"epoch": 30.55,
"learning_rate": 1.974647887323944e-06,
"loss": 0.5469,
"step": 2200
},
{
"epoch": 30.69,
"learning_rate": 1.96056338028169e-06,
"loss": 0.5356,
"step": 2210
},
{
"epoch": 30.83,
"learning_rate": 1.946478873239437e-06,
"loss": 0.5483,
"step": 2220
},
{
"epoch": 30.97,
"learning_rate": 1.9323943661971834e-06,
"loss": 0.5335,
"step": 2230
},
{
"epoch": 31.0,
"eval_loss": 0.5278783440589905,
"eval_runtime": 128.5943,
"eval_samples_per_second": 4.137,
"eval_steps_per_second": 0.521,
"eval_wer": 0.2549977502089092,
"step": 2232
},
{
"epoch": 31.11,
"learning_rate": 1.9183098591549297e-06,
"loss": 0.5579,
"step": 2240
},
{
"epoch": 31.25,
"learning_rate": 1.9042253521126763e-06,
"loss": 0.5416,
"step": 2250
},
{
"epoch": 31.39,
"learning_rate": 1.8901408450704225e-06,
"loss": 0.5325,
"step": 2260
},
{
"epoch": 31.53,
"learning_rate": 1.876056338028169e-06,
"loss": 0.5376,
"step": 2270
},
{
"epoch": 31.66,
"learning_rate": 1.8619718309859157e-06,
"loss": 0.5382,
"step": 2280
},
{
"epoch": 31.8,
"learning_rate": 1.847887323943662e-06,
"loss": 0.5517,
"step": 2290
},
{
"epoch": 31.94,
"learning_rate": 1.8338028169014086e-06,
"loss": 0.5315,
"step": 2300
},
{
"epoch": 32.0,
"eval_loss": 0.515052855014801,
"eval_runtime": 128.5881,
"eval_samples_per_second": 4.137,
"eval_steps_per_second": 0.521,
"eval_wer": 0.25448351224529153,
"step": 2304
},
{
"epoch": 32.08,
"learning_rate": 1.819718309859155e-06,
"loss": 0.5712,
"step": 2310
},
{
"epoch": 32.22,
"learning_rate": 1.8056338028169016e-06,
"loss": 0.5349,
"step": 2320
},
{
"epoch": 32.36,
"learning_rate": 1.791549295774648e-06,
"loss": 0.5408,
"step": 2330
},
{
"epoch": 32.5,
"learning_rate": 1.7774647887323945e-06,
"loss": 0.5405,
"step": 2340
},
{
"epoch": 32.64,
"learning_rate": 1.7633802816901411e-06,
"loss": 0.5309,
"step": 2350
},
{
"epoch": 32.78,
"learning_rate": 1.7492957746478875e-06,
"loss": 0.5463,
"step": 2360
},
{
"epoch": 32.91,
"learning_rate": 1.735211267605634e-06,
"loss": 0.5344,
"step": 2370
},
{
"epoch": 33.0,
"eval_loss": 0.5204472541809082,
"eval_runtime": 129.9429,
"eval_samples_per_second": 4.094,
"eval_steps_per_second": 0.516,
"eval_wer": 0.2528122388635341,
"step": 2376
},
{
"epoch": 33.06,
"learning_rate": 1.7211267605633805e-06,
"loss": 0.5626,
"step": 2380
},
{
"epoch": 33.19,
"learning_rate": 1.707042253521127e-06,
"loss": 0.5423,
"step": 2390
},
{
"epoch": 33.33,
"learning_rate": 1.6929577464788734e-06,
"loss": 0.5505,
"step": 2400
},
{
"epoch": 33.47,
"learning_rate": 1.6788732394366198e-06,
"loss": 0.5354,
"step": 2410
},
{
"epoch": 33.61,
"learning_rate": 1.6647887323943662e-06,
"loss": 0.5366,
"step": 2420
},
{
"epoch": 33.75,
"learning_rate": 1.6507042253521128e-06,
"loss": 0.5445,
"step": 2430
},
{
"epoch": 33.89,
"learning_rate": 1.6366197183098591e-06,
"loss": 0.5249,
"step": 2440
},
{
"epoch": 34.0,
"eval_loss": 0.515282154083252,
"eval_runtime": 128.9615,
"eval_samples_per_second": 4.125,
"eval_steps_per_second": 0.52,
"eval_wer": 0.2542906730089349,
"step": 2448
},
{
"epoch": 34.03,
"learning_rate": 1.6225352112676057e-06,
"loss": 0.5576,
"step": 2450
},
{
"epoch": 34.17,
"learning_rate": 1.6084507042253523e-06,
"loss": 0.5375,
"step": 2460
},
{
"epoch": 34.3,
"learning_rate": 1.5943661971830987e-06,
"loss": 0.5439,
"step": 2470
},
{
"epoch": 34.44,
"learning_rate": 1.5802816901408453e-06,
"loss": 0.5376,
"step": 2480
},
{
"epoch": 34.58,
"learning_rate": 1.5661971830985917e-06,
"loss": 0.5327,
"step": 2490
},
{
"epoch": 34.72,
"learning_rate": 1.5521126760563382e-06,
"loss": 0.5283,
"step": 2500
},
{
"epoch": 34.86,
"learning_rate": 1.5380281690140846e-06,
"loss": 0.5375,
"step": 2510
},
{
"epoch": 35.0,
"learning_rate": 1.5239436619718312e-06,
"loss": 0.5478,
"step": 2520
},
{
"epoch": 35.0,
"eval_loss": 0.5154463648796082,
"eval_runtime": 129.3389,
"eval_samples_per_second": 4.113,
"eval_steps_per_second": 0.518,
"eval_wer": 0.2543549527543871,
"step": 2520
},
{
"epoch": 35.14,
"learning_rate": 1.5098591549295778e-06,
"loss": 0.526,
"step": 2530
},
{
"epoch": 35.28,
"learning_rate": 1.4957746478873242e-06,
"loss": 0.5461,
"step": 2540
},
{
"epoch": 35.42,
"learning_rate": 1.4816901408450707e-06,
"loss": 0.5357,
"step": 2550
},
{
"epoch": 35.55,
"learning_rate": 1.467605633802817e-06,
"loss": 0.5379,
"step": 2560
},
{
"epoch": 35.69,
"learning_rate": 1.4535211267605635e-06,
"loss": 0.5354,
"step": 2570
},
{
"epoch": 35.83,
"learning_rate": 1.4394366197183099e-06,
"loss": 0.5374,
"step": 2580
},
{
"epoch": 35.97,
"learning_rate": 1.4253521126760565e-06,
"loss": 0.5346,
"step": 2590
},
{
"epoch": 36.0,
"eval_loss": 0.5122731924057007,
"eval_runtime": 127.7459,
"eval_samples_per_second": 4.165,
"eval_steps_per_second": 0.524,
"eval_wer": 0.25339075657260396,
"step": 2592
},
{
"epoch": 36.11,
"learning_rate": 1.4112676056338028e-06,
"loss": 0.5522,
"step": 2600
},
{
"epoch": 36.25,
"learning_rate": 1.3971830985915494e-06,
"loss": 0.5397,
"step": 2610
},
{
"epoch": 36.39,
"learning_rate": 1.3830985915492958e-06,
"loss": 0.519,
"step": 2620
},
{
"epoch": 36.53,
"learning_rate": 1.3690140845070424e-06,
"loss": 0.5558,
"step": 2630
},
{
"epoch": 36.66,
"learning_rate": 1.354929577464789e-06,
"loss": 0.5407,
"step": 2640
},
{
"epoch": 36.8,
"learning_rate": 1.3408450704225353e-06,
"loss": 0.533,
"step": 2650
},
{
"epoch": 36.94,
"learning_rate": 1.326760563380282e-06,
"loss": 0.5436,
"step": 2660
},
{
"epoch": 37.0,
"eval_loss": 0.5210054516792297,
"eval_runtime": 129.2771,
"eval_samples_per_second": 4.115,
"eval_steps_per_second": 0.518,
"eval_wer": 0.25654046409976217,
"step": 2664
},
{
"epoch": 37.08,
"learning_rate": 1.3126760563380283e-06,
"loss": 0.564,
"step": 2670
},
{
"epoch": 37.22,
"learning_rate": 1.298591549295775e-06,
"loss": 0.5498,
"step": 2680
},
{
"epoch": 37.36,
"learning_rate": 1.2845070422535213e-06,
"loss": 0.5368,
"step": 2690
},
{
"epoch": 37.5,
"learning_rate": 1.2704225352112676e-06,
"loss": 0.5166,
"step": 2700
},
{
"epoch": 37.64,
"learning_rate": 1.256338028169014e-06,
"loss": 0.5314,
"step": 2710
},
{
"epoch": 37.78,
"learning_rate": 1.2422535211267606e-06,
"loss": 0.5411,
"step": 2720
},
{
"epoch": 37.91,
"learning_rate": 1.2281690140845072e-06,
"loss": 0.5299,
"step": 2730
},
{
"epoch": 38.0,
"eval_loss": 0.5182300806045532,
"eval_runtime": 129.021,
"eval_samples_per_second": 4.123,
"eval_steps_per_second": 0.519,
"eval_wer": 0.253712155299865,
"step": 2736
},
{
"epoch": 38.06,
"learning_rate": 1.2140845070422536e-06,
"loss": 0.5536,
"step": 2740
},
{
"epoch": 38.19,
"learning_rate": 1.2000000000000002e-06,
"loss": 0.5458,
"step": 2750
},
{
"epoch": 38.33,
"learning_rate": 1.1859154929577465e-06,
"loss": 0.5247,
"step": 2760
},
{
"epoch": 38.47,
"learning_rate": 1.1718309859154931e-06,
"loss": 0.5405,
"step": 2770
},
{
"epoch": 38.61,
"learning_rate": 1.1577464788732395e-06,
"loss": 0.547,
"step": 2780
},
{
"epoch": 38.75,
"learning_rate": 1.143661971830986e-06,
"loss": 0.5321,
"step": 2790
},
{
"epoch": 38.89,
"learning_rate": 1.1295774647887325e-06,
"loss": 0.5248,
"step": 2800
},
{
"epoch": 39.0,
"eval_loss": 0.5239952206611633,
"eval_runtime": 129.8341,
"eval_samples_per_second": 4.098,
"eval_steps_per_second": 0.516,
"eval_wer": 0.2528765186089863,
"step": 2808
},
{
"epoch": 39.03,
"learning_rate": 1.115492957746479e-06,
"loss": 0.5514,
"step": 2810
},
{
"epoch": 39.17,
"learning_rate": 1.1014084507042254e-06,
"loss": 0.5394,
"step": 2820
},
{
"epoch": 39.3,
"learning_rate": 1.0873239436619718e-06,
"loss": 0.5387,
"step": 2830
},
{
"epoch": 39.44,
"learning_rate": 1.0732394366197184e-06,
"loss": 0.513,
"step": 2840
},
{
"epoch": 39.58,
"learning_rate": 1.059154929577465e-06,
"loss": 0.5425,
"step": 2850
},
{
"epoch": 39.72,
"learning_rate": 1.0450704225352113e-06,
"loss": 0.5397,
"step": 2860
},
{
"epoch": 39.86,
"learning_rate": 1.030985915492958e-06,
"loss": 0.5407,
"step": 2870
},
{
"epoch": 40.0,
"learning_rate": 1.0169014084507043e-06,
"loss": 0.5295,
"step": 2880
},
{
"epoch": 40.0,
"eval_loss": 0.5250394940376282,
"eval_runtime": 128.5995,
"eval_samples_per_second": 4.137,
"eval_steps_per_second": 0.521,
"eval_wer": 0.2562833451179533,
"step": 2880
},
{
"epoch": 40.14,
"learning_rate": 1.0028169014084507e-06,
"loss": 0.5626,
"step": 2890
},
{
"epoch": 40.28,
"learning_rate": 9.887323943661973e-07,
"loss": 0.5362,
"step": 2900
},
{
"epoch": 40.42,
"learning_rate": 9.746478873239436e-07,
"loss": 0.5354,
"step": 2910
},
{
"epoch": 40.55,
"learning_rate": 9.605633802816902e-07,
"loss": 0.5444,
"step": 2920
},
{
"epoch": 40.69,
"learning_rate": 9.464788732394367e-07,
"loss": 0.5232,
"step": 2930
},
{
"epoch": 40.83,
"learning_rate": 9.323943661971832e-07,
"loss": 0.5378,
"step": 2940
},
{
"epoch": 40.97,
"learning_rate": 9.183098591549297e-07,
"loss": 0.5343,
"step": 2950
},
{
"epoch": 41.0,
"eval_loss": 0.5179165601730347,
"eval_runtime": 129.1365,
"eval_samples_per_second": 4.12,
"eval_steps_per_second": 0.519,
"eval_wer": 0.2536478755544128,
"step": 2952
},
{
"epoch": 41.11,
"learning_rate": 9.04225352112676e-07,
"loss": 0.5501,
"step": 2960
},
{
"epoch": 41.25,
"learning_rate": 8.901408450704225e-07,
"loss": 0.5334,
"step": 2970
},
{
"epoch": 41.39,
"learning_rate": 8.76056338028169e-07,
"loss": 0.5379,
"step": 2980
},
{
"epoch": 41.53,
"learning_rate": 8.619718309859156e-07,
"loss": 0.54,
"step": 2990
},
{
"epoch": 41.66,
"learning_rate": 8.478873239436621e-07,
"loss": 0.5446,
"step": 3000
},
{
"epoch": 41.8,
"learning_rate": 8.338028169014086e-07,
"loss": 0.5478,
"step": 3010
},
{
"epoch": 41.94,
"learning_rate": 8.19718309859155e-07,
"loss": 0.5255,
"step": 3020
},
{
"epoch": 42.0,
"eval_loss": 0.5213496685028076,
"eval_runtime": 130.2226,
"eval_samples_per_second": 4.085,
"eval_steps_per_second": 0.515,
"eval_wer": 0.2560262261361445,
"step": 3024
},
{
"epoch": 42.08,
"learning_rate": 8.056338028169015e-07,
"loss": 0.5457,
"step": 3030
},
{
"epoch": 42.22,
"learning_rate": 7.915492957746479e-07,
"loss": 0.5311,
"step": 3040
},
{
"epoch": 42.36,
"learning_rate": 7.774647887323944e-07,
"loss": 0.5355,
"step": 3050
},
{
"epoch": 42.5,
"learning_rate": 7.633802816901409e-07,
"loss": 0.5426,
"step": 3060
},
{
"epoch": 42.64,
"learning_rate": 7.492957746478873e-07,
"loss": 0.5349,
"step": 3070
},
{
"epoch": 42.78,
"learning_rate": 7.352112676056339e-07,
"loss": 0.5379,
"step": 3080
},
{
"epoch": 42.91,
"learning_rate": 7.211267605633804e-07,
"loss": 0.525,
"step": 3090
},
{
"epoch": 43.0,
"eval_loss": 0.522071123123169,
"eval_runtime": 128.4426,
"eval_samples_per_second": 4.142,
"eval_steps_per_second": 0.522,
"eval_wer": 0.2553191489361702,
"step": 3096
},
{
"epoch": 43.06,
"learning_rate": 7.070422535211269e-07,
"loss": 0.5591,
"step": 3100
},
{
"epoch": 43.19,
"learning_rate": 6.929577464788733e-07,
"loss": 0.5328,
"step": 3110
},
{
"epoch": 43.33,
"learning_rate": 6.788732394366197e-07,
"loss": 0.5427,
"step": 3120
},
{
"epoch": 43.47,
"learning_rate": 6.647887323943662e-07,
"loss": 0.5322,
"step": 3130
},
{
"epoch": 43.61,
"learning_rate": 6.507042253521127e-07,
"loss": 0.5293,
"step": 3140
},
{
"epoch": 43.75,
"learning_rate": 6.366197183098592e-07,
"loss": 0.5299,
"step": 3150
},
{
"epoch": 43.89,
"learning_rate": 6.225352112676057e-07,
"loss": 0.5345,
"step": 3160
},
{
"epoch": 44.0,
"eval_loss": 0.5230171084403992,
"eval_runtime": 129.6367,
"eval_samples_per_second": 4.104,
"eval_steps_per_second": 0.517,
"eval_wer": 0.25306935784534296,
"step": 3168
},
{
"epoch": 44.03,
"learning_rate": 6.084507042253521e-07,
"loss": 0.5468,
"step": 3170
},
{
"epoch": 44.17,
"learning_rate": 5.943661971830986e-07,
"loss": 0.5317,
"step": 3180
},
{
"epoch": 44.3,
"learning_rate": 5.802816901408451e-07,
"loss": 0.5357,
"step": 3190
},
{
"epoch": 44.44,
"learning_rate": 5.661971830985916e-07,
"loss": 0.5407,
"step": 3200
},
{
"epoch": 44.58,
"learning_rate": 5.521126760563381e-07,
"loss": 0.5388,
"step": 3210
},
{
"epoch": 44.72,
"learning_rate": 5.380281690140846e-07,
"loss": 0.5096,
"step": 3220
},
{
"epoch": 44.86,
"learning_rate": 5.23943661971831e-07,
"loss": 0.5349,
"step": 3230
},
{
"epoch": 45.0,
"learning_rate": 5.098591549295775e-07,
"loss": 0.5485,
"step": 3240
},
{
"epoch": 45.0,
"eval_loss": 0.52115797996521,
"eval_runtime": 128.2514,
"eval_samples_per_second": 4.148,
"eval_steps_per_second": 0.522,
"eval_wer": 0.253712155299865,
"step": 3240
},
{
"epoch": 45.14,
"learning_rate": 4.95774647887324e-07,
"loss": 0.536,
"step": 3250
},
{
"epoch": 45.28,
"learning_rate": 4.816901408450705e-07,
"loss": 0.5245,
"step": 3260
},
{
"epoch": 45.42,
"learning_rate": 4.6760563380281696e-07,
"loss": 0.5197,
"step": 3270
},
{
"epoch": 45.55,
"learning_rate": 4.535211267605634e-07,
"loss": 0.5556,
"step": 3280
},
{
"epoch": 45.69,
"learning_rate": 4.3943661971830987e-07,
"loss": 0.5254,
"step": 3290
},
{
"epoch": 45.83,
"learning_rate": 4.253521126760564e-07,
"loss": 0.5375,
"step": 3300
},
{
"epoch": 45.97,
"learning_rate": 4.1126760563380283e-07,
"loss": 0.5471,
"step": 3310
},
{
"epoch": 46.0,
"eval_loss": 0.5214569568634033,
"eval_runtime": 128.944,
"eval_samples_per_second": 4.126,
"eval_steps_per_second": 0.52,
"eval_wer": 0.25319791733624736,
"step": 3312
},
{
"epoch": 46.11,
"learning_rate": 3.971830985915493e-07,
"loss": 0.5549,
"step": 3320
},
{
"epoch": 46.25,
"learning_rate": 3.830985915492958e-07,
"loss": 0.5379,
"step": 3330
},
{
"epoch": 46.39,
"learning_rate": 3.690140845070423e-07,
"loss": 0.521,
"step": 3340
},
{
"epoch": 46.53,
"learning_rate": 3.5492957746478875e-07,
"loss": 0.5369,
"step": 3350
},
{
"epoch": 46.66,
"learning_rate": 3.4084507042253523e-07,
"loss": 0.5292,
"step": 3360
},
{
"epoch": 46.8,
"learning_rate": 3.267605633802817e-07,
"loss": 0.5373,
"step": 3370
},
{
"epoch": 46.94,
"learning_rate": 3.126760563380282e-07,
"loss": 0.5375,
"step": 3380
},
{
"epoch": 47.0,
"eval_loss": 0.5215560793876648,
"eval_runtime": 128.748,
"eval_samples_per_second": 4.132,
"eval_steps_per_second": 0.52,
"eval_wer": 0.2543549527543871,
"step": 3384
},
{
"epoch": 47.08,
"learning_rate": 2.985915492957747e-07,
"loss": 0.5496,
"step": 3390
},
{
"epoch": 47.22,
"learning_rate": 2.8450704225352116e-07,
"loss": 0.5405,
"step": 3400
},
{
"epoch": 47.36,
"learning_rate": 2.7042253521126764e-07,
"loss": 0.5353,
"step": 3410
},
{
"epoch": 47.5,
"learning_rate": 2.563380281690141e-07,
"loss": 0.5449,
"step": 3420
},
{
"epoch": 47.64,
"learning_rate": 2.422535211267606e-07,
"loss": 0.5415,
"step": 3430
},
{
"epoch": 47.78,
"learning_rate": 2.2816901408450706e-07,
"loss": 0.5322,
"step": 3440
},
{
"epoch": 47.91,
"learning_rate": 2.1408450704225354e-07,
"loss": 0.5229,
"step": 3450
},
{
"epoch": 48.0,
"eval_loss": 0.5208937525749207,
"eval_runtime": 128.6533,
"eval_samples_per_second": 4.135,
"eval_steps_per_second": 0.521,
"eval_wer": 0.2551263096998136,
"step": 3456
},
{
"epoch": 48.06,
"learning_rate": 2.0000000000000002e-07,
"loss": 0.5553,
"step": 3460
},
{
"epoch": 48.19,
"learning_rate": 1.8591549295774647e-07,
"loss": 0.5291,
"step": 3470
},
{
"epoch": 48.33,
"learning_rate": 1.7183098591549298e-07,
"loss": 0.5476,
"step": 3480
},
{
"epoch": 48.47,
"learning_rate": 1.5774647887323943e-07,
"loss": 0.5228,
"step": 3490
},
{
"epoch": 48.61,
"learning_rate": 1.4366197183098591e-07,
"loss": 0.5252,
"step": 3500
},
{
"epoch": 48.75,
"learning_rate": 1.295774647887324e-07,
"loss": 0.5434,
"step": 3510
},
{
"epoch": 48.89,
"learning_rate": 1.1549295774647888e-07,
"loss": 0.5218,
"step": 3520
},
{
"epoch": 49.0,
"eval_loss": 0.5215969085693359,
"eval_runtime": 129.6533,
"eval_samples_per_second": 4.103,
"eval_steps_per_second": 0.517,
"eval_wer": 0.2536478755544128,
"step": 3528
},
{
"epoch": 49.03,
"learning_rate": 1.0281690140845071e-07,
"loss": 0.5535,
"step": 3530
},
{
"epoch": 49.17,
"learning_rate": 8.873239436619719e-08,
"loss": 0.529,
"step": 3540
},
{
"epoch": 49.3,
"learning_rate": 7.464788732394367e-08,
"loss": 0.5316,
"step": 3550
},
{
"epoch": 49.44,
"learning_rate": 6.056338028169015e-08,
"loss": 0.5191,
"step": 3560
},
{
"epoch": 49.58,
"learning_rate": 4.647887323943662e-08,
"loss": 0.5505,
"step": 3570
},
{
"epoch": 49.72,
"learning_rate": 3.23943661971831e-08,
"loss": 0.5328,
"step": 3580
},
{
"epoch": 49.86,
"learning_rate": 1.830985915492958e-08,
"loss": 0.5271,
"step": 3590
},
{
"epoch": 50.0,
"learning_rate": 4.225352112676057e-09,
"loss": 0.5292,
"step": 3600
},
{
"epoch": 50.0,
"eval_loss": 0.5207646489143372,
"eval_runtime": 128.939,
"eval_samples_per_second": 4.126,
"eval_steps_per_second": 0.52,
"eval_wer": 0.25448351224529153,
"step": 3600
},
{
"epoch": 50.0,
"step": 3600,
"total_flos": 1.3601359172236221e+20,
"train_loss": 0.5537465457121531,
"train_runtime": 95750.0723,
"train_samples_per_second": 2.411,
"train_steps_per_second": 0.038
}
],
"max_steps": 3600,
"num_train_epochs": 50,
"total_flos": 1.3601359172236221e+20,
"trial_name": null,
"trial_params": null
}