alinerodrigues's picture
End of training
2e1cb14
{
"best_metric": 0.1773720234632492,
"best_model_checkpoint": "wav2vec2-xlsr-1b-mecita-portuguese-all-text-a_coisa-os_morcegos/checkpoint-1738",
"epoch": 42.0,
"global_step": 3318,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.01,
"learning_rate": 3e-05,
"loss": 25.5905,
"step": 1
},
{
"epoch": 1.0,
"eval_cer": 0.0734213636130093,
"eval_loss": 0.44948670268058777,
"eval_runtime": 19.9817,
"eval_samples_per_second": 15.614,
"eval_steps_per_second": 1.952,
"eval_wer": 0.25804706518799025,
"step": 79
},
{
"epoch": 1.27,
"learning_rate": 2.9631645569620254e-05,
"loss": 3.1482,
"step": 100
},
{
"epoch": 2.0,
"eval_cer": 0.038020860093510765,
"eval_loss": 0.2479224056005478,
"eval_runtime": 19.8794,
"eval_samples_per_second": 15.695,
"eval_steps_per_second": 1.962,
"eval_wer": 0.12036786583716527,
"step": 158
},
{
"epoch": 2.53,
"learning_rate": 2.9251898734177216e-05,
"loss": 0.4247,
"step": 200
},
{
"epoch": 3.0,
"eval_cer": 0.03447567178749422,
"eval_loss": 0.23473307490348816,
"eval_runtime": 19.9054,
"eval_samples_per_second": 15.674,
"eval_steps_per_second": 1.959,
"eval_wer": 0.10251555315120368,
"step": 237
},
{
"epoch": 3.8,
"learning_rate": 2.887215189873418e-05,
"loss": 0.3136,
"step": 300
},
{
"epoch": 4.0,
"eval_cer": 0.032214971998150335,
"eval_loss": 0.2043968290090561,
"eval_runtime": 20.064,
"eval_samples_per_second": 15.55,
"eval_steps_per_second": 1.944,
"eval_wer": 0.10170408439275087,
"step": 316
},
{
"epoch": 5.0,
"eval_cer": 0.029594615424138108,
"eval_loss": 0.19060839712619781,
"eval_runtime": 19.9461,
"eval_samples_per_second": 15.642,
"eval_steps_per_second": 1.955,
"eval_wer": 0.09304841763592102,
"step": 395
},
{
"epoch": 5.06,
"learning_rate": 2.849240506329114e-05,
"loss": 0.2985,
"step": 400
},
{
"epoch": 6.0,
"eval_cer": 0.031084622103478395,
"eval_loss": 0.2050233781337738,
"eval_runtime": 20.0744,
"eval_samples_per_second": 15.542,
"eval_steps_per_second": 1.943,
"eval_wer": 0.09629429266973222,
"step": 474
},
{
"epoch": 6.33,
"learning_rate": 2.8112658227848103e-05,
"loss": 0.2413,
"step": 500
},
{
"epoch": 7.0,
"eval_cer": 0.030879103940810768,
"eval_loss": 0.20249603688716888,
"eval_runtime": 20.1379,
"eval_samples_per_second": 15.493,
"eval_steps_per_second": 1.937,
"eval_wer": 0.09710576142818501,
"step": 553
},
{
"epoch": 7.59,
"learning_rate": 2.7732911392405062e-05,
"loss": 0.2267,
"step": 600
},
{
"epoch": 8.0,
"eval_cer": 0.02913219955813595,
"eval_loss": 0.20055869221687317,
"eval_runtime": 19.8715,
"eval_samples_per_second": 15.701,
"eval_steps_per_second": 1.963,
"eval_wer": 0.08845009467135516,
"step": 632
},
{
"epoch": 8.86,
"learning_rate": 2.7353164556962024e-05,
"loss": 0.224,
"step": 700
},
{
"epoch": 9.0,
"eval_cer": 0.029080820017469044,
"eval_loss": 0.1990896761417389,
"eval_runtime": 19.8842,
"eval_samples_per_second": 15.691,
"eval_steps_per_second": 1.961,
"eval_wer": 0.09169596970516636,
"step": 711
},
{
"epoch": 10.0,
"eval_cer": 0.02810460874479782,
"eval_loss": 0.1880808174610138,
"eval_runtime": 19.8781,
"eval_samples_per_second": 15.696,
"eval_steps_per_second": 1.962,
"eval_wer": 0.08845009467135516,
"step": 790
},
{
"epoch": 10.13,
"learning_rate": 2.697341772151899e-05,
"loss": 0.1864,
"step": 800
},
{
"epoch": 11.0,
"eval_cer": 0.02784771104146329,
"eval_loss": 0.18414445221424103,
"eval_runtime": 20.0151,
"eval_samples_per_second": 15.588,
"eval_steps_per_second": 1.949,
"eval_wer": 0.08926156342980796,
"step": 869
},
{
"epoch": 11.39,
"learning_rate": 2.659367088607595e-05,
"loss": 0.1951,
"step": 900
},
{
"epoch": 12.0,
"eval_cer": 0.028155988285464728,
"eval_loss": 0.18085478246212006,
"eval_runtime": 20.0956,
"eval_samples_per_second": 15.526,
"eval_steps_per_second": 1.941,
"eval_wer": 0.08953205301595889,
"step": 948
},
{
"epoch": 12.66,
"learning_rate": 2.621392405063291e-05,
"loss": 0.1794,
"step": 1000
},
{
"epoch": 13.0,
"eval_cer": 0.028001849663464008,
"eval_loss": 0.19231769442558289,
"eval_runtime": 20.0602,
"eval_samples_per_second": 15.553,
"eval_steps_per_second": 1.944,
"eval_wer": 0.08331079253448742,
"step": 1027
},
{
"epoch": 13.92,
"learning_rate": 2.5834177215189873e-05,
"loss": 0.1621,
"step": 1100
},
{
"epoch": 14.0,
"eval_cer": 0.027744951960129476,
"eval_loss": 0.19489158689975739,
"eval_runtime": 20.0375,
"eval_samples_per_second": 15.571,
"eval_steps_per_second": 1.946,
"eval_wer": 0.08574519880984582,
"step": 1106
},
{
"epoch": 15.0,
"eval_cer": 0.02656322252479063,
"eval_loss": 0.19287976622581482,
"eval_runtime": 20.0101,
"eval_samples_per_second": 15.592,
"eval_steps_per_second": 1.949,
"eval_wer": 0.08168785501758183,
"step": 1185
},
{
"epoch": 15.19,
"learning_rate": 2.5454430379746836e-05,
"loss": 0.1695,
"step": 1200
},
{
"epoch": 16.0,
"eval_cer": 0.02697425885012588,
"eval_loss": 0.19071535766124725,
"eval_runtime": 20.1621,
"eval_samples_per_second": 15.475,
"eval_steps_per_second": 1.934,
"eval_wer": 0.08385177170678929,
"step": 1264
},
{
"epoch": 16.46,
"learning_rate": 2.5074683544303798e-05,
"loss": 0.1528,
"step": 1300
},
{
"epoch": 17.0,
"eval_cer": 0.02856702461079998,
"eval_loss": 0.18394820392131805,
"eval_runtime": 19.8761,
"eval_samples_per_second": 15.697,
"eval_steps_per_second": 1.962,
"eval_wer": 0.09061401136056262,
"step": 1343
},
{
"epoch": 17.72,
"learning_rate": 2.469493670886076e-05,
"loss": 0.1592,
"step": 1400
},
{
"epoch": 18.0,
"eval_cer": 0.02810460874479782,
"eval_loss": 0.18656496703624725,
"eval_runtime": 20.0039,
"eval_samples_per_second": 15.597,
"eval_steps_per_second": 1.95,
"eval_wer": 0.09034352177441168,
"step": 1422
},
{
"epoch": 18.99,
"learning_rate": 2.4315189873417722e-05,
"loss": 0.1519,
"step": 1500
},
{
"epoch": 19.0,
"eval_cer": 0.027488054256794944,
"eval_loss": 0.20305851101875305,
"eval_runtime": 20.3338,
"eval_samples_per_second": 15.344,
"eval_steps_per_second": 1.918,
"eval_wer": 0.08574519880984582,
"step": 1501
},
{
"epoch": 20.0,
"eval_cer": 0.027796331500796384,
"eval_loss": 0.19475489854812622,
"eval_runtime": 19.9135,
"eval_samples_per_second": 15.668,
"eval_steps_per_second": 1.958,
"eval_wer": 0.08601568839599676,
"step": 1580
},
{
"epoch": 20.25,
"learning_rate": 2.3935443037974685e-05,
"loss": 0.1257,
"step": 1600
},
{
"epoch": 21.0,
"eval_cer": 0.026152186199455377,
"eval_loss": 0.18495479226112366,
"eval_runtime": 19.994,
"eval_samples_per_second": 15.605,
"eval_steps_per_second": 1.951,
"eval_wer": 0.08601568839599676,
"step": 1659
},
{
"epoch": 21.52,
"learning_rate": 2.3555696202531647e-05,
"loss": 0.1288,
"step": 1700
},
{
"epoch": 22.0,
"eval_cer": 0.02656322252479063,
"eval_loss": 0.1773720234632492,
"eval_runtime": 19.9911,
"eval_samples_per_second": 15.607,
"eval_steps_per_second": 1.951,
"eval_wer": 0.08439275087909115,
"step": 1738
},
{
"epoch": 22.78,
"learning_rate": 2.317594936708861e-05,
"loss": 0.115,
"step": 1800
},
{
"epoch": 23.0,
"eval_cer": 0.02651184298412372,
"eval_loss": 0.19595499336719513,
"eval_runtime": 19.9245,
"eval_samples_per_second": 15.659,
"eval_steps_per_second": 1.957,
"eval_wer": 0.08439275087909115,
"step": 1817
},
{
"epoch": 24.0,
"eval_cer": 0.025843908955453937,
"eval_loss": 0.18322429060935974,
"eval_runtime": 19.9298,
"eval_samples_per_second": 15.655,
"eval_steps_per_second": 1.957,
"eval_wer": 0.08249932377603462,
"step": 1896
},
{
"epoch": 24.05,
"learning_rate": 2.2796202531645568e-05,
"loss": 0.1223,
"step": 1900
},
{
"epoch": 25.0,
"eval_cer": 0.02610080665878847,
"eval_loss": 0.19195543229579926,
"eval_runtime": 20.0272,
"eval_samples_per_second": 15.579,
"eval_steps_per_second": 1.947,
"eval_wer": 0.08276981336218556,
"step": 1975
},
{
"epoch": 25.32,
"learning_rate": 2.2416455696202534e-05,
"loss": 0.1175,
"step": 2000
},
{
"epoch": 26.0,
"eval_cer": 0.026049427118121565,
"eval_loss": 0.1951374113559723,
"eval_runtime": 20.0587,
"eval_samples_per_second": 15.554,
"eval_steps_per_second": 1.944,
"eval_wer": 0.08033540708682715,
"step": 2054
},
{
"epoch": 26.58,
"learning_rate": 2.2036708860759496e-05,
"loss": 0.1051,
"step": 2100
},
{
"epoch": 27.0,
"eval_cer": 0.02656322252479063,
"eval_loss": 0.1995711475610733,
"eval_runtime": 20.0348,
"eval_samples_per_second": 15.573,
"eval_steps_per_second": 1.947,
"eval_wer": 0.08249932377603462,
"step": 2133
},
{
"epoch": 27.85,
"learning_rate": 2.1656962025316455e-05,
"loss": 0.1033,
"step": 2200
},
{
"epoch": 28.0,
"eval_cer": 0.027385295175461132,
"eval_loss": 0.21518437564373016,
"eval_runtime": 20.185,
"eval_samples_per_second": 15.457,
"eval_steps_per_second": 1.932,
"eval_wer": 0.08466324046524208,
"step": 2212
},
{
"epoch": 29.0,
"eval_cer": 0.02769357241946257,
"eval_loss": 0.2082461565732956,
"eval_runtime": 20.1321,
"eval_samples_per_second": 15.498,
"eval_steps_per_second": 1.937,
"eval_wer": 0.08790911549905328,
"step": 2291
},
{
"epoch": 29.11,
"learning_rate": 2.127721518987342e-05,
"loss": 0.0961,
"step": 2300
},
{
"epoch": 30.0,
"eval_cer": 0.027385295175461132,
"eval_loss": 0.2153148353099823,
"eval_runtime": 20.1045,
"eval_samples_per_second": 15.519,
"eval_steps_per_second": 1.94,
"eval_wer": 0.08547470922369489,
"step": 2370
},
{
"epoch": 30.38,
"learning_rate": 2.089746835443038e-05,
"loss": 0.1003,
"step": 2400
},
{
"epoch": 31.0,
"eval_cer": 0.028772542773467604,
"eval_loss": 0.2043757140636444,
"eval_runtime": 20.1868,
"eval_samples_per_second": 15.456,
"eval_steps_per_second": 1.932,
"eval_wer": 0.09034352177441168,
"step": 2449
},
{
"epoch": 31.65,
"learning_rate": 2.0517721518987342e-05,
"loss": 0.1129,
"step": 2500
},
{
"epoch": 32.0,
"eval_cer": 0.026768740687458253,
"eval_loss": 0.20504404604434967,
"eval_runtime": 20.2156,
"eval_samples_per_second": 15.434,
"eval_steps_per_second": 1.929,
"eval_wer": 0.08547470922369489,
"step": 2528
},
{
"epoch": 32.91,
"learning_rate": 2.0137974683544304e-05,
"loss": 0.0939,
"step": 2600
},
{
"epoch": 33.0,
"eval_cer": 0.0271283974721266,
"eval_loss": 0.20279404520988464,
"eval_runtime": 20.1612,
"eval_samples_per_second": 15.475,
"eval_steps_per_second": 1.934,
"eval_wer": 0.08601568839599676,
"step": 2607
},
{
"epoch": 34.0,
"eval_cer": 0.027436674716128037,
"eval_loss": 0.20313425362110138,
"eval_runtime": 20.5421,
"eval_samples_per_second": 15.188,
"eval_steps_per_second": 1.899,
"eval_wer": 0.08466324046524208,
"step": 2686
},
{
"epoch": 34.18,
"learning_rate": 1.9758227848101266e-05,
"loss": 0.0846,
"step": 2700
},
{
"epoch": 35.0,
"eval_cer": 0.026922879309458973,
"eval_loss": 0.20462077856063843,
"eval_runtime": 20.1988,
"eval_samples_per_second": 15.446,
"eval_steps_per_second": 1.931,
"eval_wer": 0.08222883418988369,
"step": 2765
},
{
"epoch": 35.44,
"learning_rate": 1.937848101265823e-05,
"loss": 0.083,
"step": 2800
},
{
"epoch": 36.0,
"eval_cer": 0.02651184298412372,
"eval_loss": 0.20938025414943695,
"eval_runtime": 20.4858,
"eval_samples_per_second": 15.23,
"eval_steps_per_second": 1.904,
"eval_wer": 0.08249932377603462,
"step": 2844
},
{
"epoch": 36.71,
"learning_rate": 1.8998734177215188e-05,
"loss": 0.0844,
"step": 2900
},
{
"epoch": 37.0,
"eval_cer": 0.026768740687458253,
"eval_loss": 0.21756267547607422,
"eval_runtime": 20.1565,
"eval_samples_per_second": 15.479,
"eval_steps_per_second": 1.935,
"eval_wer": 0.08195834460373276,
"step": 2923
},
{
"epoch": 37.97,
"learning_rate": 1.8618987341772153e-05,
"loss": 0.0829,
"step": 3000
},
{
"epoch": 38.0,
"eval_cer": 0.02666598160612444,
"eval_loss": 0.20818965137004852,
"eval_runtime": 20.1541,
"eval_samples_per_second": 15.481,
"eval_steps_per_second": 1.935,
"eval_wer": 0.08168785501758183,
"step": 3002
},
{
"epoch": 39.0,
"eval_cer": 0.028618404151466884,
"eval_loss": 0.2200096845626831,
"eval_runtime": 20.1838,
"eval_samples_per_second": 15.458,
"eval_steps_per_second": 1.932,
"eval_wer": 0.08926156342980796,
"step": 3081
},
{
"epoch": 39.24,
"learning_rate": 1.8239240506329115e-05,
"loss": 0.103,
"step": 3100
},
{
"epoch": 40.0,
"eval_cer": 0.027642192878795664,
"eval_loss": 0.2102428525686264,
"eval_runtime": 20.0863,
"eval_samples_per_second": 15.533,
"eval_steps_per_second": 1.942,
"eval_wer": 0.08412226129294022,
"step": 3160
},
{
"epoch": 40.51,
"learning_rate": 1.7859493670886074e-05,
"loss": 0.0728,
"step": 3200
},
{
"epoch": 41.0,
"eval_cer": 0.027077017931459692,
"eval_loss": 0.2143275886774063,
"eval_runtime": 20.2051,
"eval_samples_per_second": 15.442,
"eval_steps_per_second": 1.93,
"eval_wer": 0.08168785501758183,
"step": 3239
},
{
"epoch": 41.77,
"learning_rate": 1.747974683544304e-05,
"loss": 0.079,
"step": 3300
},
{
"epoch": 42.0,
"eval_cer": 0.02651184298412372,
"eval_loss": 0.2131078988313675,
"eval_runtime": 20.1578,
"eval_samples_per_second": 15.478,
"eval_steps_per_second": 1.935,
"eval_wer": 0.08249932377603462,
"step": 3318
},
{
"epoch": 42.0,
"step": 3318,
"total_flos": 8.489873279367732e+19,
"train_loss": 0.24954385395291484,
"train_runtime": 14687.2421,
"train_samples_per_second": 17.137,
"train_steps_per_second": 0.538
}
],
"max_steps": 7900,
"num_train_epochs": 100,
"total_flos": 8.489873279367732e+19,
"trial_name": null,
"trial_params": null
}