wav2vec2-large-robust-paper / trainer_state.json
hts98's picture
End of training
38b2ce5
{
"best_metric": 0.8695769309997559,
"best_model_checkpoint": "./wav2vec2-large-robust-paper/checkpoint-4355",
"epoch": 50.0,
"global_step": 16750,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_loss": 3.9162847995758057,
"eval_runtime": 53.7666,
"eval_samples_per_second": 15.66,
"eval_steps_per_second": 1.971,
"eval_wer": 1.0,
"step": 335
},
{
"epoch": 1.49,
"learning_rate": 4.976729944886712e-05,
"loss": 7.1369,
"step": 500
},
{
"epoch": 2.0,
"eval_loss": 3.342172145843506,
"eval_runtime": 53.6439,
"eval_samples_per_second": 15.696,
"eval_steps_per_second": 1.976,
"eval_wer": 1.0,
"step": 670
},
{
"epoch": 2.99,
"learning_rate": 4.82363747703613e-05,
"loss": 3.3448,
"step": 1000
},
{
"epoch": 3.0,
"eval_loss": 3.335538864135742,
"eval_runtime": 53.7095,
"eval_samples_per_second": 15.677,
"eval_steps_per_second": 1.974,
"eval_wer": 1.0,
"step": 1005
},
{
"epoch": 4.0,
"eval_loss": 3.3262581825256348,
"eval_runtime": 53.7592,
"eval_samples_per_second": 15.662,
"eval_steps_per_second": 1.972,
"eval_wer": 1.0,
"step": 1340
},
{
"epoch": 4.48,
"learning_rate": 4.6705450091855484e-05,
"loss": 3.3277,
"step": 1500
},
{
"epoch": 5.0,
"eval_loss": 2.8927650451660156,
"eval_runtime": 54.3633,
"eval_samples_per_second": 15.488,
"eval_steps_per_second": 1.95,
"eval_wer": 1.0079421226156946,
"step": 1675
},
{
"epoch": 5.97,
"learning_rate": 4.517452541334967e-05,
"loss": 2.6655,
"step": 2000
},
{
"epoch": 6.0,
"eval_loss": 1.7821804285049438,
"eval_runtime": 54.4942,
"eval_samples_per_second": 15.451,
"eval_steps_per_second": 1.945,
"eval_wer": 0.8787591601372186,
"step": 2010
},
{
"epoch": 7.0,
"eval_loss": 1.3193254470825195,
"eval_runtime": 54.3211,
"eval_samples_per_second": 15.5,
"eval_steps_per_second": 1.951,
"eval_wer": 0.7055407984836553,
"step": 2345
},
{
"epoch": 7.46,
"learning_rate": 4.364360073484385e-05,
"loss": 1.4617,
"step": 2500
},
{
"epoch": 8.0,
"eval_loss": 1.1407958269119263,
"eval_runtime": 54.3418,
"eval_samples_per_second": 15.495,
"eval_steps_per_second": 1.951,
"eval_wer": 0.607031781838568,
"step": 2680
},
{
"epoch": 8.96,
"learning_rate": 4.211267605633803e-05,
"loss": 1.0805,
"step": 3000
},
{
"epoch": 9.0,
"eval_loss": 1.0108448266983032,
"eval_runtime": 54.8305,
"eval_samples_per_second": 15.356,
"eval_steps_per_second": 1.933,
"eval_wer": 0.542240079020783,
"step": 3015
},
{
"epoch": 10.0,
"eval_loss": 0.9516933560371399,
"eval_runtime": 54.4768,
"eval_samples_per_second": 15.456,
"eval_steps_per_second": 1.946,
"eval_wer": 0.515383691285022,
"step": 3350
},
{
"epoch": 10.45,
"learning_rate": 4.058175137783221e-05,
"loss": 0.8759,
"step": 3500
},
{
"epoch": 11.0,
"eval_loss": 0.9081984758377075,
"eval_runtime": 54.3156,
"eval_samples_per_second": 15.502,
"eval_steps_per_second": 1.952,
"eval_wer": 0.49020916480905535,
"step": 3685
},
{
"epoch": 11.94,
"learning_rate": 3.905082669932639e-05,
"loss": 0.7462,
"step": 4000
},
{
"epoch": 12.0,
"eval_loss": 0.875782310962677,
"eval_runtime": 54.5818,
"eval_samples_per_second": 15.426,
"eval_steps_per_second": 1.942,
"eval_wer": 0.47056075390098373,
"step": 4020
},
{
"epoch": 13.0,
"eval_loss": 0.8695769309997559,
"eval_runtime": 54.4851,
"eval_samples_per_second": 15.454,
"eval_steps_per_second": 1.945,
"eval_wer": 0.457239344874995,
"step": 4355
},
{
"epoch": 13.43,
"learning_rate": 3.7519902020820577e-05,
"loss": 0.6429,
"step": 4500
},
{
"epoch": 14.0,
"eval_loss": 0.8731432557106018,
"eval_runtime": 55.2734,
"eval_samples_per_second": 15.233,
"eval_steps_per_second": 1.918,
"eval_wer": 0.45348852730354927,
"step": 4690
},
{
"epoch": 14.93,
"learning_rate": 3.598897734231476e-05,
"loss": 0.5672,
"step": 5000
},
{
"epoch": 15.0,
"eval_loss": 0.8749489784240723,
"eval_runtime": 54.2876,
"eval_samples_per_second": 15.51,
"eval_steps_per_second": 1.953,
"eval_wer": 0.450792210045784,
"step": 5025
},
{
"epoch": 16.0,
"eval_loss": 0.8752743005752563,
"eval_runtime": 54.5671,
"eval_samples_per_second": 15.431,
"eval_steps_per_second": 1.943,
"eval_wer": 0.4512460456238237,
"step": 5360
},
{
"epoch": 16.42,
"learning_rate": 3.445805266380894e-05,
"loss": 0.4959,
"step": 5500
},
{
"epoch": 17.0,
"eval_loss": 0.9039203524589539,
"eval_runtime": 54.5236,
"eval_samples_per_second": 15.443,
"eval_steps_per_second": 1.944,
"eval_wer": 0.4486965575236595,
"step": 5695
},
{
"epoch": 17.91,
"learning_rate": 3.2927127985303126e-05,
"loss": 0.4456,
"step": 6000
},
{
"epoch": 18.0,
"eval_loss": 0.9161030650138855,
"eval_runtime": 54.3598,
"eval_samples_per_second": 15.489,
"eval_steps_per_second": 1.95,
"eval_wer": 0.443303923008129,
"step": 6030
},
{
"epoch": 19.0,
"eval_loss": 0.9505767226219177,
"eval_runtime": 54.2942,
"eval_samples_per_second": 15.508,
"eval_steps_per_second": 1.952,
"eval_wer": 0.4429835684824539,
"step": 6365
},
{
"epoch": 19.4,
"learning_rate": 3.13962033067973e-05,
"loss": 0.392,
"step": 6500
},
{
"epoch": 20.0,
"eval_loss": 0.9411688446998596,
"eval_runtime": 54.3336,
"eval_samples_per_second": 15.497,
"eval_steps_per_second": 1.951,
"eval_wer": 0.4438511953228239,
"step": 6700
},
{
"epoch": 20.9,
"learning_rate": 2.9865278628291486e-05,
"loss": 0.3594,
"step": 7000
},
{
"epoch": 21.0,
"eval_loss": 0.9884207844734192,
"eval_runtime": 54.3631,
"eval_samples_per_second": 15.488,
"eval_steps_per_second": 1.95,
"eval_wer": 0.44162206174833485,
"step": 7035
},
{
"epoch": 22.0,
"eval_loss": 1.022162914276123,
"eval_runtime": 54.656,
"eval_samples_per_second": 15.405,
"eval_steps_per_second": 1.939,
"eval_wer": 0.45101912783480386,
"step": 7370
},
{
"epoch": 22.39,
"learning_rate": 2.833435394978567e-05,
"loss": 0.3175,
"step": 7500
},
{
"epoch": 23.0,
"eval_loss": 1.0344542264938354,
"eval_runtime": 54.3628,
"eval_samples_per_second": 15.489,
"eval_steps_per_second": 1.95,
"eval_wer": 0.4439312839542427,
"step": 7705
},
{
"epoch": 23.88,
"learning_rate": 2.6803429271279856e-05,
"loss": 0.2947,
"step": 8000
},
{
"epoch": 24.0,
"eval_loss": 1.084883213043213,
"eval_runtime": 54.6337,
"eval_samples_per_second": 15.412,
"eval_steps_per_second": 1.94,
"eval_wer": 0.4464807720544069,
"step": 8040
},
{
"epoch": 25.0,
"eval_loss": 1.0879119634628296,
"eval_runtime": 54.4682,
"eval_samples_per_second": 15.459,
"eval_steps_per_second": 1.946,
"eval_wer": 0.4472416140528852,
"step": 8375
},
{
"epoch": 25.37,
"learning_rate": 2.527556644213105e-05,
"loss": 0.2674,
"step": 8500
},
{
"epoch": 26.0,
"eval_loss": 1.1071442365646362,
"eval_runtime": 54.3908,
"eval_samples_per_second": 15.481,
"eval_steps_per_second": 1.949,
"eval_wer": 0.4512460456238237,
"step": 8710
},
{
"epoch": 26.87,
"learning_rate": 2.3744641763625232e-05,
"loss": 0.2521,
"step": 9000
},
{
"epoch": 27.0,
"eval_loss": 1.1146758794784546,
"eval_runtime": 54.502,
"eval_samples_per_second": 15.449,
"eval_steps_per_second": 1.945,
"eval_wer": 0.4494307033116649,
"step": 9045
},
{
"epoch": 28.0,
"eval_loss": 1.1426175832748413,
"eval_runtime": 54.4541,
"eval_samples_per_second": 15.463,
"eval_steps_per_second": 1.947,
"eval_wer": 0.4525408118317605,
"step": 9380
},
{
"epoch": 28.36,
"learning_rate": 2.2216778934476424e-05,
"loss": 0.2321,
"step": 9500
},
{
"epoch": 29.0,
"eval_loss": 1.1591500043869019,
"eval_runtime": 54.6264,
"eval_samples_per_second": 15.414,
"eval_steps_per_second": 1.94,
"eval_wer": 0.4440380687961344,
"step": 9715
},
{
"epoch": 29.85,
"learning_rate": 2.0685854255970608e-05,
"loss": 0.2235,
"step": 10000
},
{
"epoch": 30.0,
"eval_loss": 1.178154706954956,
"eval_runtime": 54.3939,
"eval_samples_per_second": 15.48,
"eval_steps_per_second": 1.949,
"eval_wer": 0.44495908805745027,
"step": 10050
},
{
"epoch": 31.0,
"eval_loss": 1.2050156593322754,
"eval_runtime": 54.4103,
"eval_samples_per_second": 15.475,
"eval_steps_per_second": 1.948,
"eval_wer": 0.4436643218495135,
"step": 10385
},
{
"epoch": 31.34,
"learning_rate": 1.9154929577464788e-05,
"loss": 0.2071,
"step": 10500
},
{
"epoch": 32.0,
"eval_loss": 1.2223504781723022,
"eval_runtime": 54.4403,
"eval_samples_per_second": 15.466,
"eval_steps_per_second": 1.947,
"eval_wer": 0.4399535485937771,
"step": 10720
},
{
"epoch": 32.84,
"learning_rate": 1.7624004898958974e-05,
"loss": 0.1951,
"step": 11000
},
{
"epoch": 33.0,
"eval_loss": 1.2269729375839233,
"eval_runtime": 54.7494,
"eval_samples_per_second": 15.379,
"eval_steps_per_second": 1.936,
"eval_wer": 0.4470680886848112,
"step": 11055
},
{
"epoch": 34.0,
"eval_loss": 1.246551275253296,
"eval_runtime": 54.3927,
"eval_samples_per_second": 15.48,
"eval_steps_per_second": 1.949,
"eval_wer": 0.44833615868227505,
"step": 11390
},
{
"epoch": 34.33,
"learning_rate": 1.6093080220453154e-05,
"loss": 0.1892,
"step": 11500
},
{
"epoch": 35.0,
"eval_loss": 1.232478380203247,
"eval_runtime": 54.41,
"eval_samples_per_second": 15.475,
"eval_steps_per_second": 1.948,
"eval_wer": 0.44286343553532576,
"step": 11725
},
{
"epoch": 35.82,
"learning_rate": 1.4562155541947337e-05,
"loss": 0.1809,
"step": 12000
},
{
"epoch": 36.0,
"eval_loss": 1.2754629850387573,
"eval_runtime": 54.5117,
"eval_samples_per_second": 15.446,
"eval_steps_per_second": 1.945,
"eval_wer": 0.44272995448296115,
"step": 12060
},
{
"epoch": 37.0,
"eval_loss": 1.2675007581710815,
"eval_runtime": 54.594,
"eval_samples_per_second": 15.423,
"eval_steps_per_second": 1.942,
"eval_wer": 0.4421693340630298,
"step": 12395
},
{
"epoch": 37.31,
"learning_rate": 1.3031230863441517e-05,
"loss": 0.1746,
"step": 12500
},
{
"epoch": 38.0,
"eval_loss": 1.3022228479385376,
"eval_runtime": 54.757,
"eval_samples_per_second": 15.377,
"eval_steps_per_second": 1.936,
"eval_wer": 0.4417688909059359,
"step": 12730
},
{
"epoch": 38.81,
"learning_rate": 1.15003061849357e-05,
"loss": 0.1656,
"step": 13000
},
{
"epoch": 39.0,
"eval_loss": 1.3178575038909912,
"eval_runtime": 54.82,
"eval_samples_per_second": 15.359,
"eval_steps_per_second": 1.934,
"eval_wer": 0.4407544349079648,
"step": 13065
},
{
"epoch": 40.0,
"eval_loss": 1.293350338935852,
"eval_runtime": 54.6833,
"eval_samples_per_second": 15.398,
"eval_steps_per_second": 1.938,
"eval_wer": 0.4425430810096507,
"step": 13400
},
{
"epoch": 40.3,
"learning_rate": 9.972443355786895e-06,
"loss": 0.1614,
"step": 13500
},
{
"epoch": 41.0,
"eval_loss": 1.3303664922714233,
"eval_runtime": 54.5126,
"eval_samples_per_second": 15.446,
"eval_steps_per_second": 1.945,
"eval_wer": 0.44259647343059655,
"step": 13735
},
{
"epoch": 41.79,
"learning_rate": 8.441518677281078e-06,
"loss": 0.1564,
"step": 14000
},
{
"epoch": 42.0,
"eval_loss": 1.3147845268249512,
"eval_runtime": 54.5529,
"eval_samples_per_second": 15.435,
"eval_steps_per_second": 1.943,
"eval_wer": 0.44196911248448284,
"step": 14070
},
{
"epoch": 43.0,
"eval_loss": 1.3266962766647339,
"eval_runtime": 54.7201,
"eval_samples_per_second": 15.387,
"eval_steps_per_second": 1.937,
"eval_wer": 0.44325053058718317,
"step": 14405
},
{
"epoch": 43.28,
"learning_rate": 6.910593998775261e-06,
"loss": 0.1546,
"step": 14500
},
{
"epoch": 44.0,
"eval_loss": 1.3331360816955566,
"eval_runtime": 54.6617,
"eval_samples_per_second": 15.404,
"eval_steps_per_second": 1.939,
"eval_wer": 0.4412750110121868,
"step": 14740
},
{
"epoch": 44.78,
"learning_rate": 5.379669320269443e-06,
"loss": 0.1515,
"step": 15000
},
{
"epoch": 45.0,
"eval_loss": 1.344504475593567,
"eval_runtime": 54.543,
"eval_samples_per_second": 15.437,
"eval_steps_per_second": 1.943,
"eval_wer": 0.43875221912249557,
"step": 15075
},
{
"epoch": 46.0,
"eval_loss": 1.352994441986084,
"eval_runtime": 54.5619,
"eval_samples_per_second": 15.432,
"eval_steps_per_second": 1.943,
"eval_wer": 0.4372438832307754,
"step": 15410
},
{
"epoch": 46.27,
"learning_rate": 3.851806491120637e-06,
"loss": 0.147,
"step": 15500
},
{
"epoch": 47.0,
"eval_loss": 1.34428870677948,
"eval_runtime": 54.5828,
"eval_samples_per_second": 15.426,
"eval_steps_per_second": 1.942,
"eval_wer": 0.4384585608072934,
"step": 15745
},
{
"epoch": 47.76,
"learning_rate": 2.3208818126148195e-06,
"loss": 0.1447,
"step": 16000
},
{
"epoch": 48.0,
"eval_loss": 1.3502939939498901,
"eval_runtime": 54.5282,
"eval_samples_per_second": 15.442,
"eval_steps_per_second": 1.944,
"eval_wer": 0.436856788178918,
"step": 16080
},
{
"epoch": 49.0,
"eval_loss": 1.358969807624817,
"eval_runtime": 55.1854,
"eval_samples_per_second": 15.258,
"eval_steps_per_second": 1.921,
"eval_wer": 0.4393261876476634,
"step": 16415
},
{
"epoch": 49.25,
"learning_rate": 7.930189834660135e-07,
"loss": 0.1437,
"step": 16500
},
{
"epoch": 50.0,
"eval_loss": 1.3668413162231445,
"eval_runtime": 54.6805,
"eval_samples_per_second": 15.399,
"eval_steps_per_second": 1.939,
"eval_wer": 0.43717714270459307,
"step": 16750
},
{
"epoch": 50.0,
"step": 16750,
"total_flos": 1.4087701795050537e+20,
"train_loss": 0.8170821473989913,
"train_runtime": 40557.4985,
"train_samples_per_second": 4.13,
"train_steps_per_second": 0.413
}
],
"max_steps": 16750,
"num_train_epochs": 50,
"total_flos": 1.4087701795050537e+20,
"trial_name": null,
"trial_params": null
}