wav2vec2-large-xlsr-bn / trainer_state.json
nihalbaig's picture
adding training model
e8053f9
{
"best_metric": 0.8215018908698001,
"best_model_checkpoint": "/content/wav2vec2-large-xlsr-bn/checkpoint-800",
"epoch": 30.0,
"global_step": 18750,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.64,
"learning_rate": 0.00029405766150560596,
"loss": 4.1339,
"step": 400
},
{
"epoch": 0.64,
"eval_loss": 3.2776501178741455,
"eval_runtime": 74.0715,
"eval_samples_per_second": 13.5,
"eval_steps_per_second": 1.688,
"eval_wer": 1.0,
"step": 400
},
{
"epoch": 1.28,
"learning_rate": 0.00028774693005872927,
"loss": 2.0718,
"step": 800
},
{
"epoch": 1.28,
"eval_loss": 0.979073703289032,
"eval_runtime": 74.5153,
"eval_samples_per_second": 13.42,
"eval_steps_per_second": 1.678,
"eval_wer": 0.8215018908698001,
"step": 800
},
{
"epoch": 1.92,
"learning_rate": 0.00028143619861185264,
"loss": 2.4619,
"step": 1200
},
{
"epoch": 1.92,
"eval_loss": 3.080274820327759,
"eval_runtime": 74.0712,
"eval_samples_per_second": 13.501,
"eval_steps_per_second": 1.688,
"eval_wer": 1.0,
"step": 1200
},
{
"epoch": 2.56,
"learning_rate": 0.000275157501334757,
"loss": 3.1703,
"step": 1600
},
{
"epoch": 2.56,
"eval_loss": 3.4948482513427734,
"eval_runtime": 74.092,
"eval_samples_per_second": 13.497,
"eval_steps_per_second": 1.687,
"eval_wer": 1.0,
"step": 1600
},
{
"epoch": 3.2,
"learning_rate": 0.00026886278697277094,
"loss": 5.5212,
"step": 2000
},
{
"epoch": 3.2,
"eval_loss": 6.071021556854248,
"eval_runtime": 74.4322,
"eval_samples_per_second": 13.435,
"eval_steps_per_second": 1.679,
"eval_wer": 1.0,
"step": 2000
},
{
"epoch": 3.84,
"learning_rate": 0.0002625680726107848,
"loss": 5.8864,
"step": 2400
},
{
"epoch": 3.84,
"eval_loss": 6.071021556854248,
"eval_runtime": 74.0924,
"eval_samples_per_second": 13.497,
"eval_steps_per_second": 1.687,
"eval_wer": 1.0,
"step": 2400
},
{
"epoch": 4.48,
"learning_rate": 0.00025628937533368924,
"loss": 5.9244,
"step": 2800
},
{
"epoch": 4.48,
"eval_loss": 6.071021556854248,
"eval_runtime": 71.9212,
"eval_samples_per_second": 13.904,
"eval_steps_per_second": 1.738,
"eval_wer": 1.0,
"step": 2800
},
{
"epoch": 5.12,
"learning_rate": 0.00024996262680192206,
"loss": 5.8882,
"step": 3200
},
{
"epoch": 5.12,
"eval_loss": 6.071021556854248,
"eval_runtime": 72.014,
"eval_samples_per_second": 13.886,
"eval_steps_per_second": 1.736,
"eval_wer": 1.0,
"step": 3200
},
{
"epoch": 5.76,
"learning_rate": 0.00024365189535504537,
"loss": 5.9011,
"step": 3600
},
{
"epoch": 5.76,
"eval_loss": 6.071021556854248,
"eval_runtime": 72.5441,
"eval_samples_per_second": 13.785,
"eval_steps_per_second": 1.723,
"eval_wer": 1.0,
"step": 3600
},
{
"epoch": 6.4,
"learning_rate": 0.00023734116390816868,
"loss": 5.8956,
"step": 4000
},
{
"epoch": 6.4,
"eval_loss": 6.071021556854248,
"eval_runtime": 72.2548,
"eval_samples_per_second": 13.84,
"eval_steps_per_second": 1.73,
"eval_wer": 1.0,
"step": 4000
},
{
"epoch": 7.04,
"learning_rate": 0.00023103043246129203,
"loss": 5.9103,
"step": 4400
},
{
"epoch": 7.04,
"eval_loss": 6.071021556854248,
"eval_runtime": 72.8707,
"eval_samples_per_second": 13.723,
"eval_steps_per_second": 1.715,
"eval_wer": 1.0,
"step": 4400
},
{
"epoch": 7.68,
"learning_rate": 0.0002247357180993059,
"loss": 5.9083,
"step": 4800
},
{
"epoch": 7.68,
"eval_loss": 6.071021556854248,
"eval_runtime": 72.091,
"eval_samples_per_second": 13.871,
"eval_steps_per_second": 1.734,
"eval_wer": 1.0,
"step": 4800
},
{
"epoch": 8.32,
"learning_rate": 0.0002184410037373198,
"loss": 5.9054,
"step": 5200
},
{
"epoch": 8.32,
"eval_loss": 6.071021556854248,
"eval_runtime": 74.6941,
"eval_samples_per_second": 13.388,
"eval_steps_per_second": 1.673,
"eval_wer": 1.0,
"step": 5200
},
{
"epoch": 8.96,
"learning_rate": 0.00021213027229044314,
"loss": 5.8996,
"step": 5600
},
{
"epoch": 8.96,
"eval_loss": 6.071021556854248,
"eval_runtime": 72.5093,
"eval_samples_per_second": 13.791,
"eval_steps_per_second": 1.724,
"eval_wer": 1.0,
"step": 5600
},
{
"epoch": 9.6,
"learning_rate": 0.00020581954084356645,
"loss": 5.8929,
"step": 6000
},
{
"epoch": 9.6,
"eval_loss": 6.071021556854248,
"eval_runtime": 73.1997,
"eval_samples_per_second": 13.661,
"eval_steps_per_second": 1.708,
"eval_wer": 1.0,
"step": 6000
},
{
"epoch": 10.24,
"learning_rate": 0.0001995408435664709,
"loss": 5.9021,
"step": 6400
},
{
"epoch": 10.24,
"eval_loss": 6.071021556854248,
"eval_runtime": 72.6358,
"eval_samples_per_second": 13.767,
"eval_steps_per_second": 1.721,
"eval_wer": 1.0,
"step": 6400
},
{
"epoch": 10.88,
"learning_rate": 0.00019323011211959423,
"loss": 5.8853,
"step": 6800
},
{
"epoch": 10.88,
"eval_loss": 6.071021556854248,
"eval_runtime": 72.5502,
"eval_samples_per_second": 13.784,
"eval_steps_per_second": 1.723,
"eval_wer": 1.0,
"step": 6800
},
{
"epoch": 11.52,
"learning_rate": 0.000186903363587827,
"loss": 5.8968,
"step": 7200
},
{
"epoch": 11.52,
"eval_loss": 6.071021556854248,
"eval_runtime": 72.2966,
"eval_samples_per_second": 13.832,
"eval_steps_per_second": 1.729,
"eval_wer": 1.0,
"step": 7200
},
{
"epoch": 12.16,
"learning_rate": 0.00018060864922584088,
"loss": 5.9139,
"step": 7600
},
{
"epoch": 12.16,
"eval_loss": 6.071021556854248,
"eval_runtime": 72.4188,
"eval_samples_per_second": 13.809,
"eval_steps_per_second": 1.726,
"eval_wer": 1.0,
"step": 7600
},
{
"epoch": 12.8,
"learning_rate": 0.00017431393486385476,
"loss": 5.8976,
"step": 8000
},
{
"epoch": 12.8,
"eval_loss": 6.071021556854248,
"eval_runtime": 72.6699,
"eval_samples_per_second": 13.761,
"eval_steps_per_second": 1.72,
"eval_wer": 1.0,
"step": 8000
},
{
"epoch": 13.44,
"learning_rate": 0.00016798718633208754,
"loss": 5.8909,
"step": 8400
},
{
"epoch": 13.44,
"eval_loss": 6.071021556854248,
"eval_runtime": 72.1967,
"eval_samples_per_second": 13.851,
"eval_steps_per_second": 1.731,
"eval_wer": 1.0,
"step": 8400
},
{
"epoch": 14.08,
"learning_rate": 0.00016202883075280296,
"loss": 7.2473,
"step": 8800
},
{
"epoch": 14.08,
"eval_loss": NaN,
"eval_runtime": 74.9323,
"eval_samples_per_second": 13.345,
"eval_steps_per_second": 1.668,
"eval_wer": 1.0,
"step": 8800
},
{
"epoch": 14.72,
"learning_rate": 0.000155621996796583,
"loss": 0.0,
"step": 9200
},
{
"epoch": 14.72,
"eval_loss": NaN,
"eval_runtime": 72.0418,
"eval_samples_per_second": 13.881,
"eval_steps_per_second": 1.735,
"eval_wer": 1.0,
"step": 9200
},
{
"epoch": 15.36,
"learning_rate": 0.00014921516284036303,
"loss": 0.0,
"step": 9600
},
{
"epoch": 15.36,
"eval_loss": NaN,
"eval_runtime": 72.991,
"eval_samples_per_second": 13.7,
"eval_steps_per_second": 1.713,
"eval_wer": 1.0,
"step": 9600
},
{
"epoch": 16.0,
"learning_rate": 0.00014280832888414308,
"loss": 0.0,
"step": 10000
},
{
"epoch": 16.0,
"eval_loss": NaN,
"eval_runtime": 74.3256,
"eval_samples_per_second": 13.454,
"eval_steps_per_second": 1.682,
"eval_wer": 1.0,
"step": 10000
},
{
"epoch": 16.64,
"learning_rate": 0.0001364014949279231,
"loss": 0.0,
"step": 10400
},
{
"epoch": 16.64,
"eval_loss": NaN,
"eval_runtime": 85.1556,
"eval_samples_per_second": 11.743,
"eval_steps_per_second": 1.468,
"eval_wer": 1.0,
"step": 10400
},
{
"epoch": 17.28,
"learning_rate": 0.00012999466097170315,
"loss": 0.0,
"step": 10800
},
{
"epoch": 17.28,
"eval_loss": NaN,
"eval_runtime": 74.297,
"eval_samples_per_second": 13.46,
"eval_steps_per_second": 1.682,
"eval_wer": 1.0,
"step": 10800
},
{
"epoch": 17.92,
"learning_rate": 0.00012358782701548318,
"loss": 0.0,
"step": 11200
},
{
"epoch": 17.92,
"eval_loss": NaN,
"eval_runtime": 71.8705,
"eval_samples_per_second": 13.914,
"eval_steps_per_second": 1.739,
"eval_wer": 1.0,
"step": 11200
},
{
"epoch": 18.56,
"learning_rate": 0.00011718099305926321,
"loss": 0.0,
"step": 11600
},
{
"epoch": 18.56,
"eval_loss": NaN,
"eval_runtime": 72.0682,
"eval_samples_per_second": 13.876,
"eval_steps_per_second": 1.734,
"eval_wer": 1.0,
"step": 11600
},
{
"epoch": 19.2,
"learning_rate": 0.00011077415910304323,
"loss": 0.0,
"step": 12000
},
{
"epoch": 19.2,
"eval_loss": NaN,
"eval_runtime": 86.6422,
"eval_samples_per_second": 11.542,
"eval_steps_per_second": 1.443,
"eval_wer": 1.0,
"step": 12000
},
{
"epoch": 19.84,
"learning_rate": 0.00010436732514682327,
"loss": 0.0,
"step": 12400
},
{
"epoch": 19.84,
"eval_loss": NaN,
"eval_runtime": 74.8452,
"eval_samples_per_second": 13.361,
"eval_steps_per_second": 1.67,
"eval_wer": 1.0,
"step": 12400
},
{
"epoch": 20.48,
"learning_rate": 9.79604911906033e-05,
"loss": 0.0,
"step": 12800
},
{
"epoch": 20.48,
"eval_loss": NaN,
"eval_runtime": 73.8255,
"eval_samples_per_second": 13.545,
"eval_steps_per_second": 1.693,
"eval_wer": 1.0,
"step": 12800
},
{
"epoch": 21.12,
"learning_rate": 9.155365723438334e-05,
"loss": 0.0,
"step": 13200
},
{
"epoch": 21.12,
"eval_loss": NaN,
"eval_runtime": 77.5777,
"eval_samples_per_second": 12.89,
"eval_steps_per_second": 1.611,
"eval_wer": 1.0,
"step": 13200
},
{
"epoch": 21.76,
"learning_rate": 8.514682327816338e-05,
"loss": 0.0,
"step": 13600
},
{
"epoch": 21.76,
"eval_loss": NaN,
"eval_runtime": 78.2086,
"eval_samples_per_second": 12.786,
"eval_steps_per_second": 1.598,
"eval_wer": 1.0,
"step": 13600
},
{
"epoch": 22.4,
"learning_rate": 7.87399893219434e-05,
"loss": 0.0,
"step": 14000
},
{
"epoch": 22.4,
"eval_loss": NaN,
"eval_runtime": 81.9911,
"eval_samples_per_second": 12.196,
"eval_steps_per_second": 1.525,
"eval_wer": 1.0,
"step": 14000
},
{
"epoch": 23.04,
"learning_rate": 7.233315536572343e-05,
"loss": 0.0,
"step": 14400
},
{
"epoch": 23.04,
"eval_loss": NaN,
"eval_runtime": 74.0428,
"eval_samples_per_second": 13.506,
"eval_steps_per_second": 1.688,
"eval_wer": 1.0,
"step": 14400
},
{
"epoch": 23.68,
"learning_rate": 6.592632140950347e-05,
"loss": 0.0,
"step": 14800
},
{
"epoch": 23.68,
"eval_loss": NaN,
"eval_runtime": 73.6487,
"eval_samples_per_second": 13.578,
"eval_steps_per_second": 1.697,
"eval_wer": 1.0,
"step": 14800
},
{
"epoch": 24.32,
"learning_rate": 5.95194874532835e-05,
"loss": 0.0,
"step": 15200
},
{
"epoch": 24.32,
"eval_loss": NaN,
"eval_runtime": 73.0072,
"eval_samples_per_second": 13.697,
"eval_steps_per_second": 1.712,
"eval_wer": 1.0,
"step": 15200
},
{
"epoch": 24.96,
"learning_rate": 5.3112653497063527e-05,
"loss": 0.0,
"step": 15600
},
{
"epoch": 24.96,
"eval_loss": NaN,
"eval_runtime": 79.0121,
"eval_samples_per_second": 12.656,
"eval_steps_per_second": 1.582,
"eval_wer": 1.0,
"step": 15600
},
{
"epoch": 25.6,
"learning_rate": 4.670581954084356e-05,
"loss": 0.0,
"step": 16000
},
{
"epoch": 25.6,
"eval_loss": NaN,
"eval_runtime": 82.7961,
"eval_samples_per_second": 12.078,
"eval_steps_per_second": 1.51,
"eval_wer": 1.0,
"step": 16000
},
{
"epoch": 26.24,
"learning_rate": 4.02989855846236e-05,
"loss": 0.0,
"step": 16400
},
{
"epoch": 26.24,
"eval_loss": NaN,
"eval_runtime": 83.3819,
"eval_samples_per_second": 11.993,
"eval_steps_per_second": 1.499,
"eval_wer": 1.0,
"step": 16400
},
{
"epoch": 26.88,
"learning_rate": 3.3892151628403626e-05,
"loss": 0.0,
"step": 16800
},
{
"epoch": 26.88,
"eval_loss": NaN,
"eval_runtime": 79.5109,
"eval_samples_per_second": 12.577,
"eval_steps_per_second": 1.572,
"eval_wer": 1.0,
"step": 16800
},
{
"epoch": 27.52,
"learning_rate": 2.748531767218366e-05,
"loss": 0.0,
"step": 17200
},
{
"epoch": 27.52,
"eval_loss": NaN,
"eval_runtime": 76.3506,
"eval_samples_per_second": 13.097,
"eval_steps_per_second": 1.637,
"eval_wer": 1.0,
"step": 17200
},
{
"epoch": 28.16,
"learning_rate": 2.107848371596369e-05,
"loss": 0.0,
"step": 17600
},
{
"epoch": 28.16,
"eval_loss": NaN,
"eval_runtime": 72.6042,
"eval_samples_per_second": 13.773,
"eval_steps_per_second": 1.722,
"eval_wer": 1.0,
"step": 17600
},
{
"epoch": 28.8,
"learning_rate": 1.4671649759743725e-05,
"loss": 0.0,
"step": 18000
},
{
"epoch": 28.8,
"eval_loss": NaN,
"eval_runtime": 83.2188,
"eval_samples_per_second": 12.017,
"eval_steps_per_second": 1.502,
"eval_wer": 1.0,
"step": 18000
},
{
"epoch": 29.44,
"learning_rate": 8.264815803523758e-06,
"loss": 0.0,
"step": 18400
},
{
"epoch": 29.44,
"eval_loss": NaN,
"eval_runtime": 76.8024,
"eval_samples_per_second": 13.02,
"eval_steps_per_second": 1.628,
"eval_wer": 1.0,
"step": 18400
},
{
"epoch": 30.0,
"step": 18750,
"total_flos": 1.1136444297962675e+20,
"train_loss": 2.53877658203125,
"train_runtime": 56941.5798,
"train_samples_per_second": 10.537,
"train_steps_per_second": 0.329
}
],
"max_steps": 18750,
"num_train_epochs": 30,
"total_flos": 1.1136444297962675e+20,
"trial_name": null,
"trial_params": null
}