wav2vec2-large-xls-r-300m-odia / trainer_state.json
infinitejoy's picture
End of training
e870548
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 120.0,
"global_step": 2040,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 5.88,
"learning_rate": 1.455e-05,
"loss": 16.0345,
"step": 100
},
{
"epoch": 11.76,
"learning_rate": 2.955e-05,
"loss": 6.2463,
"step": 200
},
{
"epoch": 17.65,
"learning_rate": 4.454999999999999e-05,
"loss": 4.2277,
"step": 300
},
{
"epoch": 23.53,
"learning_rate": 5.955e-05,
"loss": 3.4915,
"step": 400
},
{
"epoch": 29.41,
"learning_rate": 7.455e-05,
"loss": 3.3231,
"step": 500
},
{
"epoch": 29.41,
"eval_loss": 3.352241277694702,
"eval_runtime": 5.0475,
"eval_samples_per_second": 22.189,
"eval_steps_per_second": 1.387,
"eval_wer": 0.998972250770812,
"step": 500
},
{
"epoch": 35.29,
"learning_rate": 7.027597402597401e-05,
"loss": 3.2264,
"step": 600
},
{
"epoch": 41.18,
"learning_rate": 6.540584415584416e-05,
"loss": 3.1652,
"step": 700
},
{
"epoch": 47.06,
"learning_rate": 6.0535714285714285e-05,
"loss": 3.019,
"step": 800
},
{
"epoch": 52.94,
"learning_rate": 5.566558441558441e-05,
"loss": 2.6429,
"step": 900
},
{
"epoch": 58.82,
"learning_rate": 5.0795454545454536e-05,
"loss": 2.1146,
"step": 1000
},
{
"epoch": 58.82,
"eval_loss": 1.3367875814437866,
"eval_runtime": 5.0633,
"eval_samples_per_second": 22.12,
"eval_steps_per_second": 1.382,
"eval_wer": 0.9383350462487153,
"step": 1000
},
{
"epoch": 64.71,
"learning_rate": 4.592532467532467e-05,
"loss": 1.7769,
"step": 1100
},
{
"epoch": 70.59,
"learning_rate": 4.10551948051948e-05,
"loss": 1.5937,
"step": 1200
},
{
"epoch": 76.47,
"learning_rate": 3.6185064935064934e-05,
"loss": 1.4694,
"step": 1300
},
{
"epoch": 82.35,
"learning_rate": 3.131493506493506e-05,
"loss": 1.3781,
"step": 1400
},
{
"epoch": 88.24,
"learning_rate": 2.6444805194805193e-05,
"loss": 1.3134,
"step": 1500
},
{
"epoch": 88.24,
"eval_loss": 0.7372016310691833,
"eval_runtime": 5.0913,
"eval_samples_per_second": 21.998,
"eval_steps_per_second": 1.375,
"eval_wer": 0.9578622816032888,
"step": 1500
},
{
"epoch": 94.12,
"learning_rate": 2.162337662337662e-05,
"loss": 1.271,
"step": 1600
},
{
"epoch": 100.0,
"learning_rate": 1.6753246753246752e-05,
"loss": 1.2273,
"step": 1700
},
{
"epoch": 105.88,
"learning_rate": 1.1883116883116881e-05,
"loss": 1.2121,
"step": 1800
},
{
"epoch": 111.76,
"learning_rate": 7.012987012987012e-06,
"loss": 1.169,
"step": 1900
},
{
"epoch": 117.65,
"learning_rate": 2.1428571428571427e-06,
"loss": 1.1506,
"step": 2000
},
{
"epoch": 117.65,
"eval_loss": 0.6582115292549133,
"eval_runtime": 5.0953,
"eval_samples_per_second": 21.981,
"eval_steps_per_second": 1.374,
"eval_wer": 0.9681397738951696,
"step": 2000
},
{
"epoch": 120.0,
"step": 2040,
"total_flos": 1.105779936504619e+19,
"train_loss": 3.015083034365785,
"train_runtime": 4204.6915,
"train_samples_per_second": 15.326,
"train_steps_per_second": 0.485
}
],
"max_steps": 2040,
"num_train_epochs": 120,
"total_flos": 1.105779936504619e+19,
"trial_name": null,
"trial_params": null
}