hrdipto's picture
Upload trainer_state.json
b6cfea0
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 89.28571428571429,
"global_step": 2500,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 17.86,
"learning_rate": 4.94e-05,
"loss": 19.5604,
"step": 500
},
{
"epoch": 17.86,
"eval_loss": 3.8375885486602783,
"eval_runtime": 2.2223,
"eval_samples_per_second": 86.395,
"eval_steps_per_second": 10.799,
"eval_wer": 1.0,
"step": 500
},
{
"epoch": 35.71,
"learning_rate": 9.94e-05,
"loss": 2.0837,
"step": 1000
},
{
"epoch": 35.71,
"eval_loss": 1.0887540578842163,
"eval_runtime": 2.2007,
"eval_samples_per_second": 87.246,
"eval_steps_per_second": 10.906,
"eval_wer": 0.6354166666666666,
"step": 1000
},
{
"epoch": 53.57,
"learning_rate": 7.255555555555555e-05,
"loss": 0.3185,
"step": 1500
},
{
"epoch": 53.57,
"eval_loss": 0.3722864091396332,
"eval_runtime": 2.1581,
"eval_samples_per_second": 88.967,
"eval_steps_per_second": 11.121,
"eval_wer": 0.296875,
"step": 1500
},
{
"epoch": 71.43,
"learning_rate": 4.477777777777778e-05,
"loss": 0.1425,
"step": 2000
},
{
"epoch": 71.43,
"eval_loss": 0.22876793146133423,
"eval_runtime": 2.2468,
"eval_samples_per_second": 85.454,
"eval_steps_per_second": 10.682,
"eval_wer": 0.28125,
"step": 2000
},
{
"epoch": 89.29,
"learning_rate": 1.7000000000000003e-05,
"loss": 0.0932,
"step": 2500
},
{
"epoch": 89.29,
"eval_loss": 0.16792654991149902,
"eval_runtime": 2.2364,
"eval_samples_per_second": 85.85,
"eval_steps_per_second": 10.731,
"eval_wer": 0.18229166666666666,
"step": 2500
}
],
"max_steps": 2800,
"num_train_epochs": 100,
"total_flos": 3.050974757946286e+18,
"trial_name": null,
"trial_params": null
}