dys_base_M12 / last-checkpoint /trainer_state.json
mprzibilla's picture
Training in progress, epoch 15
7ff51e2
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 15.0,
"global_step": 11085,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"learning_rate": 9.831924793466908e-05,
"loss": 18.2448,
"step": 739
},
{
"epoch": 1.0,
"eval_cer": 1.0,
"eval_loss": 3.3216891288757324,
"eval_new_wer": 1.0,
"eval_old_wer": 1.0,
"eval_runtime": 7.2541,
"eval_samples_per_second": 24.814,
"eval_steps_per_second": 3.171,
"step": 739
},
{
"epoch": 2.0,
"learning_rate": 9.130187066755295e-05,
"loss": 3.4894,
"step": 1478
},
{
"epoch": 2.0,
"eval_cer": 1.0,
"eval_loss": 3.335986375808716,
"eval_new_wer": 1.0,
"eval_old_wer": 1.0,
"eval_runtime": 7.2646,
"eval_samples_per_second": 24.778,
"eval_steps_per_second": 3.166,
"step": 1478
},
{
"epoch": 3.0,
"learning_rate": 8.428449340043682e-05,
"loss": 3.4869,
"step": 2217
},
{
"epoch": 3.0,
"eval_cer": 1.0,
"eval_loss": 3.368795394897461,
"eval_new_wer": 1.0,
"eval_old_wer": 1.0,
"eval_runtime": 7.3486,
"eval_samples_per_second": 24.494,
"eval_steps_per_second": 3.13,
"step": 2217
},
{
"epoch": 4.0,
"learning_rate": 7.726711613332067e-05,
"loss": 3.4836,
"step": 2956
},
{
"epoch": 4.0,
"eval_cer": 1.0,
"eval_loss": 3.357470750808716,
"eval_new_wer": 1.0,
"eval_old_wer": 1.0,
"eval_runtime": 7.3992,
"eval_samples_per_second": 24.327,
"eval_steps_per_second": 3.108,
"step": 2956
},
{
"epoch": 5.0,
"learning_rate": 7.024973886620455e-05,
"loss": 3.4864,
"step": 3695
},
{
"epoch": 5.0,
"eval_cer": 1.0,
"eval_loss": 3.36539888381958,
"eval_new_wer": 1.0,
"eval_old_wer": 1.0,
"eval_runtime": 7.5815,
"eval_samples_per_second": 23.742,
"eval_steps_per_second": 3.034,
"step": 3695
},
{
"epoch": 6.0,
"learning_rate": 6.323236159908841e-05,
"loss": 3.4849,
"step": 4434
},
{
"epoch": 6.0,
"eval_cer": 1.0,
"eval_loss": 3.3517842292785645,
"eval_new_wer": 1.0,
"eval_old_wer": 1.0,
"eval_runtime": 7.7896,
"eval_samples_per_second": 23.108,
"eval_steps_per_second": 2.953,
"step": 4434
},
{
"epoch": 7.0,
"learning_rate": 5.6214984331972276e-05,
"loss": 3.484,
"step": 5173
},
{
"epoch": 7.0,
"eval_cer": 1.0,
"eval_loss": 3.3279595375061035,
"eval_new_wer": 1.0,
"eval_old_wer": 1.0,
"eval_runtime": 7.3916,
"eval_samples_per_second": 24.352,
"eval_steps_per_second": 3.112,
"step": 5173
},
{
"epoch": 8.0,
"learning_rate": 4.9197607064856144e-05,
"loss": 3.4854,
"step": 5912
},
{
"epoch": 8.0,
"eval_cer": 1.0,
"eval_loss": 3.361226797103882,
"eval_new_wer": 1.0,
"eval_old_wer": 1.0,
"eval_runtime": 7.4066,
"eval_samples_per_second": 24.303,
"eval_steps_per_second": 3.105,
"step": 5912
},
{
"epoch": 9.0,
"learning_rate": 4.2180229797740006e-05,
"loss": 3.4807,
"step": 6651
},
{
"epoch": 9.0,
"eval_cer": 1.0,
"eval_loss": 3.3284316062927246,
"eval_new_wer": 1.0,
"eval_old_wer": 1.0,
"eval_runtime": 7.4013,
"eval_samples_per_second": 24.32,
"eval_steps_per_second": 3.108,
"step": 6651
},
{
"epoch": 10.0,
"learning_rate": 3.5162852530623875e-05,
"loss": 3.4854,
"step": 7390
},
{
"epoch": 10.0,
"eval_cer": 1.0,
"eval_loss": 3.360283851623535,
"eval_new_wer": 1.0,
"eval_old_wer": 1.0,
"eval_runtime": 7.389,
"eval_samples_per_second": 24.361,
"eval_steps_per_second": 3.113,
"step": 7390
},
{
"epoch": 11.0,
"learning_rate": 2.8145475263507744e-05,
"loss": 3.4854,
"step": 8129
},
{
"epoch": 11.0,
"eval_cer": 1.0,
"eval_loss": 3.3530423641204834,
"eval_new_wer": 1.0,
"eval_old_wer": 1.0,
"eval_runtime": 7.4543,
"eval_samples_per_second": 24.147,
"eval_steps_per_second": 3.085,
"step": 8129
},
{
"epoch": 12.0,
"learning_rate": 2.112809799639161e-05,
"loss": 3.4855,
"step": 8868
},
{
"epoch": 12.0,
"eval_cer": 1.0,
"eval_loss": 3.3396615982055664,
"eval_new_wer": 1.0,
"eval_old_wer": 1.0,
"eval_runtime": 7.3505,
"eval_samples_per_second": 24.488,
"eval_steps_per_second": 3.129,
"step": 8868
},
{
"epoch": 13.0,
"learning_rate": 1.4110720729275472e-05,
"loss": 3.4813,
"step": 9607
},
{
"epoch": 13.0,
"eval_cer": 1.0,
"eval_loss": 3.352962017059326,
"eval_new_wer": 1.0,
"eval_old_wer": 1.0,
"eval_runtime": 7.5315,
"eval_samples_per_second": 23.9,
"eval_steps_per_second": 3.054,
"step": 9607
},
{
"epoch": 14.0,
"learning_rate": 7.093343462159339e-06,
"loss": 3.4785,
"step": 10346
},
{
"epoch": 14.0,
"eval_cer": 1.0,
"eval_loss": 3.345838785171509,
"eval_new_wer": 1.0,
"eval_old_wer": 1.0,
"eval_runtime": 7.0543,
"eval_samples_per_second": 25.516,
"eval_steps_per_second": 3.26,
"step": 10346
},
{
"epoch": 15.0,
"learning_rate": 7.596619504320577e-08,
"loss": 3.4798,
"step": 11085
},
{
"epoch": 15.0,
"eval_cer": 1.0,
"eval_loss": 3.345510482788086,
"eval_new_wer": 1.0,
"eval_old_wer": 1.0,
"eval_runtime": 7.0297,
"eval_samples_per_second": 25.606,
"eval_steps_per_second": 3.272,
"step": 11085
}
],
"max_steps": 11085,
"num_train_epochs": 15,
"total_flos": 8.649191629868698e+18,
"trial_name": null,
"trial_params": null
}