|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 15.0, |
|
"global_step": 64050, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"learning_rate": 9.825795424664739e-05, |
|
"loss": 7.898, |
|
"step": 4270 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_cer": 0.18354978354978355, |
|
"eval_loss": 0.892418622970581, |
|
"eval_new_wer": 0.1, |
|
"eval_old_wer": 0.4714285714285714, |
|
"eval_runtime": 8.5895, |
|
"eval_samples_per_second": 24.448, |
|
"eval_steps_per_second": 3.143, |
|
"step": 4270 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"learning_rate": 9.124046805153827e-05, |
|
"loss": 0.9517, |
|
"step": 8540 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_cer": 0.14545454545454545, |
|
"eval_loss": 0.8618147373199463, |
|
"eval_new_wer": 0.12857142857142856, |
|
"eval_old_wer": 0.30952380952380953, |
|
"eval_runtime": 8.4071, |
|
"eval_samples_per_second": 24.979, |
|
"eval_steps_per_second": 3.212, |
|
"step": 8540 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"learning_rate": 8.422626873520904e-05, |
|
"loss": 0.6119, |
|
"step": 12810 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_cer": 0.15064935064935064, |
|
"eval_loss": 0.8806686997413635, |
|
"eval_new_wer": 0.12380952380952381, |
|
"eval_old_wer": 0.2904761904761905, |
|
"eval_runtime": 8.4758, |
|
"eval_samples_per_second": 24.776, |
|
"eval_steps_per_second": 3.186, |
|
"step": 12810 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"learning_rate": 7.721206941887984e-05, |
|
"loss": 0.4562, |
|
"step": 17080 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_cer": 0.0987012987012987, |
|
"eval_loss": 0.6651872992515564, |
|
"eval_new_wer": 0.09047619047619047, |
|
"eval_old_wer": 0.2, |
|
"eval_runtime": 8.491, |
|
"eval_samples_per_second": 24.732, |
|
"eval_steps_per_second": 3.18, |
|
"step": 17080 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"learning_rate": 7.019787010255062e-05, |
|
"loss": 0.3661, |
|
"step": 21350 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_cer": 0.13766233766233765, |
|
"eval_loss": 1.2836520671844482, |
|
"eval_new_wer": 0.19047619047619047, |
|
"eval_old_wer": 0.2619047619047619, |
|
"eval_runtime": 8.4952, |
|
"eval_samples_per_second": 24.72, |
|
"eval_steps_per_second": 3.178, |
|
"step": 21350 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"learning_rate": 6.318202734683146e-05, |
|
"loss": 0.2908, |
|
"step": 25620 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_cer": 0.10735930735930736, |
|
"eval_loss": 0.6425668597221375, |
|
"eval_new_wer": 0.10952380952380952, |
|
"eval_old_wer": 0.18571428571428572, |
|
"eval_runtime": 8.4544, |
|
"eval_samples_per_second": 24.839, |
|
"eval_steps_per_second": 3.194, |
|
"step": 25620 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"learning_rate": 5.616782803050224e-05, |
|
"loss": 0.2357, |
|
"step": 29890 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_cer": 0.15411255411255412, |
|
"eval_loss": 1.2289475202560425, |
|
"eval_new_wer": 0.1619047619047619, |
|
"eval_old_wer": 0.24761904761904763, |
|
"eval_runtime": 8.4851, |
|
"eval_samples_per_second": 24.749, |
|
"eval_steps_per_second": 3.182, |
|
"step": 29890 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"learning_rate": 4.915198527478307e-05, |
|
"loss": 0.1926, |
|
"step": 34160 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_cer": 0.12727272727272726, |
|
"eval_loss": 1.098648190498352, |
|
"eval_new_wer": 0.14761904761904762, |
|
"eval_old_wer": 0.23809523809523808, |
|
"eval_runtime": 8.5184, |
|
"eval_samples_per_second": 24.653, |
|
"eval_steps_per_second": 3.17, |
|
"step": 34160 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"learning_rate": 4.213778595845386e-05, |
|
"loss": 0.1601, |
|
"step": 38430 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_cer": 0.14805194805194805, |
|
"eval_loss": 1.2215726375579834, |
|
"eval_new_wer": 0.18095238095238095, |
|
"eval_old_wer": 0.24285714285714285, |
|
"eval_runtime": 8.367, |
|
"eval_samples_per_second": 25.098, |
|
"eval_steps_per_second": 3.227, |
|
"step": 38430 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"learning_rate": 3.5121943202734684e-05, |
|
"loss": 0.1317, |
|
"step": 42700 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_cer": 0.12034632034632034, |
|
"eval_loss": 0.9588236212730408, |
|
"eval_new_wer": 0.14761904761904762, |
|
"eval_old_wer": 0.20476190476190476, |
|
"eval_runtime": 8.5613, |
|
"eval_samples_per_second": 24.529, |
|
"eval_steps_per_second": 3.154, |
|
"step": 42700 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"learning_rate": 2.8106100447015514e-05, |
|
"loss": 0.1088, |
|
"step": 46970 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_cer": 0.09610389610389611, |
|
"eval_loss": 0.7578983902931213, |
|
"eval_new_wer": 0.10476190476190476, |
|
"eval_old_wer": 0.1761904761904762, |
|
"eval_runtime": 8.5378, |
|
"eval_samples_per_second": 24.597, |
|
"eval_steps_per_second": 3.162, |
|
"step": 46970 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"learning_rate": 2.1093544570076258e-05, |
|
"loss": 0.0892, |
|
"step": 51240 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_cer": 0.10043290043290043, |
|
"eval_loss": 0.7190653681755066, |
|
"eval_new_wer": 0.11428571428571428, |
|
"eval_old_wer": 0.16666666666666666, |
|
"eval_runtime": 8.7441, |
|
"eval_samples_per_second": 24.016, |
|
"eval_steps_per_second": 3.088, |
|
"step": 51240 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"learning_rate": 1.4079345253747043e-05, |
|
"loss": 0.0714, |
|
"step": 55510 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_cer": 0.08398268398268398, |
|
"eval_loss": 0.4884723424911499, |
|
"eval_new_wer": 0.09523809523809523, |
|
"eval_old_wer": 0.14285714285714285, |
|
"eval_runtime": 8.4874, |
|
"eval_samples_per_second": 24.743, |
|
"eval_steps_per_second": 3.181, |
|
"step": 55510 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"learning_rate": 7.063502498027873e-06, |
|
"loss": 0.0573, |
|
"step": 59780 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_cer": 0.09177489177489177, |
|
"eval_loss": 0.5790263414382935, |
|
"eval_new_wer": 0.10952380952380952, |
|
"eval_old_wer": 0.14285714285714285, |
|
"eval_runtime": 8.6001, |
|
"eval_samples_per_second": 24.418, |
|
"eval_steps_per_second": 3.139, |
|
"step": 59780 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"learning_rate": 4.7659742308703654e-08, |
|
"loss": 0.0469, |
|
"step": 64050 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_cer": 0.09004329004329005, |
|
"eval_loss": 0.6429840922355652, |
|
"eval_new_wer": 0.09523809523809523, |
|
"eval_old_wer": 0.14285714285714285, |
|
"eval_runtime": 8.622, |
|
"eval_samples_per_second": 24.356, |
|
"eval_steps_per_second": 3.132, |
|
"step": 64050 |
|
} |
|
], |
|
"max_steps": 64050, |
|
"num_train_epochs": 15, |
|
"total_flos": 4.852750717448731e+19, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|