|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 100.0, |
|
"global_step": 341600, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 10.0, |
|
"learning_rate": 9.474208061136448e-05, |
|
"loss": 14.0127, |
|
"step": 34160 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_cer": 0.9619047619047619, |
|
"eval_loss": 3.3398807048797607, |
|
"eval_runtime": 1.0489, |
|
"eval_samples_per_second": 200.219, |
|
"eval_steps_per_second": 25.742, |
|
"eval_wer": 1.0, |
|
"step": 34160 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"learning_rate": 8.422007888573894e-05, |
|
"loss": 2.7792, |
|
"step": 68320 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_cer": 0.9402597402597402, |
|
"eval_loss": 3.2982892990112305, |
|
"eval_runtime": 1.0271, |
|
"eval_samples_per_second": 204.45, |
|
"eval_steps_per_second": 26.286, |
|
"eval_wer": 1.0, |
|
"step": 68320 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"learning_rate": 7.36980771601134e-05, |
|
"loss": 2.7144, |
|
"step": 102480 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"eval_cer": 0.935064935064935, |
|
"eval_loss": 3.2650129795074463, |
|
"eval_runtime": 1.0213, |
|
"eval_samples_per_second": 205.615, |
|
"eval_steps_per_second": 26.436, |
|
"eval_wer": 1.0, |
|
"step": 102480 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"learning_rate": 6.317607543448786e-05, |
|
"loss": 2.6884, |
|
"step": 136640 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"eval_cer": 0.9341991341991343, |
|
"eval_loss": 3.2275328636169434, |
|
"eval_runtime": 1.0304, |
|
"eval_samples_per_second": 203.803, |
|
"eval_steps_per_second": 26.203, |
|
"eval_wer": 1.0, |
|
"step": 136640 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"learning_rate": 5.26537655614446e-05, |
|
"loss": 2.6742, |
|
"step": 170800 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"eval_cer": 0.935064935064935, |
|
"eval_loss": 3.228600025177002, |
|
"eval_runtime": 1.0287, |
|
"eval_samples_per_second": 204.145, |
|
"eval_steps_per_second": 26.247, |
|
"eval_wer": 1.0, |
|
"step": 170800 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"learning_rate": 4.213176383581906e-05, |
|
"loss": 2.6644, |
|
"step": 204960 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"eval_cer": 0.935064935064935, |
|
"eval_loss": 3.192678213119507, |
|
"eval_runtime": 1.0316, |
|
"eval_samples_per_second": 203.564, |
|
"eval_steps_per_second": 26.172, |
|
"eval_wer": 1.0, |
|
"step": 204960 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"learning_rate": 3.161007025761124e-05, |
|
"loss": 2.659, |
|
"step": 239120 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"eval_cer": 0.9333333333333333, |
|
"eval_loss": 3.189307689666748, |
|
"eval_runtime": 1.0408, |
|
"eval_samples_per_second": 201.77, |
|
"eval_steps_per_second": 25.942, |
|
"eval_wer": 1.0, |
|
"step": 239120 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"learning_rate": 2.108776038456798e-05, |
|
"loss": 2.6548, |
|
"step": 273280 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"eval_cer": 0.9324675324675324, |
|
"eval_loss": 3.1870908737182617, |
|
"eval_runtime": 1.0301, |
|
"eval_samples_per_second": 203.86, |
|
"eval_steps_per_second": 26.211, |
|
"eval_wer": 1.0, |
|
"step": 273280 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"learning_rate": 1.0566066806360162e-05, |
|
"loss": 2.6524, |
|
"step": 307440 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"eval_cer": 0.9324675324675324, |
|
"eval_loss": 3.1949210166931152, |
|
"eval_runtime": 1.0305, |
|
"eval_samples_per_second": 203.786, |
|
"eval_steps_per_second": 26.201, |
|
"eval_wer": 1.0, |
|
"step": 307440 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"learning_rate": 4.4373228152348083e-08, |
|
"loss": 2.651, |
|
"step": 341600 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"eval_cer": 0.9324675324675324, |
|
"eval_loss": 3.189643144607544, |
|
"eval_runtime": 1.0382, |
|
"eval_samples_per_second": 202.281, |
|
"eval_steps_per_second": 26.008, |
|
"eval_wer": 1.0, |
|
"step": 341600 |
|
} |
|
], |
|
"max_steps": 341600, |
|
"num_train_epochs": 100, |
|
"total_flos": 3.24550895516716e+20, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|