|
{ |
|
"best_metric": 1.0035810470581055, |
|
"best_model_checkpoint": "ckpt_base/checkpoint-1740", |
|
"epoch": 4.0, |
|
"global_step": 1740, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"eval_loss": 1.1327471733093262, |
|
"eval_runtime": 5108.4501, |
|
"eval_samples_per_second": 0.623, |
|
"eval_steps_per_second": 0.311, |
|
"eval_wer": 1053.8786428269746, |
|
"step": 435 |
|
}, |
|
{ |
|
"epoch": 1.15, |
|
"learning_rate": 2.47e-06, |
|
"loss": 1.8361, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_loss": 1.05120849609375, |
|
"eval_runtime": 3561.6255, |
|
"eval_samples_per_second": 0.893, |
|
"eval_steps_per_second": 0.447, |
|
"eval_wer": 648.7118119104604, |
|
"step": 870 |
|
}, |
|
{ |
|
"epoch": 2.3, |
|
"learning_rate": 4.970000000000001e-06, |
|
"loss": 1.0706, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_loss": 1.0082696676254272, |
|
"eval_runtime": 3000.1391, |
|
"eval_samples_per_second": 1.061, |
|
"eval_steps_per_second": 0.53, |
|
"eval_wer": 531.1980853160636, |
|
"step": 1305 |
|
}, |
|
{ |
|
"epoch": 3.45, |
|
"learning_rate": 4.679220779220779e-06, |
|
"loss": 0.953, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_loss": 1.0035810470581055, |
|
"eval_runtime": 2833.412, |
|
"eval_samples_per_second": 1.123, |
|
"eval_steps_per_second": 0.562, |
|
"eval_wer": 529.7761509221456, |
|
"step": 1740 |
|
} |
|
], |
|
"max_steps": 8700, |
|
"num_train_epochs": 20, |
|
"total_flos": 5.902415445120726e+19, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|