|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 60.0, |
|
"global_step": 1260, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 4.76, |
|
"learning_rate": 0.00015, |
|
"loss": 10.7834, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 4.76, |
|
"eval_loss": 3.1524412631988525, |
|
"eval_runtime": 53.4465, |
|
"eval_samples_per_second": 8.719, |
|
"eval_wer": 1.0, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 9.52, |
|
"learning_rate": 0.0003, |
|
"loss": 3.0788, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 9.52, |
|
"eval_loss": 3.044459104537964, |
|
"eval_runtime": 54.4604, |
|
"eval_samples_per_second": 8.557, |
|
"eval_wer": 1.0, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 14.29, |
|
"learning_rate": 0.00023023255813953486, |
|
"loss": 2.9807, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 14.29, |
|
"eval_loss": 2.9658894538879395, |
|
"eval_runtime": 54.1542, |
|
"eval_samples_per_second": 8.605, |
|
"eval_wer": 1.0, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 19.05, |
|
"learning_rate": 0.00016046511627906975, |
|
"loss": 2.2974, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 19.05, |
|
"eval_loss": 0.9927442669868469, |
|
"eval_runtime": 55.0174, |
|
"eval_samples_per_second": 8.47, |
|
"eval_wer": 0.9315901489814533, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 23.81, |
|
"learning_rate": 9.069767441860464e-05, |
|
"loss": 0.6448, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 23.81, |
|
"eval_loss": 0.5772319436073303, |
|
"eval_runtime": 54.9367, |
|
"eval_samples_per_second": 8.482, |
|
"eval_wer": 0.6889632107023411, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 28.57, |
|
"learning_rate": 2.0930232558139532e-05, |
|
"loss": 0.3268, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 28.57, |
|
"eval_loss": 0.5437523126602173, |
|
"eval_runtime": 54.9465, |
|
"eval_samples_per_second": 8.481, |
|
"eval_wer": 0.629674673152934, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 33.33, |
|
"learning_rate": 0.00015849056603773584, |
|
"loss": 0.2512, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 33.33, |
|
"eval_loss": 0.5623383522033691, |
|
"eval_runtime": 53.3134, |
|
"eval_samples_per_second": 8.741, |
|
"eval_wer": 0.5916692003648525, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 38.1, |
|
"learning_rate": 0.000130188679245283, |
|
"loss": 0.1599, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 38.1, |
|
"eval_loss": 0.5707418322563171, |
|
"eval_runtime": 54.2873, |
|
"eval_samples_per_second": 8.584, |
|
"eval_wer": 0.5852842809364549, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 42.86, |
|
"learning_rate": 0.00010188679245283017, |
|
"loss": 0.1179, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 42.86, |
|
"eval_loss": 0.5668476223945618, |
|
"eval_runtime": 54.4224, |
|
"eval_samples_per_second": 8.563, |
|
"eval_wer": 0.5655214350866524, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 47.62, |
|
"learning_rate": 7.358490566037735e-05, |
|
"loss": 0.092, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 47.62, |
|
"eval_loss": 0.6057275533676147, |
|
"eval_runtime": 54.8666, |
|
"eval_samples_per_second": 8.493, |
|
"eval_wer": 0.5640012161751292, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 52.38, |
|
"learning_rate": 4.528301886792452e-05, |
|
"loss": 0.0808, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 52.38, |
|
"eval_loss": 0.6176655888557434, |
|
"eval_runtime": 55.0084, |
|
"eval_samples_per_second": 8.471, |
|
"eval_wer": 0.5506232897537245, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 57.14, |
|
"learning_rate": 1.6981132075471696e-05, |
|
"loss": 0.0862, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 57.14, |
|
"eval_loss": 0.639299213886261, |
|
"eval_runtime": 55.7062, |
|
"eval_samples_per_second": 8.365, |
|
"eval_wer": 0.5649133475220431, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"step": 1260, |
|
"total_flos": 1.120772175088509e+19, |
|
"train_runtime": 5433.1006, |
|
"train_samples_per_second": 0.232 |
|
} |
|
], |
|
"max_steps": 1260, |
|
"num_train_epochs": 60, |
|
"total_flos": 1.120772175088509e+19, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|