|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 200.0, |
|
"global_step": 51600, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 25.0, |
|
"learning_rate": 9.47515299877601e-05, |
|
"loss": 26.7169, |
|
"step": 6450 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_cer": 1.0, |
|
"eval_loss": 3.334904909133911, |
|
"eval_runtime": 8.0603, |
|
"eval_samples_per_second": 26.054, |
|
"eval_steps_per_second": 3.35, |
|
"eval_wer": 1.0, |
|
"step": 6450 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"learning_rate": 8.422521419828641e-05, |
|
"loss": 3.1417, |
|
"step": 12900 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"eval_cer": 0.9991341991341991, |
|
"eval_loss": 3.1051225662231445, |
|
"eval_runtime": 7.9823, |
|
"eval_samples_per_second": 26.308, |
|
"eval_steps_per_second": 3.382, |
|
"eval_wer": 1.0, |
|
"step": 12900 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"learning_rate": 7.370216238270095e-05, |
|
"loss": 2.8102, |
|
"step": 19350 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"eval_cer": 0.9298701298701298, |
|
"eval_loss": 2.55711030960083, |
|
"eval_runtime": 8.1516, |
|
"eval_samples_per_second": 25.762, |
|
"eval_steps_per_second": 3.312, |
|
"eval_wer": 1.0, |
|
"step": 19350 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"learning_rate": 6.318074255405957e-05, |
|
"loss": 2.5334, |
|
"step": 25800 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"eval_cer": 0.8883116883116883, |
|
"eval_loss": 2.404860496520996, |
|
"eval_runtime": 8.0509, |
|
"eval_samples_per_second": 26.084, |
|
"eval_steps_per_second": 3.354, |
|
"eval_wer": 1.0, |
|
"step": 25800 |
|
}, |
|
{ |
|
"epoch": 125.0, |
|
"learning_rate": 5.2657690738474096e-05, |
|
"loss": 2.4155, |
|
"step": 32250 |
|
}, |
|
{ |
|
"epoch": 125.0, |
|
"eval_cer": 0.8571428571428571, |
|
"eval_loss": 2.3261098861694336, |
|
"eval_runtime": 8.0386, |
|
"eval_samples_per_second": 26.124, |
|
"eval_steps_per_second": 3.359, |
|
"eval_wer": 0.9952380952380953, |
|
"step": 32250 |
|
}, |
|
{ |
|
"epoch": 150.0, |
|
"learning_rate": 4.213463892288862e-05, |
|
"loss": 2.3529, |
|
"step": 38700 |
|
}, |
|
{ |
|
"epoch": 150.0, |
|
"eval_cer": 0.8545454545454545, |
|
"eval_loss": 2.290559768676758, |
|
"eval_runtime": 8.0265, |
|
"eval_samples_per_second": 26.163, |
|
"eval_steps_per_second": 3.364, |
|
"eval_wer": 0.9952380952380953, |
|
"step": 38700 |
|
}, |
|
{ |
|
"epoch": 175.0, |
|
"learning_rate": 3.161158710730314e-05, |
|
"loss": 2.3158, |
|
"step": 45150 |
|
}, |
|
{ |
|
"epoch": 175.0, |
|
"eval_cer": 0.8363636363636363, |
|
"eval_loss": 2.258056402206421, |
|
"eval_runtime": 8.0276, |
|
"eval_samples_per_second": 26.16, |
|
"eval_steps_per_second": 3.363, |
|
"eval_wer": 0.9952380952380953, |
|
"step": 45150 |
|
}, |
|
{ |
|
"epoch": 200.0, |
|
"learning_rate": 2.109016727866177e-05, |
|
"loss": 2.2885, |
|
"step": 51600 |
|
}, |
|
{ |
|
"epoch": 200.0, |
|
"eval_cer": 0.8337662337662337, |
|
"eval_loss": 2.2457661628723145, |
|
"eval_runtime": 8.1248, |
|
"eval_samples_per_second": 25.847, |
|
"eval_steps_per_second": 3.323, |
|
"eval_wer": 0.9952380952380953, |
|
"step": 51600 |
|
} |
|
], |
|
"max_steps": 64500, |
|
"num_train_epochs": 250, |
|
"total_flos": 4.958565694536252e+19, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|