|
{ |
|
"best_metric": 0.30957943925233644, |
|
"best_model_checkpoint": "/content/drive/MyDrive/wav2vec2-large-xlsr-persian-asr-shemo/checkpoint-700", |
|
"epoch": 6.25, |
|
"eval_steps": 100, |
|
"global_step": 1000, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.62, |
|
"learning_rate": 1.98e-06, |
|
"loss": 0.7564, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 0.62, |
|
"eval_loss": 0.6704742908477783, |
|
"eval_runtime": 35.2821, |
|
"eval_samples_per_second": 8.049, |
|
"eval_steps_per_second": 1.02, |
|
"eval_wer": 0.3130841121495327, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 1.25, |
|
"learning_rate": 3.96e-06, |
|
"loss": 0.7761, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 1.25, |
|
"eval_loss": 0.666378378868103, |
|
"eval_runtime": 34.5662, |
|
"eval_samples_per_second": 8.216, |
|
"eval_steps_per_second": 1.041, |
|
"eval_wer": 0.3139602803738318, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 1.88, |
|
"learning_rate": 5.94e-06, |
|
"loss": 0.7722, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 1.88, |
|
"eval_loss": 0.6573134064674377, |
|
"eval_runtime": 34.2808, |
|
"eval_samples_per_second": 8.285, |
|
"eval_steps_per_second": 1.05, |
|
"eval_wer": 0.31366822429906543, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 2.5, |
|
"learning_rate": 7.94e-06, |
|
"loss": 0.7035, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 2.5, |
|
"eval_loss": 0.6626747846603394, |
|
"eval_runtime": 33.8115, |
|
"eval_samples_per_second": 8.4, |
|
"eval_steps_per_second": 1.065, |
|
"eval_wer": 0.3157126168224299, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 3.12, |
|
"learning_rate": 9.920000000000002e-06, |
|
"loss": 0.7026, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 3.12, |
|
"eval_loss": 0.6833900213241577, |
|
"eval_runtime": 34.2659, |
|
"eval_samples_per_second": 8.288, |
|
"eval_steps_per_second": 1.051, |
|
"eval_wer": 0.3107476635514019, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 3.75, |
|
"learning_rate": 8.08e-06, |
|
"loss": 0.7213, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 3.75, |
|
"eval_loss": 0.6561282277107239, |
|
"eval_runtime": 34.3134, |
|
"eval_samples_per_second": 8.277, |
|
"eval_steps_per_second": 1.049, |
|
"eval_wer": 0.31688084112149534, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 4.38, |
|
"learning_rate": 6.08e-06, |
|
"loss": 0.6996, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 4.38, |
|
"eval_loss": 0.6663690209388733, |
|
"eval_runtime": 34.836, |
|
"eval_samples_per_second": 8.152, |
|
"eval_steps_per_second": 1.033, |
|
"eval_wer": 0.30957943925233644, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"learning_rate": 4.08e-06, |
|
"loss": 0.7146, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_loss": 0.6592983603477478, |
|
"eval_runtime": 34.5134, |
|
"eval_samples_per_second": 8.229, |
|
"eval_steps_per_second": 1.043, |
|
"eval_wer": 0.3148364485981308, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 5.62, |
|
"learning_rate": 2.08e-06, |
|
"loss": 0.7071, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 5.62, |
|
"eval_loss": 0.6645920276641846, |
|
"eval_runtime": 34.6798, |
|
"eval_samples_per_second": 8.189, |
|
"eval_steps_per_second": 1.038, |
|
"eval_wer": 0.3125, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 6.25, |
|
"learning_rate": 8e-08, |
|
"loss": 0.7065, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 6.25, |
|
"eval_loss": 0.6634251475334167, |
|
"eval_runtime": 36.7008, |
|
"eval_samples_per_second": 7.738, |
|
"eval_steps_per_second": 0.981, |
|
"eval_wer": 0.3107476635514019, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 6.25, |
|
"step": 1000, |
|
"total_flos": 4.798362622332561e+18, |
|
"train_loss": 0.7259744338989258, |
|
"train_runtime": 4809.6219, |
|
"train_samples_per_second": 3.327, |
|
"train_steps_per_second": 0.208 |
|
} |
|
], |
|
"logging_steps": 100, |
|
"max_steps": 1000, |
|
"num_train_epochs": 7, |
|
"save_steps": 100, |
|
"total_flos": 4.798362622332561e+18, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|