{ "best_metric": null, "best_model_checkpoint": null, "epoch": 150.0, "global_step": 47400, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 15.0, "learning_rate": 9.475238729735733e-05, "loss": 4.9125, "step": 4740 }, { "epoch": 15.0, "eval_cer": 0.7454545454545455, "eval_loss": 5.065438270568848, "eval_runtime": 5.2761, "eval_samples_per_second": 26.535, "eval_steps_per_second": 3.412, "eval_wer": 1.0, "step": 4740 }, { "epoch": 30.0, "learning_rate": 8.422829224961137e-05, "loss": 0.3161, "step": 9480 }, { "epoch": 30.0, "eval_cer": 0.7896103896103897, "eval_loss": 7.881378173828125, "eval_runtime": 5.2288, "eval_samples_per_second": 26.775, "eval_steps_per_second": 3.442, "eval_wer": 1.0, "step": 9480 }, { "epoch": 45.0, "learning_rate": 7.370419720186542e-05, "loss": 0.1445, "step": 14220 }, { "epoch": 45.0, "eval_cer": 0.7285714285714285, "eval_loss": 11.377739906311035, "eval_runtime": 5.8797, "eval_samples_per_second": 23.811, "eval_steps_per_second": 3.061, "eval_wer": 1.0, "step": 14220 }, { "epoch": 60.0, "learning_rate": 6.318454363757495e-05, "loss": 0.0968, "step": 18960 }, { "epoch": 60.0, "eval_cer": 0.8090909090909091, "eval_loss": 12.136865615844727, "eval_runtime": 5.012, "eval_samples_per_second": 27.933, "eval_steps_per_second": 3.591, "eval_wer": 0.9857142857142858, "step": 18960 }, { "epoch": 75.0, "learning_rate": 5.2660448589829e-05, "loss": 0.0671, "step": 23700 }, { "epoch": 75.0, "eval_cer": 0.8233766233766234, "eval_loss": 14.418416976928711, "eval_runtime": 5.0373, "eval_samples_per_second": 27.793, "eval_steps_per_second": 3.573, "eval_wer": 1.0, "step": 23700 }, { "epoch": 90.0, "learning_rate": 4.2138574283810795e-05, "loss": 0.047, "step": 28440 }, { "epoch": 90.0, "eval_cer": 0.8220779220779221, "eval_loss": 12.429436683654785, "eval_runtime": 6.0466, "eval_samples_per_second": 23.154, "eval_steps_per_second": 2.977, "eval_wer": 1.0, "step": 28440 }, { "epoch": 105.0, "learning_rate": 3.1614479236064846e-05, "loss": 0.0298, "step": 33180 }, { "epoch": 105.0, "eval_cer": 0.7688311688311689, "eval_loss": 16.444717407226562, "eval_runtime": 5.0177, "eval_samples_per_second": 27.901, "eval_steps_per_second": 3.587, "eval_wer": 1.0, "step": 33180 }, { "epoch": 120.0, "learning_rate": 2.1092604930046634e-05, "loss": 0.0212, "step": 37920 }, { "epoch": 120.0, "eval_cer": 0.7636363636363637, "eval_loss": 19.72909164428711, "eval_runtime": 4.9946, "eval_samples_per_second": 28.03, "eval_steps_per_second": 3.604, "eval_wer": 1.0, "step": 37920 }, { "epoch": 135.0, "learning_rate": 1.0568509882300689e-05, "loss": 0.0131, "step": 42660 }, { "epoch": 135.0, "eval_cer": 0.7766233766233767, "eval_loss": 17.405521392822266, "eval_runtime": 5.0395, "eval_samples_per_second": 27.781, "eval_steps_per_second": 3.572, "eval_wer": 1.0, "step": 42660 }, { "epoch": 150.0, "learning_rate": 4.8856318010215416e-08, "loss": 0.0102, "step": 47400 }, { "epoch": 150.0, "eval_cer": 0.7688311688311689, "eval_loss": 21.693923950195312, "eval_runtime": 5.0223, "eval_samples_per_second": 27.876, "eval_steps_per_second": 3.584, "eval_wer": 1.0, "step": 47400 } ], "max_steps": 47400, "num_train_epochs": 150, "total_flos": 3.507003787332655e+19, "trial_name": null, "trial_params": null }