{ "best_metric": null, "best_model_checkpoint": null, "epoch": 15.0, "global_step": 15075, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "learning_rate": 9.828934506353862e-05, "loss": 13.903, "step": 1005 }, { "epoch": 1.0, "eval_cer": 1.0, "eval_loss": 3.025165557861328, "eval_new_wer": 1.0, "eval_old_wer": 1.0, "eval_runtime": 7.9108, "eval_samples_per_second": 26.546, "eval_steps_per_second": 3.413, "step": 1005 }, { "epoch": 2.0, "learning_rate": 9.127216869152354e-05, "loss": 1.953, "step": 2010 }, { "epoch": 2.0, "eval_cer": 0.13593073593073593, "eval_loss": 0.31833797693252563, "eval_new_wer": 0.0, "eval_old_wer": 0.5619047619047619, "eval_runtime": 7.8333, "eval_samples_per_second": 26.809, "eval_steps_per_second": 3.447, "step": 2010 }, { "epoch": 3.0, "learning_rate": 8.425499231950845e-05, "loss": 0.5726, "step": 3015 }, { "epoch": 3.0, "eval_cer": 0.08917748917748917, "eval_loss": 0.17662236094474792, "eval_new_wer": 0.0, "eval_old_wer": 0.47619047619047616, "eval_runtime": 7.8634, "eval_samples_per_second": 26.706, "eval_steps_per_second": 3.434, "step": 3015 }, { "epoch": 4.0, "learning_rate": 7.723781594749337e-05, "loss": 0.3529, "step": 4020 }, { "epoch": 4.0, "eval_cer": 0.08744588744588745, "eval_loss": 0.12508022785186768, "eval_new_wer": 0.0, "eval_old_wer": 0.4714285714285714, "eval_runtime": 7.8841, "eval_samples_per_second": 26.636, "eval_steps_per_second": 3.425, "step": 4020 }, { "epoch": 5.0, "learning_rate": 7.022063957547829e-05, "loss": 0.2463, "step": 5025 }, { "epoch": 5.0, "eval_cer": 0.015584415584415584, "eval_loss": 0.09194076061248779, "eval_new_wer": 0.0, "eval_old_wer": 0.07142857142857142, "eval_runtime": 7.9312, "eval_samples_per_second": 26.478, "eval_steps_per_second": 3.404, "step": 5025 }, { "epoch": 6.0, "learning_rate": 6.320346320346321e-05, "loss": 0.2048, "step": 6030 }, { "epoch": 6.0, "eval_cer": 0.006060606060606061, "eval_loss": 0.10927814245223999, "eval_new_wer": 0.0, "eval_old_wer": 0.03333333333333333, "eval_runtime": 7.8986, "eval_samples_per_second": 26.587, "eval_steps_per_second": 3.418, "step": 6030 }, { "epoch": 7.0, "learning_rate": 5.618628683144812e-05, "loss": 0.1658, "step": 7035 }, { "epoch": 7.0, "eval_cer": 0.011255411255411256, "eval_loss": 0.3268298804759979, "eval_new_wer": 0.0, "eval_old_wer": 0.06190476190476191, "eval_runtime": 7.9129, "eval_samples_per_second": 26.539, "eval_steps_per_second": 3.412, "step": 7035 }, { "epoch": 8.0, "learning_rate": 4.9169110459433046e-05, "loss": 0.1457, "step": 8040 }, { "epoch": 8.0, "eval_cer": 0.009523809523809525, "eval_loss": 0.11435961723327637, "eval_new_wer": 0.0, "eval_old_wer": 0.047619047619047616, "eval_runtime": 7.9596, "eval_samples_per_second": 26.383, "eval_steps_per_second": 3.392, "step": 8040 }, { "epoch": 9.0, "learning_rate": 4.215193408741796e-05, "loss": 0.1222, "step": 9045 }, { "epoch": 9.0, "eval_cer": 0.009523809523809525, "eval_loss": 0.12004613131284714, "eval_new_wer": 0.0, "eval_old_wer": 0.05238095238095238, "eval_runtime": 8.023, "eval_samples_per_second": 26.175, "eval_steps_per_second": 3.365, "step": 9045 }, { "epoch": 10.0, "learning_rate": 3.514173998044966e-05, "loss": 0.1137, "step": 10050 }, { "epoch": 10.0, "eval_cer": 0.007792207792207792, "eval_loss": 0.12371435761451721, "eval_new_wer": 0.0, "eval_old_wer": 0.04285714285714286, "eval_runtime": 8.0733, "eval_samples_per_second": 26.012, "eval_steps_per_second": 3.344, "step": 10050 }, { "epoch": 11.0, "learning_rate": 2.8124563608434578e-05, "loss": 0.0942, "step": 11055 }, { "epoch": 11.0, "eval_cer": 0.0025974025974025974, "eval_loss": 0.02394554764032364, "eval_new_wer": 0.0, "eval_old_wer": 0.014285714285714285, "eval_runtime": 7.8921, "eval_samples_per_second": 26.609, "eval_steps_per_second": 3.421, "step": 11055 }, { "epoch": 12.0, "learning_rate": 2.1107387236419494e-05, "loss": 0.0843, "step": 12060 }, { "epoch": 12.0, "eval_cer": 0.008658008658008658, "eval_loss": 0.04588039219379425, "eval_new_wer": 0.0, "eval_old_wer": 0.04285714285714286, "eval_runtime": 7.897, "eval_samples_per_second": 26.592, "eval_steps_per_second": 3.419, "step": 12060 }, { "epoch": 13.0, "learning_rate": 1.4097193129451195e-05, "loss": 0.0761, "step": 13065 }, { "epoch": 13.0, "eval_cer": 0.0, "eval_loss": 0.001758816302753985, "eval_new_wer": 0.0, "eval_old_wer": 0.0, "eval_runtime": 7.8846, "eval_samples_per_second": 26.634, "eval_steps_per_second": 3.424, "step": 13065 }, { "epoch": 14.0, "learning_rate": 7.080016757436113e-06, "loss": 0.0667, "step": 14070 }, { "epoch": 14.0, "eval_cer": 0.0017316017316017316, "eval_loss": 0.007288647349923849, "eval_new_wer": 0.0, "eval_old_wer": 0.009523809523809525, "eval_runtime": 7.9378, "eval_samples_per_second": 26.456, "eval_steps_per_second": 3.401, "step": 14070 }, { "epoch": 15.0, "learning_rate": 6.284038542103058e-08, "loss": 0.061, "step": 15075 }, { "epoch": 15.0, "eval_cer": 0.003463203463203463, "eval_loss": 0.012480901554226875, "eval_new_wer": 0.0, "eval_old_wer": 0.01904761904761905, "eval_runtime": 7.8979, "eval_samples_per_second": 26.589, "eval_steps_per_second": 3.419, "step": 15075 } ], "max_steps": 15075, "num_train_epochs": 15, "total_flos": 1.1047783836795744e+19, "trial_name": null, "trial_params": null }