{ "best_metric": null, "best_model_checkpoint": null, "epoch": 45.45340050377834, "global_step": 6000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 3.79, "learning_rate": 0.00039436231366470835, "loss": 1.5121, "step": 500 }, { "epoch": 3.79, "eval_loss": 0.186998650431633, "eval_runtime": 714.138, "eval_samples_per_second": 7.242, "eval_wer": 0.39502654080485317, "step": 500 }, { "epoch": 7.57, "learning_rate": 0.00037776708973098473, "loss": 0.1108, "step": 1000 }, { "epoch": 7.57, "eval_loss": 0.16734005510807037, "eval_runtime": 670.8576, "eval_samples_per_second": 7.71, "eval_wer": 0.33428339826896425, "step": 1000 }, { "epoch": 11.36, "learning_rate": 0.0003511499148708517, "loss": 0.0666, "step": 1500 }, { "epoch": 11.36, "eval_loss": 0.17631034553050995, "eval_runtime": 758.94, "eval_samples_per_second": 6.815, "eval_wer": 0.3243469393091546, "step": 1500 }, { "epoch": 15.15, "learning_rate": 0.00031601138191423965, "loss": 0.0459, "step": 2000 }, { "epoch": 15.15, "eval_loss": 0.2086898684501648, "eval_runtime": 682.0381, "eval_samples_per_second": 7.583, "eval_wer": 0.32364092775148395, "step": 2000 }, { "epoch": 18.94, "learning_rate": 0.0002743324911320655, "loss": 0.0358, "step": 2500 }, { "epoch": 18.94, "eval_loss": 0.1979219615459442, "eval_runtime": 700.5817, "eval_samples_per_second": 7.382, "eval_wer": 0.3092069136835499, "step": 2500 }, { "epoch": 22.73, "learning_rate": 0.00022846296765465705, "loss": 0.0285, "step": 3000 }, { "epoch": 22.73, "eval_loss": 0.19415870308876038, "eval_runtime": 1037.6087, "eval_samples_per_second": 4.985, "eval_wer": 0.3047093585754256, "step": 3000 }, { "epoch": 26.51, "learning_rate": 0.0001809887913391635, "loss": 0.0237, "step": 3500 }, { "epoch": 26.51, "eval_loss": 0.1929541826248169, "eval_runtime": 764.504, "eval_samples_per_second": 6.765, "eval_wer": 0.30026410061972125, "step": 3500 }, { "epoch": 30.3, "learning_rate": 0.0001345864073365157, "loss": 0.0205, "step": 4000 }, { "epoch": 30.3, "eval_loss": 0.2030186504125595, "eval_runtime": 1540.1942, "eval_samples_per_second": 3.358, "eval_wer": 0.29338702507648456, "step": 4000 }, { "epoch": 34.09, "learning_rate": 9.187183650888056e-05, "loss": 0.0174, "step": 4500 }, { "epoch": 34.09, "eval_loss": 0.20308123528957367, "eval_runtime": 964.2383, "eval_samples_per_second": 5.364, "eval_wer": 0.29469445388698584, "step": 4500 }, { "epoch": 37.88, "learning_rate": 5.5253192378985966e-05, "loss": 0.0151, "step": 5000 }, { "epoch": 37.88, "eval_loss": 0.20086798071861267, "eval_runtime": 715.6106, "eval_samples_per_second": 7.227, "eval_wer": 0.28739900112438876, "step": 5000 }, { "epoch": 41.66, "learning_rate": 2.679491924311226e-05, "loss": 0.0138, "step": 5500 }, { "epoch": 41.66, "eval_loss": 0.20132462680339813, "eval_runtime": 773.3872, "eval_samples_per_second": 6.687, "eval_wer": 0.2842350234029757, "step": 5500 }, { "epoch": 45.45, "learning_rate": 8.10140527710055e-06, "loss": 0.0122, "step": 6000 }, { "epoch": 45.45, "eval_loss": 0.20383873581886292, "eval_runtime": 957.0431, "eval_samples_per_second": 5.404, "eval_wer": 0.28167246293439324, "step": 6000 } ], "max_steps": 6600, "num_train_epochs": 50, "total_flos": 9.394750356471834e+19, "trial_name": null, "trial_params": null }