{ "best_metric": null, "best_model_checkpoint": null, "epoch": 28.93617021276596, "global_step": 6800, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.7, "learning_rate": 0.00023999999999999998, "loss": 4.3481, "step": 400 }, { "epoch": 1.7, "eval_loss": 2.619910955429077, "eval_runtime": 671.3151, "eval_samples_per_second": 7.704, "eval_wer": 0.99997385142379, "step": 400 }, { "epoch": 3.4, "learning_rate": 0.00028625954198473283, "loss": 0.5343, "step": 800 }, { "epoch": 3.4, "eval_loss": 0.27097710967063904, "eval_runtime": 691.1513, "eval_samples_per_second": 7.483, "eval_wer": 0.4792511047773449, "step": 800 }, { "epoch": 5.11, "learning_rate": 0.0002679389312977099, "loss": 0.1541, "step": 1200 }, { "epoch": 5.11, "eval_loss": 0.2556667923927307, "eval_runtime": 706.9613, "eval_samples_per_second": 7.316, "eval_wer": 0.44368904113171037, "step": 1200 }, { "epoch": 6.81, "learning_rate": 0.00024961832061068704, "loss": 0.1049, "step": 1600 }, { "epoch": 6.81, "eval_loss": 0.23636971414089203, "eval_runtime": 720.2903, "eval_samples_per_second": 7.18, "eval_wer": 0.4181680307507256, "step": 1600 }, { "epoch": 8.51, "learning_rate": 0.0002312977099236641, "loss": 0.0867, "step": 2000 }, { "epoch": 8.51, "eval_loss": 0.24546758830547333, "eval_runtime": 728.0447, "eval_samples_per_second": 7.104, "eval_wer": 0.40582590277959363, "step": 2000 }, { "epoch": 10.21, "learning_rate": 0.0002129770992366412, "loss": 0.0696, "step": 2400 }, { "epoch": 10.21, "eval_loss": 0.26230543851852417, "eval_runtime": 725.2392, "eval_samples_per_second": 7.131, "eval_wer": 0.3916272258975499, "step": 2400 }, { "epoch": 11.91, "learning_rate": 0.0001946564885496183, "loss": 0.0637, "step": 2800 }, { "epoch": 11.91, "eval_loss": 0.2552664577960968, "eval_runtime": 729.1761, "eval_samples_per_second": 7.093, "eval_wer": 0.3940067463326622, "step": 2800 }, { "epoch": 13.62, "learning_rate": 0.0001763358778625954, "loss": 0.0554, "step": 3200 }, { "epoch": 13.62, "eval_loss": 0.24944408237934113, "eval_runtime": 725.5889, "eval_samples_per_second": 7.128, "eval_wer": 0.3822660356143608, "step": 3200 }, { "epoch": 15.32, "learning_rate": 0.0001580152671755725, "loss": 0.0477, "step": 3600 }, { "epoch": 15.32, "eval_loss": 0.25511008501052856, "eval_runtime": 714.9627, "eval_samples_per_second": 7.234, "eval_wer": 0.38171691551395026, "step": 3600 }, { "epoch": 17.02, "learning_rate": 0.0001396946564885496, "loss": 0.0441, "step": 4000 }, { "epoch": 17.02, "eval_loss": 0.26531100273132324, "eval_runtime": 724.9275, "eval_samples_per_second": 7.135, "eval_wer": 0.3808540124990194, "step": 4000 }, { "epoch": 18.72, "learning_rate": 0.00012137404580152671, "loss": 0.0414, "step": 4400 }, { "epoch": 18.72, "eval_loss": 0.2718845307826996, "eval_runtime": 724.6581, "eval_samples_per_second": 7.137, "eval_wer": 0.3761211202050048, "step": 4400 }, { "epoch": 20.43, "learning_rate": 0.00010305343511450381, "loss": 0.0364, "step": 4800 }, { "epoch": 20.43, "eval_loss": 0.2734206020832062, "eval_runtime": 721.5427, "eval_samples_per_second": 7.168, "eval_wer": 0.36911330178071805, "step": 4800 }, { "epoch": 22.13, "learning_rate": 8.473282442748092e-05, "loss": 0.0345, "step": 5200 }, { "epoch": 22.13, "eval_loss": 0.2777670919895172, "eval_runtime": 750.8687, "eval_samples_per_second": 6.888, "eval_wer": 0.3657924326020448, "step": 5200 }, { "epoch": 23.83, "learning_rate": 6.641221374045802e-05, "loss": 0.0304, "step": 5600 }, { "epoch": 23.83, "eval_loss": 0.2627178430557251, "eval_runtime": 737.7059, "eval_samples_per_second": 7.011, "eval_wer": 0.36197474047538114, "step": 5600 }, { "epoch": 25.53, "learning_rate": 4.809160305343511e-05, "loss": 0.028, "step": 6000 }, { "epoch": 25.53, "eval_loss": 0.2723003923892975, "eval_runtime": 739.1125, "eval_samples_per_second": 6.998, "eval_wer": 0.3572156996051565, "step": 6000 }, { "epoch": 27.23, "learning_rate": 2.977099236641221e-05, "loss": 0.0257, "step": 6400 }, { "epoch": 27.23, "eval_loss": 0.2800405025482178, "eval_runtime": 740.691, "eval_samples_per_second": 6.983, "eval_wer": 0.353633344664383, "step": 6400 }, { "epoch": 28.94, "learning_rate": 1.1450381679389312e-05, "loss": 0.0257, "step": 6800 }, { "epoch": 28.94, "eval_loss": 0.27684447169303894, "eval_runtime": 742.5074, "eval_samples_per_second": 6.966, "eval_wer": 0.35324111602123265, "step": 6800 } ], "max_steps": 7050, "num_train_epochs": 30, "total_flos": 3.4777475593836667e+19, "trial_name": null, "trial_params": null }