{ "best_metric": null, "best_model_checkpoint": null, "epoch": 7.72454448017149, "global_step": 3600, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.86, "learning_rate": 0.0002394, "loss": 3.2993, "step": 400 }, { "epoch": 0.86, "eval_loss": null, "eval_runtime": 828.7984, "eval_samples_per_second": 9.006, "eval_steps_per_second": 1.126, "eval_wer": 0.36457931084030065, "step": 400 }, { "epoch": 1.72, "learning_rate": 0.0002723048327137546, "loss": 0.3837, "step": 800 }, { "epoch": 1.72, "eval_loss": null, "eval_runtime": 820.745, "eval_samples_per_second": 9.094, "eval_steps_per_second": 1.137, "eval_wer": 0.25638285452569753, "step": 800 }, { "epoch": 2.57, "learning_rate": 0.00023522304832713752, "loss": 0.2576, "step": 1200 }, { "epoch": 2.57, "eval_loss": null, "eval_runtime": 816.7249, "eval_samples_per_second": 9.139, "eval_steps_per_second": 1.142, "eval_wer": 0.17959103032697818, "step": 1200 }, { "epoch": 3.43, "learning_rate": 0.0001981412639405204, "loss": 0.1963, "step": 1600 }, { "epoch": 3.43, "eval_loss": null, "eval_runtime": 819.1322, "eval_samples_per_second": 9.112, "eval_steps_per_second": 1.139, "eval_wer": 0.1695059854696326, "step": 1600 }, { "epoch": 4.29, "learning_rate": 0.00016096654275092934, "loss": 0.158, "step": 2000 }, { "epoch": 4.29, "eval_loss": null, "eval_runtime": 815.3058, "eval_samples_per_second": 9.155, "eval_steps_per_second": 1.144, "eval_wer": 0.16685675284904763, "step": 2000 }, { "epoch": 5.15, "learning_rate": 0.00012388475836431226, "loss": 0.125, "step": 2400 }, { "epoch": 5.15, "eval_loss": null, "eval_runtime": 815.712, "eval_samples_per_second": 9.15, "eval_steps_per_second": 1.144, "eval_wer": 0.15157202769570643, "step": 2400 }, { "epoch": 6.01, "learning_rate": 8.680297397769517e-05, "loss": 0.101, "step": 2800 }, { "epoch": 6.01, "eval_loss": null, "eval_runtime": 815.5191, "eval_samples_per_second": 
9.152, "eval_steps_per_second": 1.144, "eval_wer": 0.1440015087155263, "step": 2800 }, { "epoch": 6.87, "learning_rate": 4.972118959107806e-05, "loss": 0.0793, "step": 3200 }, { "epoch": 6.87, "eval_loss": null, "eval_runtime": 816.2609, "eval_samples_per_second": 9.144, "eval_steps_per_second": 1.143, "eval_wer": 0.139223909548912, "step": 3200 }, { "epoch": 7.72, "learning_rate": 1.2639405204460965e-05, "loss": 0.0642, "step": 3600 }, { "epoch": 7.72, "eval_loss": null, "eval_runtime": 815.052, "eval_samples_per_second": 9.158, "eval_steps_per_second": 1.145, "eval_wer": 0.1354611011827252, "step": 3600 } ], "max_steps": 3728, "num_train_epochs": 8, "total_flos": 4.913815144448316e+19, "trial_name": null, "trial_params": null }