{ "best_metric": null, "best_model_checkpoint": null, "epoch": 13.791738382099828, "global_step": 2000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.03, "learning_rate": 9.99965514863094e-07, "loss": 0.0333, "step": 150 }, { "epoch": 2.07, "learning_rate": 9.99862059452376e-07, "loss": 0.0332, "step": 300 }, { "epoch": 3.1, "learning_rate": 9.99758604041658e-07, "loss": 0.0336, "step": 450 }, { "epoch": 3.45, "eval_loss": 0.21229705214500427, "eval_runtime": 487.1939, "eval_samples_per_second": 10.649, "eval_steps_per_second": 1.332, "eval_wer": 0.1448122092799754, "step": 500 }, { "epoch": 4.14, "learning_rate": 9.9965514863094e-07, "loss": 0.0329, "step": 600 }, { "epoch": 5.17, "learning_rate": 9.995516932202221e-07, "loss": 0.0323, "step": 750 }, { "epoch": 6.21, "learning_rate": 9.99448237809504e-07, "loss": 0.0317, "step": 900 }, { "epoch": 6.9, "eval_loss": 0.20801204442977905, "eval_runtime": 282.77, "eval_samples_per_second": 18.347, "eval_steps_per_second": 2.295, "eval_wer": 0.14550417099142737, "step": 1000 }, { "epoch": 7.24, "learning_rate": 9.993454721015242e-07, "loss": 0.0323, "step": 1050 }, { "epoch": 8.28, "learning_rate": 9.992420166908062e-07, "loss": 0.031, "step": 1200 }, { "epoch": 9.31, "learning_rate": 9.991385612800883e-07, "loss": 0.0314, "step": 1350 }, { "epoch": 10.34, "learning_rate": 9.990351058693703e-07, "loss": 0.0317, "step": 1500 }, { "epoch": 10.34, "eval_loss": 0.2071654200553894, "eval_runtime": 303.1157, "eval_samples_per_second": 17.116, "eval_steps_per_second": 2.141, "eval_wer": 0.14465844001076386, "step": 1500 }, { "epoch": 11.38, "learning_rate": 9.989316504586522e-07, "loss": 0.031, "step": 1650 }, { "epoch": 12.41, "learning_rate": 9.988281950479342e-07, "loss": 0.0318, "step": 1800 }, { "epoch": 13.45, "learning_rate": 9.987247396372162e-07, "loss": 0.0314, "step": 1950 }, { "epoch": 13.79, "eval_loss": 0.20706616342067719, "eval_runtime": 287.3918, "eval_samples_per_second": 18.052, "eval_steps_per_second": 2.258, "eval_wer": 0.1442355745204321, "step": 2000 } ], "max_steps": 1450000, "num_train_epochs": 10000, "total_flos": 5.652539665735567e+19, "trial_name": null, "trial_params": null }