{ "best_metric": null, "best_model_checkpoint": null, "epoch": 0.9947774185525988, "global_step": 8500, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.06, "learning_rate": 0.00015, "loss": 2.3077, "step": 500 }, { "epoch": 0.06, "eval_loss": 0.9413899183273315, "eval_phone_accuracy": 0.7518319068307362, "eval_runtime": 12.1406, "eval_samples_per_second": 16.474, "eval_steps_per_second": 4.118, "step": 500 }, { "epoch": 0.12, "learning_rate": 0.0003, "loss": 1.1762, "step": 1000 }, { "epoch": 0.12, "eval_loss": 0.6205331683158875, "eval_phone_accuracy": 0.8215267480076658, "eval_runtime": 10.7397, "eval_samples_per_second": 18.623, "eval_steps_per_second": 4.656, "step": 1000 }, { "epoch": 0.18, "learning_rate": 0.00028011664899257687, "loss": 0.8235, "step": 1500 }, { "epoch": 0.18, "eval_loss": 0.4551730751991272, "eval_phone_accuracy": 0.8648594743186174, "eval_runtime": 10.6304, "eval_samples_per_second": 18.814, "eval_steps_per_second": 4.703, "step": 1500 }, { "epoch": 0.23, "learning_rate": 0.0002602332979851537, "loss": 0.6647, "step": 2000 }, { "epoch": 0.23, "eval_loss": 0.3814973533153534, "eval_phone_accuracy": 0.8815525898176332, "eval_runtime": 11.7606, "eval_samples_per_second": 17.006, "eval_steps_per_second": 4.251, "step": 2000 }, { "epoch": 0.29, "learning_rate": 0.0002403499469777306, "loss": 0.5809, "step": 2500 }, { "epoch": 0.29, "eval_loss": 0.3442990481853485, "eval_phone_accuracy": 0.8922361837370032, "eval_runtime": 11.2643, "eval_samples_per_second": 17.755, "eval_steps_per_second": 4.439, "step": 2500 }, { "epoch": 0.35, "learning_rate": 0.00022046659597030753, "loss": 0.5289, "step": 3000 }, { "epoch": 0.35, "eval_loss": 0.314848929643631, "eval_phone_accuracy": 0.9002575509248419, "eval_runtime": 11.2871, "eval_samples_per_second": 17.719, "eval_steps_per_second": 4.43, "step": 3000 }, { "epoch": 0.41, "learning_rate": 0.0002005832449628844, "loss": 0.4896, "step": 3500 }, { "epoch": 0.41, "eval_loss": 0.30238407850265503, "eval_phone_accuracy": 0.9030845408742857, "eval_runtime": 11.2397, "eval_samples_per_second": 17.794, "eval_steps_per_second": 4.449, "step": 3500 }, { "epoch": 0.47, "learning_rate": 0.0001806998939554613, "loss": 0.4622, "step": 4000 }, { "epoch": 0.47, "eval_loss": 0.2689047157764435, "eval_phone_accuracy": 0.9141496917193476, "eval_runtime": 12.0191, "eval_samples_per_second": 16.64, "eval_steps_per_second": 4.16, "step": 4000 }, { "epoch": 0.53, "learning_rate": 0.00016081654294803816, "loss": 0.4386, "step": 4500 }, { "epoch": 0.53, "eval_loss": 0.2747265696525574, "eval_phone_accuracy": 0.9112533277834144, "eval_runtime": 11.09, "eval_samples_per_second": 18.034, "eval_steps_per_second": 4.509, "step": 4500 }, { "epoch": 0.59, "learning_rate": 0.00014093319194061505, "loss": 0.419, "step": 5000 }, { "epoch": 0.59, "eval_loss": 0.2555970251560211, "eval_phone_accuracy": 0.9181213524458666, "eval_runtime": 11.6344, "eval_samples_per_second": 17.19, "eval_steps_per_second": 4.298, "step": 5000 }, { "epoch": 0.64, "learning_rate": 0.00012104984093319194, "loss": 0.4032, "step": 5500 }, { "epoch": 0.64, "eval_loss": 0.2447209358215332, "eval_phone_accuracy": 0.920003121829392, "eval_runtime": 10.8148, "eval_samples_per_second": 18.493, "eval_steps_per_second": 4.623, "step": 5500 }, { "epoch": 0.7, "learning_rate": 0.00010116648992576882, "loss": 0.3892, "step": 6000 }, { "epoch": 0.7, "eval_loss": 0.23665592074394226, "eval_phone_accuracy": 0.9239054085694217, "eval_runtime": 10.9341, "eval_samples_per_second": 18.291, "eval_steps_per_second": 4.573, "step": 6000 }, { "epoch": 0.76, "learning_rate": 8.12831389183457e-05, "loss": 0.3786, "step": 6500 }, { "epoch": 0.76, "eval_loss": 0.2295096516609192, "eval_phone_accuracy": 0.9251801555711647, "eval_runtime": 10.8468, "eval_samples_per_second": 18.439, "eval_steps_per_second": 4.61, "step": 6500 }, { "epoch": 0.82, "learning_rate": 6.139978791092258e-05, "loss": 0.3701, "step": 7000 }, { "epoch": 0.82, "eval_loss": 0.22638411819934845, "eval_phone_accuracy": 0.9254229645238776, "eval_runtime": 10.8611, "eval_samples_per_second": 18.414, "eval_steps_per_second": 4.604, "step": 7000 }, { "epoch": 0.88, "learning_rate": 4.151643690349946e-05, "loss": 0.3592, "step": 7500 }, { "epoch": 0.88, "eval_loss": 0.2183924913406372, "eval_phone_accuracy": 0.9286401831473243, "eval_runtime": 11.5166, "eval_samples_per_second": 17.366, "eval_steps_per_second": 4.342, "step": 7500 }, { "epoch": 0.94, "learning_rate": 2.163308589607635e-05, "loss": 0.3511, "step": 8000 }, { "epoch": 0.94, "eval_loss": 0.2142486721277237, "eval_phone_accuracy": 0.9288309616101702, "eval_runtime": 11.0635, "eval_samples_per_second": 18.077, "eval_steps_per_second": 4.519, "step": 8000 }, { "epoch": 0.99, "learning_rate": 1.7497348886532342e-06, "loss": 0.3459, "step": 8500 }, { "epoch": 0.99, "eval_loss": 0.2112182378768921, "eval_phone_accuracy": 0.9303051588230703, "eval_runtime": 10.7118, "eval_samples_per_second": 18.671, "eval_steps_per_second": 4.668, "step": 8500 } ], "max_steps": 8544, "num_train_epochs": 1, "total_flos": 1.2317797842209997e+19, "trial_name": null, "trial_params": null }