{ "best_metric": null, "best_model_checkpoint": null, "epoch": 1.8777365254128793, "global_step": 11000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.09, "learning_rate": 0.00025, "loss": 1.6044, "step": 500 }, { "epoch": 0.17, "learning_rate": 0.0005, "loss": 0.957, "step": 1000 }, { "epoch": 0.17, "eval_loss": 0.7217180132865906, "eval_phone_accuracy": 0.7656547891757681, "eval_runtime": 9.9001, "eval_samples_per_second": 20.202, "eval_steps_per_second": 1.717, "step": 1000 }, { "epoch": 0.26, "learning_rate": 0.0004766703994027622, "loss": 0.8156, "step": 1500 }, { "epoch": 0.34, "learning_rate": 0.0004533407988055245, "loss": 0.7327, "step": 2000 }, { "epoch": 0.34, "eval_loss": 0.5681599974632263, "eval_phone_accuracy": 0.8123568272172383, "eval_runtime": 9.9031, "eval_samples_per_second": 20.196, "eval_steps_per_second": 1.717, "step": 2000 }, { "epoch": 0.43, "learning_rate": 0.00043001119820828664, "loss": 0.6781, "step": 2500 }, { "epoch": 0.51, "learning_rate": 0.0004066815976110489, "loss": 0.6426, "step": 3000 }, { "epoch": 0.51, "eval_loss": 0.4999035894870758, "eval_phone_accuracy": 0.8317913778579135, "eval_runtime": 9.8493, "eval_samples_per_second": 20.306, "eval_steps_per_second": 1.726, "step": 3000 }, { "epoch": 0.6, "learning_rate": 0.0003833519970138111, "loss": 0.6148, "step": 3500 }, { "epoch": 0.68, "learning_rate": 0.0003600223964165734, "loss": 0.5924, "step": 4000 }, { "epoch": 0.68, "eval_loss": 0.4667314887046814, "eval_phone_accuracy": 0.8421219869056944, "eval_runtime": 10.1485, "eval_samples_per_second": 19.707, "eval_steps_per_second": 1.675, "step": 4000 }, { "epoch": 0.77, "learning_rate": 0.0003366927958193356, "loss": 0.5743, "step": 4500 }, { "epoch": 0.85, "learning_rate": 0.0003133631952220978, "loss": 0.559, "step": 5000 }, { "epoch": 0.85, "eval_loss": 0.43349266052246094, "eval_phone_accuracy": 0.8515954066476509, "eval_runtime": 10.2876, "eval_samples_per_second": 19.441, "eval_steps_per_second": 1.652, "step": 5000 }, { "epoch": 0.94, "learning_rate": 0.00029003359462486, "loss": 0.5442, "step": 5500 }, { "epoch": 1.02, "learning_rate": 0.00026670399402762223, "loss": 0.5294, "step": 6000 }, { "epoch": 1.02, "eval_loss": 0.4208233654499054, "eval_phone_accuracy": 0.8561843252590042, "eval_runtime": 10.0364, "eval_samples_per_second": 19.928, "eval_steps_per_second": 1.694, "step": 6000 }, { "epoch": 1.11, "learning_rate": 0.00024337439343038447, "loss": 0.5128, "step": 6500 }, { "epoch": 1.19, "learning_rate": 0.0002200447928331467, "loss": 0.5037, "step": 7000 }, { "epoch": 1.19, "eval_loss": 0.40133553743362427, "eval_phone_accuracy": 0.8622585460295878, "eval_runtime": 10.294, "eval_samples_per_second": 19.429, "eval_steps_per_second": 1.651, "step": 7000 }, { "epoch": 1.28, "learning_rate": 0.00019671519223590892, "loss": 0.497, "step": 7500 }, { "epoch": 1.37, "learning_rate": 0.00017338559163867115, "loss": 0.4918, "step": 8000 }, { "epoch": 1.37, "eval_loss": 0.3905256986618042, "eval_phone_accuracy": 0.8658424840754918, "eval_runtime": 10.3057, "eval_samples_per_second": 19.407, "eval_steps_per_second": 1.65, "step": 8000 }, { "epoch": 1.45, "learning_rate": 0.0001500559910414334, "loss": 0.4832, "step": 8500 }, { "epoch": 1.54, "learning_rate": 0.0001267263904441956, "loss": 0.475, "step": 9000 }, { "epoch": 1.54, "eval_loss": 0.37418654561042786, "eval_phone_accuracy": 0.8692195143579209, "eval_runtime": 10.1391, "eval_samples_per_second": 19.726, "eval_steps_per_second": 1.677, "step": 9000 }, { "epoch": 1.62, "learning_rate": 0.00010339678984695783, "loss": 0.4684, "step": 9500 }, { "epoch": 1.71, "learning_rate": 8.006718924972005e-05, "loss": 0.4647, "step": 10000 }, { "epoch": 1.71, "eval_loss": 0.36982452869415283, "eval_phone_accuracy": 0.8727960628408435, "eval_runtime": 9.9379, "eval_samples_per_second": 20.125, "eval_steps_per_second": 1.711, "step": 10000 }, { "epoch": 1.79, "learning_rate": 5.678424785367675e-05, "loss": 0.4579, "step": 10500 }, { "epoch": 1.88, "learning_rate": 3.345464725643897e-05, "loss": 0.4556, "step": 11000 }, { "epoch": 1.88, "eval_loss": 0.3634908199310303, "eval_phone_accuracy": 0.875249397750617, "eval_runtime": 10.1013, "eval_samples_per_second": 19.799, "eval_steps_per_second": 1.683, "step": 11000 } ], "max_steps": 11716, "num_train_epochs": 2, "total_flos": 1.8523977459584336e+19, "trial_name": null, "trial_params": null }