{ "best_metric": null, "best_model_checkpoint": null, "epoch": 19.230215827338128, "global_step": 4000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.44, "learning_rate": 0.00017879999999999998, "loss": 3.4798, "step": 300 }, { "epoch": 1.92, "eval_loss": 4.179981231689453, "eval_runtime": 203.6334, "eval_samples_per_second": 10.966, "eval_steps_per_second": 1.375, "eval_wer": 0.9931173409434279, "step": 400 }, { "epoch": 2.88, "learning_rate": 0.0002948780487804878, "loss": 3.4274, "step": 600 }, { "epoch": 3.84, "eval_loss": 3.7398014068603516, "eval_runtime": 203.914, "eval_samples_per_second": 10.951, "eval_steps_per_second": 1.373, "eval_wer": 0.9930334060768843, "step": 800 }, { "epoch": 4.33, "learning_rate": 0.00027919860627177696, "loss": 3.3742, "step": 900 }, { "epoch": 5.77, "learning_rate": 0.0002635191637630662, "loss": 3.3302, "step": 1200 }, { "epoch": 5.77, "eval_loss": 3.6393752098083496, "eval_runtime": 206.073, "eval_samples_per_second": 10.836, "eval_steps_per_second": 1.359, "eval_wer": 0.995971126405909, "step": 1200 }, { "epoch": 7.21, "learning_rate": 0.0002478397212543554, "loss": 3.2912, "step": 1500 }, { "epoch": 7.69, "eval_loss": 3.7553415298461914, "eval_runtime": 204.658, "eval_samples_per_second": 10.911, "eval_steps_per_second": 1.368, "eval_wer": 0.9923619271445359, "step": 1600 }, { "epoch": 8.65, "learning_rate": 0.0002321602787456446, "loss": 3.2096, "step": 1800 }, { "epoch": 9.61, "eval_loss": 3.4753119945526123, "eval_runtime": 204.5164, "eval_samples_per_second": 10.918, "eval_steps_per_second": 1.369, "eval_wer": 0.9903474903474904, "step": 2000 }, { "epoch": 10.1, "learning_rate": 0.0002164808362369338, "loss": 3.1291, "step": 2100 }, { "epoch": 11.54, "learning_rate": 0.0002009059233449477, "loss": 3.0236, "step": 2400 }, { "epoch": 11.54, "eval_loss": 3.3585305213928223, "eval_runtime": 201.3035, "eval_samples_per_second": 11.093, "eval_steps_per_second": 1.391, "eval_wer": 0.9937888198757764, "step": 2400 }, { "epoch": 12.98, "learning_rate": 0.0001852264808362369, "loss": 2.8714, "step": 2700 }, { "epoch": 13.46, "eval_loss": 3.3223414421081543, "eval_runtime": 204.2132, "eval_samples_per_second": 10.935, "eval_steps_per_second": 1.371, "eval_wer": 0.9984891724022159, "step": 2800 }, { "epoch": 14.42, "learning_rate": 0.00016954703832752614, "loss": 2.7351, "step": 3000 }, { "epoch": 15.38, "eval_loss": 3.2935783863067627, "eval_runtime": 202.4119, "eval_samples_per_second": 11.032, "eval_steps_per_second": 1.383, "eval_wer": 0.9994963908007386, "step": 3200 }, { "epoch": 15.86, "learning_rate": 0.00015386759581881532, "loss": 2.5377, "step": 3300 }, { "epoch": 17.31, "learning_rate": 0.00013818815331010452, "loss": 2.4208, "step": 3600 }, { "epoch": 17.31, "eval_loss": 3.3104729652404785, "eval_runtime": 203.9464, "eval_samples_per_second": 10.949, "eval_steps_per_second": 1.373, "eval_wer": 1.0033573946617425, "step": 3600 }, { "epoch": 18.75, "learning_rate": 0.00012250871080139372, "loss": 2.2863, "step": 3900 }, { "epoch": 19.23, "eval_loss": 3.474734306335449, "eval_runtime": 201.7307, "eval_samples_per_second": 11.069, "eval_steps_per_second": 1.388, "eval_wer": 1.011499076716468, "step": 4000 } ], "max_steps": 6240, "num_train_epochs": 30, "total_flos": 6.355921309017135e+18, "trial_name": null, "trial_params": null }