{ "best_metric": null, "best_model_checkpoint": null, "epoch": 15.0, "global_step": 1635, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.92, "eval_loss": 3.5931618213653564, "eval_runtime": 126.9872, "eval_samples_per_second": 12.97, "eval_steps_per_second": 1.622, "eval_wer": 1.0, "step": 100 }, { "epoch": 1.83, "eval_loss": 3.0185344219207764, "eval_runtime": 122.4223, "eval_samples_per_second": 13.453, "eval_steps_per_second": 1.683, "eval_wer": 0.9998978653865795, "step": 200 }, { "epoch": 2.75, "eval_loss": 0.9357358813285828, "eval_runtime": 124.4606, "eval_samples_per_second": 13.233, "eval_steps_per_second": 1.655, "eval_wer": 0.8007353692166275, "step": 300 }, { "epoch": 3.67, "eval_loss": 0.5944719910621643, "eval_runtime": 124.5538, "eval_samples_per_second": 13.223, "eval_steps_per_second": 1.654, "eval_wer": 0.63180471861914, "step": 400 }, { "epoch": 4.59, "learning_rate": 0.0002988, "loss": 3.1829, "step": 500 }, { "epoch": 4.59, "eval_loss": 0.4931354224681854, "eval_runtime": 132.5462, "eval_samples_per_second": 12.426, "eval_steps_per_second": 1.554, "eval_wer": 0.5265039321826167, "step": 500 }, { "epoch": 5.5, "eval_loss": 0.47567814588546753, "eval_runtime": 131.8607, "eval_samples_per_second": 12.49, "eval_steps_per_second": 1.562, "eval_wer": 0.47839852926156673, "step": 600 }, { "epoch": 6.42, "eval_loss": 0.4281878173351288, "eval_runtime": 125.8942, "eval_samples_per_second": 13.082, "eval_steps_per_second": 1.636, "eval_wer": 0.45398835665407006, "step": 700 }, { "epoch": 7.34, "eval_loss": 0.3994791507720947, "eval_runtime": 125.4372, "eval_samples_per_second": 13.13, "eval_steps_per_second": 1.642, "eval_wer": 0.4251863956694924, "step": 800 }, { "epoch": 8.26, "eval_loss": 0.4046003818511963, "eval_runtime": 121.2245, "eval_samples_per_second": 13.586, "eval_steps_per_second": 1.699, "eval_wer": 0.4148707997140231, "step": 900 }, { "epoch": 9.17, "learning_rate": 0.00016837004405286342, "loss": 0.2215, "step": 1000 }, { "epoch": 9.17, "eval_loss": 0.4047873914241791, "eval_runtime": 124.6186, "eval_samples_per_second": 13.216, "eval_steps_per_second": 1.653, "eval_wer": 0.39505668471044836, "step": 1000 }, { "epoch": 10.09, "eval_loss": 0.39440903067588806, "eval_runtime": 125.2639, "eval_samples_per_second": 13.148, "eval_steps_per_second": 1.645, "eval_wer": 0.38647737718312736, "step": 1100 }, { "epoch": 11.01, "eval_loss": 0.38526079058647156, "eval_runtime": 122.7703, "eval_samples_per_second": 13.415, "eval_steps_per_second": 1.678, "eval_wer": 0.3643141660708814, "step": 1200 }, { "epoch": 11.93, "eval_loss": 0.395017147064209, "eval_runtime": 125.4537, "eval_samples_per_second": 13.128, "eval_steps_per_second": 1.642, "eval_wer": 0.36319068532325605, "step": 1300 }, { "epoch": 12.84, "eval_loss": 0.3835676610469818, "eval_runtime": 124.6558, "eval_samples_per_second": 13.212, "eval_steps_per_second": 1.653, "eval_wer": 0.350628127872536, "step": 1400 }, { "epoch": 13.76, "learning_rate": 3.621145374449339e-05, "loss": 0.1009, "step": 1500 }, { "epoch": 13.76, "eval_loss": 0.38080519437789917, "eval_runtime": 122.1546, "eval_samples_per_second": 13.483, "eval_steps_per_second": 1.686, "eval_wer": 0.35103666632621794, "step": 1500 }, { "epoch": 14.68, "eval_loss": 0.38068610429763794, "eval_runtime": 125.0336, "eval_samples_per_second": 13.172, "eval_steps_per_second": 1.648, "eval_wer": 0.3456235318149321, "step": 1600 }, { "epoch": 15.0, "step": 1635, "total_flos": 6.464559143942451e+18, "train_loss": 1.0781283684826772, "train_runtime": 7410.3512, "train_samples_per_second": 7.04, "train_steps_per_second": 0.221 } ], "max_steps": 1635, "num_train_epochs": 15, "total_flos": 6.464559143942451e+18, "trial_name": null, "trial_params": null }