{ "best_metric": 58.830205811138015, "best_model_checkpoint": "./checkpoint-300", "epoch": 11.11111111111111, "global_step": 300, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 3.7, "learning_rate": 1.9200000000000003e-06, "loss": 2.1183, "step": 100 }, { "epoch": 3.7, "eval_loss": 1.3170489072799683, "eval_runtime": 435.5063, "eval_samples_per_second": 1.176, "eval_steps_per_second": 0.147, "eval_wer": 76.95217917675545, "step": 100 }, { "epoch": 7.41, "learning_rate": 3.920000000000001e-06, "loss": 0.8565, "step": 200 }, { "epoch": 7.41, "eval_loss": 0.9366902709007263, "eval_runtime": 473.9252, "eval_samples_per_second": 1.08, "eval_steps_per_second": 0.135, "eval_wer": 61.99303874092009, "step": 200 }, { "epoch": 7.78, "learning_rate": 4.12e-06, "loss": 0.5824, "step": 210 }, { "epoch": 8.15, "learning_rate": 4.32e-06, "loss": 0.5195, "step": 220 }, { "epoch": 8.52, "learning_rate": 4.520000000000001e-06, "loss": 0.4472, "step": 230 }, { "epoch": 8.89, "learning_rate": 4.7200000000000005e-06, "loss": 0.4615, "step": 240 }, { "epoch": 9.26, "learning_rate": 4.92e-06, "loss": 0.4068, "step": 250 }, { "epoch": 9.63, "learning_rate": 5.12e-06, "loss": 0.3408, "step": 260 }, { "epoch": 10.0, "learning_rate": 5.320000000000001e-06, "loss": 0.3718, "step": 270 }, { "epoch": 10.37, "learning_rate": 5.5200000000000005e-06, "loss": 0.2749, "step": 280 }, { "epoch": 10.74, "learning_rate": 5.72e-06, "loss": 0.2625, "step": 290 }, { "epoch": 11.11, "learning_rate": 5.92e-06, "loss": 0.2246, "step": 300 }, { "epoch": 11.11, "eval_loss": 0.9642460942268372, "eval_runtime": 439.7231, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.146, "eval_wer": 58.830205811138015, "step": 300 }, { "epoch": 11.11, "step": 300, "total_flos": 1.38203548213248e+18, "train_loss": 0.1297293774286906, "train_runtime": 532.6482, "train_samples_per_second": 9.012, "train_steps_per_second": 0.563 } ], "max_steps": 300, "num_train_epochs": 12, "total_flos": 1.38203548213248e+18, "trial_name": null, "trial_params": null }