{ "best_metric": null, "best_model_checkpoint": null, "epoch": 15.0, "global_step": 1260, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.19, "eval_loss": 4.574927806854248, "eval_runtime": 492.4632, "eval_samples_per_second": 22.05, "eval_steps_per_second": 0.345, "eval_wer": 1.0, "step": 100 }, { "epoch": 2.38, "eval_loss": 3.2543928623199463, "eval_runtime": 477.4917, "eval_samples_per_second": 22.742, "eval_steps_per_second": 0.356, "eval_wer": 1.0, "step": 200 }, { "epoch": 3.57, "eval_loss": 3.110656261444092, "eval_runtime": 470.1018, "eval_samples_per_second": 23.099, "eval_steps_per_second": 0.362, "eval_wer": 1.000137922254286, "step": 300 }, { "epoch": 4.76, "eval_loss": 0.9151943922042847, "eval_runtime": 469.7177, "eval_samples_per_second": 23.118, "eval_steps_per_second": 0.362, "eval_wer": 1.017081140723137, "step": 400 }, { "epoch": 5.95, "learning_rate": 0.0003, "loss": 3.9561, "step": 500 }, { "epoch": 5.95, "eval_loss": 0.6422096490859985, "eval_runtime": 477.7033, "eval_samples_per_second": 22.732, "eval_steps_per_second": 0.356, "eval_wer": 1.059041334238669, "step": 500 }, { "epoch": 7.14, "eval_loss": 0.49003028869628906, "eval_runtime": 424.1123, "eval_samples_per_second": 25.604, "eval_steps_per_second": 0.401, "eval_wer": 1.0866682227126125, "step": 600 }, { "epoch": 8.33, "eval_loss": 0.4251333475112915, "eval_runtime": 495.8179, "eval_samples_per_second": 21.901, "eval_steps_per_second": 0.343, "eval_wer": 1.095516465795281, "step": 700 }, { "epoch": 9.52, "eval_loss": 0.4232262969017029, "eval_runtime": 527.1122, "eval_samples_per_second": 20.601, "eval_steps_per_second": 0.323, "eval_wer": 1.1464522152435919, "step": 800 }, { "epoch": 10.71, "eval_loss": 0.4133465588092804, "eval_runtime": 479.4028, "eval_samples_per_second": 22.651, "eval_steps_per_second": 0.355, "eval_wer": 1.1194300628076728, "step": 900 }, { "epoch": 11.9, "learning_rate": 0.00010263157894736841, "loss": 0.2637, "step": 1000 }, { "epoch": 11.9, "eval_loss": 0.3940434157848358, "eval_runtime": 489.7721, "eval_samples_per_second": 22.172, "eval_steps_per_second": 0.347, "eval_wer": 1.13066542182991, "step": 1000 }, { "epoch": 13.1, "eval_loss": 0.3943102955818176, "eval_runtime": 478.1637, "eval_samples_per_second": 22.71, "eval_steps_per_second": 0.356, "eval_wer": 1.0963758275335258, "step": 1100 }, { "epoch": 14.29, "eval_loss": 0.3974030613899231, "eval_runtime": 476.6101, "eval_samples_per_second": 22.784, "eval_steps_per_second": 0.357, "eval_wer": 1.0893630113732813, "step": 1200 }, { "epoch": 15.0, "step": 1260, "total_flos": 2.676196803813189e+19, "train_loss": 1.7017262231735957, "train_runtime": 141338.6512, "train_samples_per_second": 1.71, "train_steps_per_second": 0.009 } ], "max_steps": 1260, "num_train_epochs": 15, "total_flos": 2.676196803813189e+19, "trial_name": null, "trial_params": null }