{ "best_metric": 1.7099316120147705, "best_model_checkpoint": "models/opus-mt-en-id-opus100/checkpoint-31250", "epoch": 15.0, "global_step": 468750, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "learning_rate": 9.649404953361209e-05, "loss": 1.6086, "step": 31250 }, { "epoch": 1.0, "eval_bleu": 29.4293, "eval_loss": 1.7099316120147705, "eval_runtime": 35.1916, "eval_samples_per_second": 56.832, "eval_steps_per_second": 1.79, "step": 31250 }, { "epoch": 2.0, "learning_rate": 9.247346413637826e-05, "loss": 1.5762, "step": 62500 }, { "epoch": 2.0, "eval_bleu": 28.948, "eval_loss": 1.7409919500350952, "eval_runtime": 34.945, "eval_samples_per_second": 57.233, "eval_steps_per_second": 1.803, "step": 62500 }, { "epoch": 3.0, "learning_rate": 8.845287873914442e-05, "loss": 1.5027, "step": 93750 }, { "epoch": 3.0, "eval_bleu": 28.6931, "eval_loss": 1.767769694328308, "eval_runtime": 34.3563, "eval_samples_per_second": 58.214, "eval_steps_per_second": 1.834, "step": 93750 }, { "epoch": 4.0, "learning_rate": 8.443229334191058e-05, "loss": 1.4377, "step": 125000 }, { "epoch": 4.0, "eval_bleu": 28.9463, "eval_loss": 1.779849648475647, "eval_runtime": 34.8763, "eval_samples_per_second": 57.345, "eval_steps_per_second": 1.806, "step": 125000 }, { "epoch": 5.0, "learning_rate": 8.041170794467674e-05, "loss": 1.3763, "step": 156250 }, { "epoch": 5.0, "eval_bleu": 28.4966, "eval_loss": 1.8018742799758911, "eval_runtime": 37.3892, "eval_samples_per_second": 53.491, "eval_steps_per_second": 1.685, "step": 156250 }, { "epoch": 6.0, "learning_rate": 7.63911225474429e-05, "loss": 1.3198, "step": 187500 }, { "epoch": 6.0, "eval_bleu": 29.6279, "eval_loss": 1.8202235698699951, "eval_runtime": 35.8037, "eval_samples_per_second": 55.86, "eval_steps_per_second": 1.76, "step": 187500 }, { "epoch": 7.0, "learning_rate": 7.237053715020908e-05, "loss": 1.2648, "step": 218750 }, { "epoch": 7.0, "eval_bleu": 29.8151, "eval_loss": 1.8312174081802368, "eval_runtime": 34.1488, "eval_samples_per_second": 58.567, "eval_steps_per_second": 1.845, "step": 218750 }, { "epoch": 8.0, "learning_rate": 6.834995175297524e-05, "loss": 1.2115, "step": 250000 }, { "epoch": 8.0, "eval_bleu": 29.3032, "eval_loss": 1.8490322828292847, "eval_runtime": 35.0418, "eval_samples_per_second": 57.075, "eval_steps_per_second": 1.798, "step": 250000 }, { "epoch": 9.0, "learning_rate": 6.43293663557414e-05, "loss": 1.1584, "step": 281250 }, { "epoch": 9.0, "eval_bleu": 28.7282, "eval_loss": 1.8729382753372192, "eval_runtime": 35.1809, "eval_samples_per_second": 56.849, "eval_steps_per_second": 1.791, "step": 281250 }, { "epoch": 10.0, "learning_rate": 6.030878095850756e-05, "loss": 1.1067, "step": 312500 }, { "epoch": 10.0, "eval_bleu": 29.4797, "eval_loss": 1.8971490859985352, "eval_runtime": 35.2599, "eval_samples_per_second": 56.722, "eval_steps_per_second": 1.787, "step": 312500 }, { "epoch": 11.0, "learning_rate": 5.6288195561273725e-05, "loss": 1.0555, "step": 343750 }, { "epoch": 11.0, "eval_bleu": 29.3416, "eval_loss": 1.940462589263916, "eval_runtime": 37.5609, "eval_samples_per_second": 53.247, "eval_steps_per_second": 1.677, "step": 343750 }, { "epoch": 12.0, "learning_rate": 5.2267610164039885e-05, "loss": 1.0052, "step": 375000 }, { "epoch": 12.0, "eval_bleu": 29.0168, "eval_loss": 1.9554133415222168, "eval_runtime": 34.6681, "eval_samples_per_second": 57.69, "eval_steps_per_second": 1.817, "step": 375000 }, { "epoch": 13.0, "learning_rate": 4.8247024766806045e-05, "loss": 0.956, "step": 406250 }, { "epoch": 13.0, "eval_bleu": 28.2454, "eval_loss": 2.0001118183135986, "eval_runtime": 35.9349, "eval_samples_per_second": 55.656, "eval_steps_per_second": 1.753, "step": 406250 }, { "epoch": 14.0, "learning_rate": 4.422643936957221e-05, "loss": 0.9069, "step": 437500 }, { "epoch": 14.0, "eval_bleu": 28.6705, "eval_loss": 2.028186082839966, "eval_runtime": 36.16, "eval_samples_per_second": 55.31, "eval_steps_per_second": 1.742, "step": 437500 }, { "epoch": 15.0, "learning_rate": 4.020585397233837e-05, "loss": 0.8589, "step": 468750 }, { "epoch": 15.0, "eval_bleu": 28.1988, "eval_loss": 2.059141159057617, "eval_runtime": 36.5906, "eval_samples_per_second": 54.659, "eval_steps_per_second": 1.722, "step": 468750 } ], "max_steps": 781250, "num_train_epochs": 25, "total_flos": 1.2468304214595994e+17, "trial_name": null, "trial_params": null }