{ "best_metric": 36.8601893452485, "best_model_checkpoint": "./hebert_parashoot/checkpoint-1407", "epoch": 5.0, "global_step": 2345, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_exact_match": 12.217194570135746, "eval_f1": 30.9937324652663, "eval_runtime": 6.4609, "eval_samples_per_second": 38.539, "eval_steps_per_second": 4.953, "step": 469 }, { "epoch": 1.07, "learning_rate": 2.3603411513859275e-05, "loss": 4.3712, "step": 500 }, { "epoch": 2.0, "eval_exact_match": 17.647058823529413, "eval_f1": 35.4171725736381, "eval_runtime": 6.8735, "eval_samples_per_second": 36.226, "eval_steps_per_second": 4.656, "step": 938 }, { "epoch": 2.13, "learning_rate": 1.7206823027718552e-05, "loss": 2.926, "step": 1000 }, { "epoch": 3.0, "eval_exact_match": 18.099547511312217, "eval_f1": 36.8601893452485, "eval_runtime": 6.9389, "eval_samples_per_second": 35.884, "eval_steps_per_second": 4.612, "step": 1407 }, { "epoch": 3.2, "learning_rate": 1.0810234541577825e-05, "loss": 1.9172, "step": 1500 }, { "epoch": 4.0, "eval_exact_match": 18.552036199095024, "eval_f1": 35.27425497728763, "eval_runtime": 6.9353, "eval_samples_per_second": 35.903, "eval_steps_per_second": 4.614, "step": 1876 }, { "epoch": 4.26, "learning_rate": 4.4136460554371e-06, "loss": 1.1751, "step": 2000 }, { "epoch": 5.0, "eval_exact_match": 17.194570135746606, "eval_f1": 35.41593343704486, "eval_runtime": 6.9293, "eval_samples_per_second": 35.934, "eval_steps_per_second": 4.618, "step": 2345 }, { "epoch": 5.0, "step": 2345, "total_flos": 1836262957962240.0, "train_loss": 2.3373700692963753, "train_runtime": 923.5379, "train_samples_per_second": 10.146, "train_steps_per_second": 2.539 } ], "max_steps": 2345, "num_train_epochs": 5, "total_flos": 1836262957962240.0, "trial_name": null, "trial_params": null }