{ "best_metric": 73.29457345565194, "best_model_checkpoint": "/data/jcanete/all_results/sqac/beto_uncased/epochs_3_bs_16_lr_5e-5/checkpoint-3000", "epoch": 3.0, "global_step": 3117, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.19, "eval_exact_match": 34.44206008583691, "eval_f1": 52.267743165936324, "step": 200 }, { "epoch": 0.38, "eval_exact_match": 44.0450643776824, "eval_f1": 64.115641012021, "step": 400 }, { "epoch": 0.48, "learning_rate": 4.202759063201797e-05, "loss": 2.3707, "step": 500 }, { "epoch": 0.58, "eval_exact_match": 45.65450643776824, "eval_f1": 65.58217781199122, "step": 600 }, { "epoch": 0.77, "eval_exact_match": 47.6931330472103, "eval_f1": 67.5072070043358, "step": 800 }, { "epoch": 0.96, "learning_rate": 3.400705806865576e-05, "loss": 1.5329, "step": 1000 }, { "epoch": 0.96, "eval_exact_match": 50.21459227467811, "eval_f1": 69.674278273471, "step": 1000 }, { "epoch": 1.15, "eval_exact_match": 52.95064377682404, "eval_f1": 70.8690079988791, "step": 1200 }, { "epoch": 1.35, "eval_exact_match": 52.57510729613734, "eval_f1": 70.63857527605586, "step": 1400 }, { "epoch": 1.44, "learning_rate": 2.5986525505293552e-05, "loss": 0.84, "step": 1500 }, { "epoch": 1.54, "eval_exact_match": 52.52145922746781, "eval_f1": 71.19360550371005, "step": 1600 }, { "epoch": 1.73, "eval_exact_match": 53.91630901287554, "eval_f1": 71.97381382088393, "step": 1800 }, { "epoch": 1.92, "learning_rate": 1.7965992941931346e-05, "loss": 0.7768, "step": 2000 }, { "epoch": 1.92, "eval_exact_match": 54.238197424892704, "eval_f1": 72.70653141591409, "step": 2000 }, { "epoch": 2.12, "eval_exact_match": 55.042918454935624, "eval_f1": 72.49398474649861, "step": 2200 }, { "epoch": 2.31, "eval_exact_match": 54.6137339055794, "eval_f1": 72.34612760031646, "step": 2400 }, { "epoch": 2.41, "learning_rate": 9.945460378569138e-06, "loss": 0.4207, "step": 2500 }, { "epoch": 2.5, "eval_exact_match": 55.09656652360515, "eval_f1": 72.93749771717988, "step": 2600 }, { "epoch": 2.69, "eval_exact_match": 55.15021459227468, "eval_f1": 72.52429747494757, "step": 2800 }, { "epoch": 2.89, "learning_rate": 1.92492781520693e-06, "loss": 0.3301, "step": 3000 }, { "epoch": 2.89, "eval_exact_match": 55.90128755364807, "eval_f1": 73.29457345565194, "step": 3000 }, { "epoch": 3.0, "step": 3117, "total_flos": 1.2746774359663104e+16, "train_loss": 1.0182803597326342, "train_runtime": 2823.9441, "train_samples_per_second": 17.66, "train_steps_per_second": 1.104 } ], "max_steps": 3117, "num_train_epochs": 3, "total_flos": 1.2746774359663104e+16, "trial_name": null, "trial_params": null }