{ "best_metric": 0.5955409356725146, "best_model_checkpoint": "bert-finetuned-sem_eval-english/checkpoint-36819", "epoch": 3.0, "global_step": 36819, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.04, "learning_rate": 1.9796300822944678e-05, "loss": 0.5178, "step": 500 }, { "epoch": 0.08, "learning_rate": 1.9592601645889353e-05, "loss": 0.4894, "step": 1000 }, { "epoch": 0.12, "learning_rate": 1.938890246883403e-05, "loss": 0.4786, "step": 1500 }, { "epoch": 0.16, "learning_rate": 1.9185203291778702e-05, "loss": 0.4728, "step": 2000 }, { "epoch": 0.2, "learning_rate": 1.8981504114723378e-05, "loss": 0.4741, "step": 2500 }, { "epoch": 0.24, "learning_rate": 1.8777804937668054e-05, "loss": 0.4631, "step": 3000 }, { "epoch": 0.29, "learning_rate": 1.857410576061273e-05, "loss": 0.4518, "step": 3500 }, { "epoch": 0.33, "learning_rate": 1.8370406583557402e-05, "loss": 0.4509, "step": 4000 }, { "epoch": 0.37, "learning_rate": 1.816670740650208e-05, "loss": 0.4528, "step": 4500 }, { "epoch": 0.41, "learning_rate": 1.7963008229446754e-05, "loss": 0.4601, "step": 5000 }, { "epoch": 0.45, "learning_rate": 1.775930905239143e-05, "loss": 0.4445, "step": 5500 }, { "epoch": 0.49, "learning_rate": 1.7555609875336106e-05, "loss": 0.4527, "step": 6000 }, { "epoch": 0.53, "learning_rate": 1.735191069828078e-05, "loss": 0.4526, "step": 6500 }, { "epoch": 0.57, "learning_rate": 1.7148211521225454e-05, "loss": 0.4555, "step": 7000 }, { "epoch": 0.61, "learning_rate": 1.6944512344170133e-05, "loss": 0.4448, "step": 7500 }, { "epoch": 0.65, "learning_rate": 1.6740813167114806e-05, "loss": 0.4414, "step": 8000 }, { "epoch": 0.69, "learning_rate": 1.6537113990059482e-05, "loss": 0.4502, "step": 8500 }, { "epoch": 0.73, "learning_rate": 1.6333414813004154e-05, "loss": 0.4391, "step": 9000 }, { "epoch": 0.77, "learning_rate": 1.6129715635948834e-05, "loss": 0.4313, "step": 9500 }, { "epoch": 0.81, "learning_rate": 1.5926016458893506e-05, "loss": 0.4419, "step": 10000 }, { "epoch": 0.86, "learning_rate": 1.5722317281838182e-05, "loss": 0.4361, "step": 10500 }, { "epoch": 0.9, "learning_rate": 1.5518618104782858e-05, "loss": 0.4366, "step": 11000 }, { "epoch": 0.94, "learning_rate": 1.5314918927727534e-05, "loss": 0.4411, "step": 11500 }, { "epoch": 0.98, "learning_rate": 1.5111219750672208e-05, "loss": 0.4366, "step": 12000 }, { "epoch": 1.0, "eval_accuracy": 0.35986638422682093, "eval_f1": 0.5769146847043422, "eval_loss": 0.416496217250824, "eval_roc_auc": 0.7106236321499733, "eval_runtime": 1041.9101, "eval_samples_per_second": 11.78, "eval_steps_per_second": 1.473, "step": 12273 }, { "epoch": 1.02, "learning_rate": 1.4907520573616886e-05, "loss": 0.4239, "step": 12500 }, { "epoch": 1.06, "learning_rate": 1.470382139656156e-05, "loss": 0.4166, "step": 13000 }, { "epoch": 1.1, "learning_rate": 1.4500122219506234e-05, "loss": 0.4077, "step": 13500 }, { "epoch": 1.14, "learning_rate": 1.4296423042450908e-05, "loss": 0.403, "step": 14000 }, { "epoch": 1.18, "learning_rate": 1.4092723865395586e-05, "loss": 0.4102, "step": 14500 }, { "epoch": 1.22, "learning_rate": 1.388902468834026e-05, "loss": 0.4055, "step": 15000 }, { "epoch": 1.26, "learning_rate": 1.3685325511284934e-05, "loss": 0.4017, "step": 15500 }, { "epoch": 1.3, "learning_rate": 1.3481626334229612e-05, "loss": 0.4089, "step": 16000 }, { "epoch": 1.34, "learning_rate": 1.3277927157174286e-05, "loss": 0.4021, "step": 16500 }, { "epoch": 1.39, "learning_rate": 1.307422798011896e-05, "loss": 0.4153, "step": 17000 }, { "epoch": 1.43, "learning_rate": 1.2870528803063638e-05, "loss": 0.4086, "step": 17500 }, { "epoch": 1.47, "learning_rate": 1.2666829626008312e-05, "loss": 0.4132, "step": 18000 }, { "epoch": 1.51, "learning_rate": 1.2463130448952986e-05, "loss": 0.4136, "step": 18500 }, { "epoch": 1.55, "learning_rate": 1.2259431271897662e-05, "loss": 0.4045, "step": 19000 }, { "epoch": 1.59, "learning_rate": 1.2055732094842338e-05, "loss": 0.408, "step": 19500 }, { "epoch": 1.63, "learning_rate": 1.1852032917787012e-05, "loss": 0.3941, "step": 20000 }, { "epoch": 1.67, "learning_rate": 1.1648333740731688e-05, "loss": 0.4135, "step": 20500 }, { "epoch": 1.71, "learning_rate": 1.1444634563676364e-05, "loss": 0.4086, "step": 21000 }, { "epoch": 1.75, "learning_rate": 1.124093538662104e-05, "loss": 0.4166, "step": 21500 }, { "epoch": 1.79, "learning_rate": 1.1037236209565714e-05, "loss": 0.4077, "step": 22000 }, { "epoch": 1.83, "learning_rate": 1.083353703251039e-05, "loss": 0.4092, "step": 22500 }, { "epoch": 1.87, "learning_rate": 1.0629837855455066e-05, "loss": 0.4048, "step": 23000 }, { "epoch": 1.91, "learning_rate": 1.042613867839974e-05, "loss": 0.4089, "step": 23500 }, { "epoch": 1.96, "learning_rate": 1.0222439501344414e-05, "loss": 0.4052, "step": 24000 }, { "epoch": 2.0, "learning_rate": 1.0018740324289092e-05, "loss": 0.4008, "step": 24500 }, { "epoch": 2.0, "eval_accuracy": 0.37974580413883, "eval_f1": 0.5928196793972076, "eval_loss": 0.4055616855621338, "eval_roc_auc": 0.7192491902327842, "eval_runtime": 1043.4921, "eval_samples_per_second": 11.762, "eval_steps_per_second": 1.471, "step": 24546 }, { "epoch": 2.04, "learning_rate": 9.815041147233766e-06, "loss": 0.3812, "step": 25000 }, { "epoch": 2.08, "learning_rate": 9.611341970178442e-06, "loss": 0.3776, "step": 25500 }, { "epoch": 2.12, "learning_rate": 9.407642793123116e-06, "loss": 0.3678, "step": 26000 }, { "epoch": 2.16, "learning_rate": 9.203943616067792e-06, "loss": 0.3664, "step": 26500 }, { "epoch": 2.2, "learning_rate": 9.000244439012466e-06, "loss": 0.3768, "step": 27000 }, { "epoch": 2.24, "learning_rate": 8.796545261957142e-06, "loss": 0.3774, "step": 27500 }, { "epoch": 2.28, "learning_rate": 8.592846084901818e-06, "loss": 0.3668, "step": 28000 }, { "epoch": 2.32, "learning_rate": 8.389146907846492e-06, "loss": 0.3699, "step": 28500 }, { "epoch": 2.36, "learning_rate": 8.185447730791168e-06, "loss": 0.3731, "step": 29000 }, { "epoch": 2.4, "learning_rate": 7.981748553735843e-06, "loss": 0.3692, "step": 29500 }, { "epoch": 2.44, "learning_rate": 7.778049376680518e-06, "loss": 0.3686, "step": 30000 }, { "epoch": 2.49, "learning_rate": 7.574350199625194e-06, "loss": 0.3664, "step": 30500 }, { "epoch": 2.53, "learning_rate": 7.370651022569869e-06, "loss": 0.3748, "step": 31000 }, { "epoch": 2.57, "learning_rate": 7.1669518455145444e-06, "loss": 0.3623, "step": 31500 }, { "epoch": 2.61, "learning_rate": 6.96325266845922e-06, "loss": 0.3778, "step": 32000 }, { "epoch": 2.65, "learning_rate": 6.759553491403895e-06, "loss": 0.3707, "step": 32500 }, { "epoch": 2.69, "learning_rate": 6.555854314348571e-06, "loss": 0.3703, "step": 33000 }, { "epoch": 2.73, "learning_rate": 6.3521551372932455e-06, "loss": 0.3651, "step": 33500 }, { "epoch": 2.77, "learning_rate": 6.148455960237921e-06, "loss": 0.3682, "step": 34000 }, { "epoch": 2.81, "learning_rate": 5.944756783182597e-06, "loss": 0.3767, "step": 34500 }, { "epoch": 2.85, "learning_rate": 5.7410576061272715e-06, "loss": 0.3717, "step": 35000 }, { "epoch": 2.89, "learning_rate": 5.537358429071947e-06, "loss": 0.371, "step": 35500 }, { "epoch": 2.93, "learning_rate": 5.333659252016622e-06, "loss": 0.3684, "step": 36000 }, { "epoch": 2.97, "learning_rate": 5.1299600749612975e-06, "loss": 0.3707, "step": 36500 }, { "epoch": 3.0, "eval_accuracy": 0.3732279615447287, "eval_f1": 0.5955409356725146, "eval_loss": 0.41057834029197693, "eval_roc_auc": 0.7213548698125667, "eval_runtime": 1042.5077, "eval_samples_per_second": 11.774, "eval_steps_per_second": 1.472, "step": 36819 } ], "max_steps": 49092, "num_train_epochs": 4, "total_flos": 1.951031236478976e+16, "trial_name": null, "trial_params": null }