{ "best_metric": 0.8578431372549019, "best_model_checkpoint": "./bert-base-uncased/fine_tuned_models/checkpoint-460", "epoch": 10.0, "global_step": 1150, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "learning_rate": 1e-05, "loss": 0.6308, "step": 115 }, { "epoch": 1.0, "eval_accuracy": 0.7058823529411765, "eval_combined_score": 0.7639204049572351, "eval_f1": 0.8219584569732937, "eval_loss": 0.5484543442726135, "eval_runtime": 1.1176, "eval_samples_per_second": 365.063, "eval_steps_per_second": 45.633, "step": 115 }, { "epoch": 2.0, "learning_rate": 2e-05, "loss": 0.488, "step": 230 }, { "epoch": 2.0, "eval_accuracy": 0.7990196078431373, "eval_combined_score": 0.8344304388422037, "eval_f1": 0.86984126984127, "eval_loss": 0.44723159074783325, "eval_runtime": 1.121, "eval_samples_per_second": 363.966, "eval_steps_per_second": 45.496, "step": 230 }, { "epoch": 3.0, "learning_rate": 1.7500000000000002e-05, "loss": 0.3019, "step": 345 }, { "epoch": 3.0, "eval_accuracy": 0.8406862745098039, "eval_combined_score": 0.8653515974917887, "eval_f1": 0.8900169204737733, "eval_loss": 0.3739049434661865, "eval_runtime": 1.1236, "eval_samples_per_second": 363.103, "eval_steps_per_second": 45.388, "step": 345 }, { "epoch": 4.0, "learning_rate": 1.5000000000000002e-05, "loss": 0.1395, "step": 460 }, { "epoch": 4.0, "eval_accuracy": 0.8578431372549019, "eval_combined_score": 0.8790933899332929, "eval_f1": 0.9003436426116839, "eval_loss": 0.48073676228523254, "eval_runtime": 1.1302, "eval_samples_per_second": 360.994, "eval_steps_per_second": 45.124, "step": 460 }, { "epoch": 5.0, "learning_rate": 1.25e-05, "loss": 0.0603, "step": 575 }, { "epoch": 5.0, "eval_accuracy": 0.8357843137254902, "eval_combined_score": 0.8594279334770557, "eval_f1": 0.8830715532286212, "eval_loss": 0.6254621148109436, "eval_runtime": 1.1347, "eval_samples_per_second": 359.579, "eval_steps_per_second": 44.947, "step": 575 }, { "epoch": 6.0, "learning_rate": 1e-05, "loss": 0.0356, "step": 690 }, { "epoch": 6.0, "eval_accuracy": 0.8431372549019608, "eval_combined_score": 0.8676965735789266, "eval_f1": 0.8922558922558923, "eval_loss": 0.8049449324607849, "eval_runtime": 1.1199, "eval_samples_per_second": 364.325, "eval_steps_per_second": 45.541, "step": 690 }, { "epoch": 7.0, "learning_rate": 7.500000000000001e-06, "loss": 0.0267, "step": 805 }, { "epoch": 7.0, "eval_accuracy": 0.8455882352941176, "eval_combined_score": 0.8668438512172187, "eval_f1": 0.8880994671403197, "eval_loss": 0.7565263509750366, "eval_runtime": 1.1371, "eval_samples_per_second": 358.818, "eval_steps_per_second": 44.852, "step": 805 }, { "epoch": 8.0, "learning_rate": 5e-06, "loss": 0.0117, "step": 920 }, { "epoch": 8.0, "eval_accuracy": 0.8382352941176471, "eval_combined_score": 0.8622210953346856, "eval_f1": 0.8862068965517241, "eval_loss": 0.8377837538719177, "eval_runtime": 1.1383, "eval_samples_per_second": 358.436, "eval_steps_per_second": 44.805, "step": 920 }, { "epoch": 9.0, "learning_rate": 2.5e-06, "loss": 0.0086, "step": 1035 }, { "epoch": 9.0, "eval_accuracy": 0.8382352941176471, "eval_combined_score": 0.8614253393665159, "eval_f1": 0.8846153846153846, "eval_loss": 0.870381772518158, "eval_runtime": 1.1281, "eval_samples_per_second": 361.659, "eval_steps_per_second": 45.207, "step": 1035 }, { "epoch": 10.0, "learning_rate": 0.0, "loss": 0.0075, "step": 1150 }, { "epoch": 10.0, "eval_accuracy": 0.8406862745098039, "eval_combined_score": 0.8640173140313319, "eval_f1": 0.8873483535528597, "eval_loss": 0.8665909171104431, "eval_runtime": 1.1293, "eval_samples_per_second": 361.28, "eval_steps_per_second": 45.16, "step": 1150 }, { "epoch": 10.0, "step": 1150, "total_flos": 2412728377651200.0, "train_loss": 0.17106628703034443, "train_runtime": 327.4394, "train_samples_per_second": 112.021, "train_steps_per_second": 3.512 } ], "max_steps": 1150, "num_train_epochs": 10, "total_flos": 2412728377651200.0, "trial_name": null, "trial_params": null }