{ "best_metric": 0.6654040404040403, "best_model_checkpoint": "twitter-roberta-base-WNUT/checkpoint-500", "epoch": 10.0, "global_step": 540, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.46, "eval_accuracy": 0.9205491641772071, "eval_f1": 0.0, "eval_loss": 0.39121243357658386, "eval_precision": 0.0, "eval_recall": 0.0, "eval_runtime": 1.5425, "eval_samples_per_second": 654.138, "eval_steps_per_second": 0.648, "step": 25 }, { "epoch": 0.93, "eval_accuracy": 0.9209305281891565, "eval_f1": 0.004739336492890995, "eval_loss": 0.2846619784832001, "eval_precision": 0.25, "eval_recall": 0.0023923444976076554, "eval_runtime": 1.5304, "eval_samples_per_second": 659.288, "eval_steps_per_second": 0.653, "step": 50 }, { "epoch": 1.39, "eval_accuracy": 0.9426047162016145, "eval_f1": 0.4239766081871345, "eval_loss": 0.2449360191822052, "eval_precision": 0.5451127819548872, "eval_recall": 0.34688995215311, "eval_runtime": 1.487, "eval_samples_per_second": 678.556, "eval_steps_per_second": 0.673, "step": 75 }, { "epoch": 1.85, "eval_accuracy": 0.9491514650734125, "eval_f1": 0.5565455791638108, "eval_loss": 0.19464540481567383, "eval_precision": 0.651685393258427, "eval_recall": 0.48564593301435405, "eval_runtime": 1.5409, "eval_samples_per_second": 654.812, "eval_steps_per_second": 0.649, "step": 100 }, { "epoch": 2.31, "eval_accuracy": 0.9581135193542236, "eval_f1": 0.621870882740448, "eval_loss": 0.1851097047328949, "eval_precision": 0.6920821114369502, "eval_recall": 0.5645933014354066, "eval_runtime": 1.5283, "eval_samples_per_second": 660.202, "eval_steps_per_second": 0.654, "step": 125 }, { "epoch": 2.78, "eval_accuracy": 0.9594482933960465, "eval_f1": 0.6331399097356544, "eval_loss": 0.1671772003173828, "eval_precision": 0.6867132867132867, "eval_recall": 0.5873205741626795, "eval_runtime": 1.7364, "eval_samples_per_second": 581.088, "eval_steps_per_second": 0.576, "step": 150 }, { "epoch": 3.24, "eval_accuracy": 0.9615457954617682, "eval_f1": 0.6276527331189711, "eval_loss": 0.16754180192947388, "eval_precision": 0.6787204450625869, "eval_recall": 0.583732057416268, "eval_runtime": 1.522, "eval_samples_per_second": 662.938, "eval_steps_per_second": 0.657, "step": 175 }, { "epoch": 3.7, "eval_accuracy": 0.9637704188648064, "eval_f1": 0.65389369592089, "eval_loss": 0.16441918909549713, "eval_precision": 0.6764705882352942, "eval_recall": 0.6327751196172249, "eval_runtime": 1.5477, "eval_samples_per_second": 651.939, "eval_steps_per_second": 0.646, "step": 200 }, { "epoch": 4.17, "eval_accuracy": 0.9640246615394394, "eval_f1": 0.673697270471464, "eval_loss": 0.1672356277704239, "eval_precision": 0.6997422680412371, "eval_recall": 0.6495215311004785, "eval_runtime": 1.5668, "eval_samples_per_second": 643.973, "eval_steps_per_second": 0.638, "step": 225 }, { "epoch": 4.63, "eval_accuracy": 0.9648509502319964, "eval_f1": 0.6666666666666666, "eval_loss": 0.16518081724643707, "eval_precision": 0.6915167095115681, "eval_recall": 0.6435406698564593, "eval_runtime": 1.544, "eval_samples_per_second": 653.501, "eval_steps_per_second": 0.648, "step": 250 }, { "epoch": 5.09, "eval_accuracy": 0.9629441301722494, "eval_f1": 0.6520618556701031, "eval_loss": 0.18820269405841827, "eval_precision": 0.7067039106145251, "eval_recall": 0.6052631578947368, "eval_runtime": 1.5459, "eval_samples_per_second": 652.688, "eval_steps_per_second": 0.647, "step": 275 }, { "epoch": 5.56, "eval_accuracy": 0.9644695862200471, "eval_f1": 0.6717267552182163, "eval_loss": 0.17831429839134216, "eval_precision": 0.7127516778523489, "eval_recall": 0.6351674641148325, "eval_runtime": 1.5976, "eval_samples_per_second": 631.564, "eval_steps_per_second": 0.626, "step": 300 }, { "epoch": 6.02, "eval_accuracy": 0.9638975402021229, "eval_f1": 0.6564885496183207, "eval_loss": 0.18128034472465515, "eval_precision": 0.7010869565217391, "eval_recall": 0.6172248803827751, "eval_runtime": 1.5524, "eval_samples_per_second": 649.966, "eval_steps_per_second": 0.644, "step": 325 }, { "epoch": 6.48, "eval_accuracy": 0.96472382889468, "eval_f1": 0.677561282212445, "eval_loss": 0.18036700785160065, "eval_precision": 0.713907284768212, "eval_recall": 0.6447368421052632, "eval_runtime": 1.6249, "eval_samples_per_second": 620.943, "eval_steps_per_second": 0.615, "step": 350 }, { "epoch": 6.94, "eval_accuracy": 0.9640882222080976, "eval_f1": 0.6709346991037132, "eval_loss": 0.19022008776664734, "eval_precision": 0.721763085399449, "eval_recall": 0.6267942583732058, "eval_runtime": 1.8093, "eval_samples_per_second": 557.663, "eval_steps_per_second": 0.553, "step": 375 }, { "epoch": 7.41, "eval_accuracy": 0.9640882222080976, "eval_f1": 0.668777707409753, "eval_loss": 0.1882619857788086, "eval_precision": 0.7106325706594886, "eval_recall": 0.631578947368421, "eval_runtime": 1.62, "eval_samples_per_second": 622.858, "eval_steps_per_second": 0.617, "step": 400 }, { "epoch": 7.87, "eval_accuracy": 0.9642789042140724, "eval_f1": 0.6683480453972257, "eval_loss": 0.18618735671043396, "eval_precision": 0.7066666666666667, "eval_recall": 0.6339712918660287, "eval_runtime": 1.5944, "eval_samples_per_second": 632.853, "eval_steps_per_second": 0.627, "step": 425 }, { "epoch": 8.33, "eval_accuracy": 0.9638975402021229, "eval_f1": 0.6670870113493064, "eval_loss": 0.1881590634584427, "eval_precision": 0.7053333333333334, "eval_recall": 0.6327751196172249, "eval_runtime": 1.7003, "eval_samples_per_second": 593.415, "eval_steps_per_second": 0.588, "step": 450 }, { "epoch": 8.8, "eval_accuracy": 0.9638339795334647, "eval_f1": 0.6658243840808591, "eval_loss": 0.19190868735313416, "eval_precision": 0.7054886211512718, "eval_recall": 0.6303827751196173, "eval_runtime": 1.543, "eval_samples_per_second": 653.928, "eval_steps_per_second": 0.648, "step": 475 }, { "epoch": 9.26, "learning_rate": 1.4814814814814815e-06, "loss": 0.1175, "step": 500 }, { "epoch": 9.26, "eval_accuracy": 0.9639611008707811, "eval_f1": 0.6654040404040403, "eval_loss": 0.19381117820739746, "eval_precision": 0.7045454545454546, "eval_recall": 0.6303827751196173, "eval_runtime": 1.541, "eval_samples_per_second": 654.789, "eval_steps_per_second": 0.649, "step": 500 }, { "epoch": 9.72, "eval_accuracy": 0.9645967075573635, "eval_f1": 0.6704190118824266, "eval_loss": 0.18799594044685364, "eval_precision": 0.7024901703800787, "eval_recall": 0.6411483253588517, "eval_runtime": 1.6071, "eval_samples_per_second": 627.849, "eval_steps_per_second": 0.622, "step": 525 }, { "epoch": 10.0, "step": 540, "total_flos": 1009327449452316.0, "train_loss": 0.11085769158822519, "train_runtime": 157.5154, "train_samples_per_second": 215.471, "train_steps_per_second": 3.428 } ], "max_steps": 540, "num_train_epochs": 10, "total_flos": 1009327449452316.0, "trial_name": null, "trial_params": null }