twitter-roberta-base-WNUT / trainer_state.json
emilys's picture
End of training
c528230
{
"best_metric": 0.6654040404040403,
"best_model_checkpoint": "twitter-roberta-base-WNUT/checkpoint-500",
"epoch": 10.0,
"global_step": 540,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.46,
"eval_accuracy": 0.9205491641772071,
"eval_f1": 0.0,
"eval_loss": 0.39121243357658386,
"eval_precision": 0.0,
"eval_recall": 0.0,
"eval_runtime": 1.5425,
"eval_samples_per_second": 654.138,
"eval_steps_per_second": 0.648,
"step": 25
},
{
"epoch": 0.93,
"eval_accuracy": 0.9209305281891565,
"eval_f1": 0.004739336492890995,
"eval_loss": 0.2846619784832001,
"eval_precision": 0.25,
"eval_recall": 0.0023923444976076554,
"eval_runtime": 1.5304,
"eval_samples_per_second": 659.288,
"eval_steps_per_second": 0.653,
"step": 50
},
{
"epoch": 1.39,
"eval_accuracy": 0.9426047162016145,
"eval_f1": 0.4239766081871345,
"eval_loss": 0.2449360191822052,
"eval_precision": 0.5451127819548872,
"eval_recall": 0.34688995215311,
"eval_runtime": 1.487,
"eval_samples_per_second": 678.556,
"eval_steps_per_second": 0.673,
"step": 75
},
{
"epoch": 1.85,
"eval_accuracy": 0.9491514650734125,
"eval_f1": 0.5565455791638108,
"eval_loss": 0.19464540481567383,
"eval_precision": 0.651685393258427,
"eval_recall": 0.48564593301435405,
"eval_runtime": 1.5409,
"eval_samples_per_second": 654.812,
"eval_steps_per_second": 0.649,
"step": 100
},
{
"epoch": 2.31,
"eval_accuracy": 0.9581135193542236,
"eval_f1": 0.621870882740448,
"eval_loss": 0.1851097047328949,
"eval_precision": 0.6920821114369502,
"eval_recall": 0.5645933014354066,
"eval_runtime": 1.5283,
"eval_samples_per_second": 660.202,
"eval_steps_per_second": 0.654,
"step": 125
},
{
"epoch": 2.78,
"eval_accuracy": 0.9594482933960465,
"eval_f1": 0.6331399097356544,
"eval_loss": 0.1671772003173828,
"eval_precision": 0.6867132867132867,
"eval_recall": 0.5873205741626795,
"eval_runtime": 1.7364,
"eval_samples_per_second": 581.088,
"eval_steps_per_second": 0.576,
"step": 150
},
{
"epoch": 3.24,
"eval_accuracy": 0.9615457954617682,
"eval_f1": 0.6276527331189711,
"eval_loss": 0.16754180192947388,
"eval_precision": 0.6787204450625869,
"eval_recall": 0.583732057416268,
"eval_runtime": 1.522,
"eval_samples_per_second": 662.938,
"eval_steps_per_second": 0.657,
"step": 175
},
{
"epoch": 3.7,
"eval_accuracy": 0.9637704188648064,
"eval_f1": 0.65389369592089,
"eval_loss": 0.16441918909549713,
"eval_precision": 0.6764705882352942,
"eval_recall": 0.6327751196172249,
"eval_runtime": 1.5477,
"eval_samples_per_second": 651.939,
"eval_steps_per_second": 0.646,
"step": 200
},
{
"epoch": 4.17,
"eval_accuracy": 0.9640246615394394,
"eval_f1": 0.673697270471464,
"eval_loss": 0.1672356277704239,
"eval_precision": 0.6997422680412371,
"eval_recall": 0.6495215311004785,
"eval_runtime": 1.5668,
"eval_samples_per_second": 643.973,
"eval_steps_per_second": 0.638,
"step": 225
},
{
"epoch": 4.63,
"eval_accuracy": 0.9648509502319964,
"eval_f1": 0.6666666666666666,
"eval_loss": 0.16518081724643707,
"eval_precision": 0.6915167095115681,
"eval_recall": 0.6435406698564593,
"eval_runtime": 1.544,
"eval_samples_per_second": 653.501,
"eval_steps_per_second": 0.648,
"step": 250
},
{
"epoch": 5.09,
"eval_accuracy": 0.9629441301722494,
"eval_f1": 0.6520618556701031,
"eval_loss": 0.18820269405841827,
"eval_precision": 0.7067039106145251,
"eval_recall": 0.6052631578947368,
"eval_runtime": 1.5459,
"eval_samples_per_second": 652.688,
"eval_steps_per_second": 0.647,
"step": 275
},
{
"epoch": 5.56,
"eval_accuracy": 0.9644695862200471,
"eval_f1": 0.6717267552182163,
"eval_loss": 0.17831429839134216,
"eval_precision": 0.7127516778523489,
"eval_recall": 0.6351674641148325,
"eval_runtime": 1.5976,
"eval_samples_per_second": 631.564,
"eval_steps_per_second": 0.626,
"step": 300
},
{
"epoch": 6.02,
"eval_accuracy": 0.9638975402021229,
"eval_f1": 0.6564885496183207,
"eval_loss": 0.18128034472465515,
"eval_precision": 0.7010869565217391,
"eval_recall": 0.6172248803827751,
"eval_runtime": 1.5524,
"eval_samples_per_second": 649.966,
"eval_steps_per_second": 0.644,
"step": 325
},
{
"epoch": 6.48,
"eval_accuracy": 0.96472382889468,
"eval_f1": 0.677561282212445,
"eval_loss": 0.18036700785160065,
"eval_precision": 0.713907284768212,
"eval_recall": 0.6447368421052632,
"eval_runtime": 1.6249,
"eval_samples_per_second": 620.943,
"eval_steps_per_second": 0.615,
"step": 350
},
{
"epoch": 6.94,
"eval_accuracy": 0.9640882222080976,
"eval_f1": 0.6709346991037132,
"eval_loss": 0.19022008776664734,
"eval_precision": 0.721763085399449,
"eval_recall": 0.6267942583732058,
"eval_runtime": 1.8093,
"eval_samples_per_second": 557.663,
"eval_steps_per_second": 0.553,
"step": 375
},
{
"epoch": 7.41,
"eval_accuracy": 0.9640882222080976,
"eval_f1": 0.668777707409753,
"eval_loss": 0.1882619857788086,
"eval_precision": 0.7106325706594886,
"eval_recall": 0.631578947368421,
"eval_runtime": 1.62,
"eval_samples_per_second": 622.858,
"eval_steps_per_second": 0.617,
"step": 400
},
{
"epoch": 7.87,
"eval_accuracy": 0.9642789042140724,
"eval_f1": 0.6683480453972257,
"eval_loss": 0.18618735671043396,
"eval_precision": 0.7066666666666667,
"eval_recall": 0.6339712918660287,
"eval_runtime": 1.5944,
"eval_samples_per_second": 632.853,
"eval_steps_per_second": 0.627,
"step": 425
},
{
"epoch": 8.33,
"eval_accuracy": 0.9638975402021229,
"eval_f1": 0.6670870113493064,
"eval_loss": 0.1881590634584427,
"eval_precision": 0.7053333333333334,
"eval_recall": 0.6327751196172249,
"eval_runtime": 1.7003,
"eval_samples_per_second": 593.415,
"eval_steps_per_second": 0.588,
"step": 450
},
{
"epoch": 8.8,
"eval_accuracy": 0.9638339795334647,
"eval_f1": 0.6658243840808591,
"eval_loss": 0.19190868735313416,
"eval_precision": 0.7054886211512718,
"eval_recall": 0.6303827751196173,
"eval_runtime": 1.543,
"eval_samples_per_second": 653.928,
"eval_steps_per_second": 0.648,
"step": 475
},
{
"epoch": 9.26,
"learning_rate": 1.4814814814814815e-06,
"loss": 0.1175,
"step": 500
},
{
"epoch": 9.26,
"eval_accuracy": 0.9639611008707811,
"eval_f1": 0.6654040404040403,
"eval_loss": 0.19381117820739746,
"eval_precision": 0.7045454545454546,
"eval_recall": 0.6303827751196173,
"eval_runtime": 1.541,
"eval_samples_per_second": 654.789,
"eval_steps_per_second": 0.649,
"step": 500
},
{
"epoch": 9.72,
"eval_accuracy": 0.9645967075573635,
"eval_f1": 0.6704190118824266,
"eval_loss": 0.18799594044685364,
"eval_precision": 0.7024901703800787,
"eval_recall": 0.6411483253588517,
"eval_runtime": 1.6071,
"eval_samples_per_second": 627.849,
"eval_steps_per_second": 0.622,
"step": 525
},
{
"epoch": 10.0,
"step": 540,
"total_flos": 1009327449452316.0,
"train_loss": 0.11085769158822519,
"train_runtime": 157.5154,
"train_samples_per_second": 215.471,
"train_steps_per_second": 3.428
}
],
"max_steps": 540,
"num_train_epochs": 10,
"total_flos": 1009327449452316.0,
"trial_name": null,
"trial_params": null
}