nerugm-lora-r16-4 / trainer_state.json
apwic's picture
End of training
50138ee verified
raw
history blame
145 kB
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 100.0,
"eval_steps": 500,
"global_step": 10600,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"grad_norm": 1.391684889793396,
"learning_rate": 4.9500000000000004e-05,
"loss": 1.1481,
"step": 106
},
{
"epoch": 1.0,
"eval_LOCATION_f1": 0.0,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.0,
"eval_LOCATION_recall": 0.0,
"eval_ORGANIZATION_f1": 0.0,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.0,
"eval_ORGANIZATION_recall": 0.0,
"eval_PERSON_f1": 0.0,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.0,
"eval_PERSON_recall": 0.0,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.0,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.0,
"eval_TIME_recall": 0.0,
"eval_loss": 0.7146090865135193,
"eval_overall_accuracy": 0.8365739601279842,
"eval_overall_f1": 0.0,
"eval_overall_precision": 0.0,
"eval_overall_recall": 0.0,
"eval_runtime": 0.9362,
"eval_samples_per_second": 199.746,
"eval_steps_per_second": 3.204,
"step": 106
},
{
"epoch": 2.0,
"grad_norm": 1.086163878440857,
"learning_rate": 4.9e-05,
"loss": 0.6809,
"step": 212
},
{
"epoch": 2.0,
"eval_LOCATION_f1": 0.0,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.0,
"eval_LOCATION_recall": 0.0,
"eval_ORGANIZATION_f1": 0.0,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.0,
"eval_ORGANIZATION_recall": 0.0,
"eval_PERSON_f1": 0.012820512820512822,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.16666666666666666,
"eval_PERSON_recall": 0.006666666666666667,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.0,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.0,
"eval_TIME_recall": 0.0,
"eval_loss": 0.5919493436813354,
"eval_overall_accuracy": 0.8385429485601772,
"eval_overall_f1": 0.005509641873278238,
"eval_overall_precision": 0.08333333333333333,
"eval_overall_recall": 0.002849002849002849,
"eval_runtime": 0.974,
"eval_samples_per_second": 191.988,
"eval_steps_per_second": 3.08,
"step": 212
},
{
"epoch": 3.0,
"grad_norm": 1.1405037641525269,
"learning_rate": 4.85e-05,
"loss": 0.5553,
"step": 318
},
{
"epoch": 3.0,
"eval_LOCATION_f1": 0.09302325581395347,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.3076923076923077,
"eval_LOCATION_recall": 0.0547945205479452,
"eval_ORGANIZATION_f1": 0.0,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.0,
"eval_ORGANIZATION_recall": 0.0,
"eval_PERSON_f1": 0.18834080717488788,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.2876712328767123,
"eval_PERSON_recall": 0.14,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.11538461538461539,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.16666666666666666,
"eval_TIME_recall": 0.08823529411764706,
"eval_loss": 0.45798516273498535,
"eval_overall_accuracy": 0.8599556977602757,
"eval_overall_f1": 0.12043010752688173,
"eval_overall_precision": 0.24561403508771928,
"eval_overall_recall": 0.07977207977207977,
"eval_runtime": 1.0183,
"eval_samples_per_second": 183.643,
"eval_steps_per_second": 2.946,
"step": 318
},
{
"epoch": 4.0,
"grad_norm": 1.2108490467071533,
"learning_rate": 4.8e-05,
"loss": 0.4289,
"step": 424
},
{
"epoch": 4.0,
"eval_LOCATION_f1": 0.40601503759398494,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.45,
"eval_LOCATION_recall": 0.3698630136986301,
"eval_ORGANIZATION_f1": 0.14,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.2,
"eval_ORGANIZATION_recall": 0.1076923076923077,
"eval_PERSON_f1": 0.6265060240963856,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.5714285714285714,
"eval_PERSON_recall": 0.6933333333333334,
"eval_QUANTITY_f1": 0.2173913043478261,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.29411764705882354,
"eval_QUANTITY_recall": 0.1724137931034483,
"eval_TIME_f1": 0.5074626865671642,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.5151515151515151,
"eval_TIME_recall": 0.5,
"eval_loss": 0.3399774134159088,
"eval_overall_accuracy": 0.9059808023627861,
"eval_overall_f1": 0.471976401179941,
"eval_overall_precision": 0.4892966360856269,
"eval_overall_recall": 0.45584045584045585,
"eval_runtime": 0.9802,
"eval_samples_per_second": 190.773,
"eval_steps_per_second": 3.061,
"step": 424
},
{
"epoch": 5.0,
"grad_norm": 1.8846955299377441,
"learning_rate": 4.75e-05,
"loss": 0.3345,
"step": 530
},
{
"epoch": 5.0,
"eval_LOCATION_f1": 0.576923076923077,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.5421686746987951,
"eval_LOCATION_recall": 0.6164383561643836,
"eval_ORGANIZATION_f1": 0.4477611940298507,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.43478260869565216,
"eval_ORGANIZATION_recall": 0.46153846153846156,
"eval_PERSON_f1": 0.7641791044776118,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.6918918918918919,
"eval_PERSON_recall": 0.8533333333333334,
"eval_QUANTITY_f1": 0.4482758620689655,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.4482758620689655,
"eval_QUANTITY_recall": 0.4482758620689655,
"eval_TIME_f1": 0.5945945945945946,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.55,
"eval_TIME_recall": 0.6470588235294118,
"eval_loss": 0.2660435438156128,
"eval_overall_accuracy": 0.9276396751169087,
"eval_overall_f1": 0.6287978863936591,
"eval_overall_precision": 0.5862068965517241,
"eval_overall_recall": 0.6780626780626781,
"eval_runtime": 0.9444,
"eval_samples_per_second": 198.0,
"eval_steps_per_second": 3.176,
"step": 530
},
{
"epoch": 6.0,
"grad_norm": 2.0284557342529297,
"learning_rate": 4.7e-05,
"loss": 0.2736,
"step": 636
},
{
"epoch": 6.0,
"eval_LOCATION_f1": 0.6473988439306358,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.56,
"eval_LOCATION_recall": 0.7671232876712328,
"eval_ORGANIZATION_f1": 0.5694444444444443,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5189873417721519,
"eval_ORGANIZATION_recall": 0.6307692307692307,
"eval_PERSON_f1": 0.8263473053892216,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.75,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.43750000000000006,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.4,
"eval_QUANTITY_recall": 0.4827586206896552,
"eval_TIME_f1": 0.6578947368421053,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.5952380952380952,
"eval_TIME_recall": 0.7352941176470589,
"eval_loss": 0.23392952978610992,
"eval_overall_accuracy": 0.9355156288456805,
"eval_overall_f1": 0.6927939317319847,
"eval_overall_precision": 0.6227272727272727,
"eval_overall_recall": 0.7806267806267806,
"eval_runtime": 1.0811,
"eval_samples_per_second": 172.97,
"eval_steps_per_second": 2.775,
"step": 636
},
{
"epoch": 7.0,
"grad_norm": 1.2625077962875366,
"learning_rate": 4.6500000000000005e-05,
"loss": 0.2339,
"step": 742
},
{
"epoch": 7.0,
"eval_LOCATION_f1": 0.6896551724137931,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.594059405940594,
"eval_LOCATION_recall": 0.821917808219178,
"eval_ORGANIZATION_f1": 0.5874125874125874,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5384615384615384,
"eval_ORGANIZATION_recall": 0.6461538461538462,
"eval_PERSON_f1": 0.871165644171779,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8068181818181818,
"eval_PERSON_recall": 0.9466666666666667,
"eval_QUANTITY_f1": 0.4666666666666667,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.45161290322580644,
"eval_QUANTITY_recall": 0.4827586206896552,
"eval_TIME_f1": 0.6666666666666667,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.5909090909090909,
"eval_TIME_recall": 0.7647058823529411,
"eval_loss": 0.19882944226264954,
"eval_overall_accuracy": 0.9414225941422594,
"eval_overall_f1": 0.7272727272727274,
"eval_overall_precision": 0.6604651162790698,
"eval_overall_recall": 0.8091168091168092,
"eval_runtime": 0.9366,
"eval_samples_per_second": 199.653,
"eval_steps_per_second": 3.203,
"step": 742
},
{
"epoch": 8.0,
"grad_norm": 1.0806405544281006,
"learning_rate": 4.600000000000001e-05,
"loss": 0.213,
"step": 848
},
{
"epoch": 8.0,
"eval_LOCATION_f1": 0.696629213483146,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.5904761904761905,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6133333333333333,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5411764705882353,
"eval_ORGANIZATION_recall": 0.7076923076923077,
"eval_PERSON_f1": 0.8695652173913044,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.813953488372093,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.4918032786885246,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.46875,
"eval_QUANTITY_recall": 0.5172413793103449,
"eval_TIME_f1": 0.7088607594936709,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.6222222222222222,
"eval_TIME_recall": 0.8235294117647058,
"eval_loss": 0.1896568089723587,
"eval_overall_accuracy": 0.9406842234801871,
"eval_overall_f1": 0.7367088607594937,
"eval_overall_precision": 0.662870159453303,
"eval_overall_recall": 0.8290598290598291,
"eval_runtime": 0.9615,
"eval_samples_per_second": 194.494,
"eval_steps_per_second": 3.12,
"step": 848
},
{
"epoch": 9.0,
"grad_norm": 2.574251651763916,
"learning_rate": 4.55e-05,
"loss": 0.1927,
"step": 954
},
{
"epoch": 9.0,
"eval_LOCATION_f1": 0.7052023121387282,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.61,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.5960264900662252,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5232558139534884,
"eval_ORGANIZATION_recall": 0.6923076923076923,
"eval_PERSON_f1": 0.8607594936708859,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8192771084337349,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.5333333333333333,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5161290322580645,
"eval_QUANTITY_recall": 0.5517241379310345,
"eval_TIME_f1": 0.7272727272727273,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.6511627906976745,
"eval_TIME_recall": 0.8235294117647058,
"eval_loss": 0.17324766516685486,
"eval_overall_accuracy": 0.9419148412503077,
"eval_overall_f1": 0.7361647361647361,
"eval_overall_precision": 0.6713615023474179,
"eval_overall_recall": 0.8148148148148148,
"eval_runtime": 0.9772,
"eval_samples_per_second": 191.367,
"eval_steps_per_second": 3.07,
"step": 954
},
{
"epoch": 10.0,
"grad_norm": 1.0041288137435913,
"learning_rate": 4.5e-05,
"loss": 0.1794,
"step": 1060
},
{
"epoch": 10.0,
"eval_LOCATION_f1": 0.7710843373493976,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.6881720430107527,
"eval_LOCATION_recall": 0.8767123287671232,
"eval_ORGANIZATION_f1": 0.6206896551724138,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5625,
"eval_ORGANIZATION_recall": 0.6923076923076923,
"eval_PERSON_f1": 0.8517350157728706,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8083832335329342,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.523076923076923,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.4722222222222222,
"eval_QUANTITY_recall": 0.5862068965517241,
"eval_TIME_f1": 0.8493150684931507,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7948717948717948,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.16186459362506866,
"eval_overall_accuracy": 0.9470834358848141,
"eval_overall_f1": 0.7624020887728459,
"eval_overall_precision": 0.7036144578313253,
"eval_overall_recall": 0.8319088319088319,
"eval_runtime": 0.9594,
"eval_samples_per_second": 194.91,
"eval_steps_per_second": 3.127,
"step": 1060
},
{
"epoch": 11.0,
"grad_norm": 1.2041752338409424,
"learning_rate": 4.4500000000000004e-05,
"loss": 0.1696,
"step": 1166
},
{
"epoch": 11.0,
"eval_LOCATION_f1": 0.7619047619047619,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.6736842105263158,
"eval_LOCATION_recall": 0.8767123287671232,
"eval_ORGANIZATION_f1": 0.6357615894039734,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5581395348837209,
"eval_ORGANIZATION_recall": 0.7384615384615385,
"eval_PERSON_f1": 0.8598726114649682,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.823170731707317,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.6461538461538462,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5833333333333334,
"eval_QUANTITY_recall": 0.7241379310344828,
"eval_TIME_f1": 0.8108108108108107,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.15661031007766724,
"eval_overall_accuracy": 0.948806300762983,
"eval_overall_f1": 0.7720207253886011,
"eval_overall_precision": 0.7078384798099763,
"eval_overall_recall": 0.8490028490028491,
"eval_runtime": 0.9517,
"eval_samples_per_second": 196.498,
"eval_steps_per_second": 3.152,
"step": 1166
},
{
"epoch": 12.0,
"grad_norm": 1.5384461879730225,
"learning_rate": 4.4000000000000006e-05,
"loss": 0.1593,
"step": 1272
},
{
"epoch": 12.0,
"eval_LOCATION_f1": 0.7804878048780488,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7032967032967034,
"eval_LOCATION_recall": 0.8767123287671232,
"eval_ORGANIZATION_f1": 0.6282051282051283,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5384615384615384,
"eval_ORGANIZATION_recall": 0.7538461538461538,
"eval_PERSON_f1": 0.8706624605678233,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8263473053892215,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7692307692307692,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6944444444444444,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.7894736842105262,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.15920695662498474,
"eval_overall_accuracy": 0.950775289195176,
"eval_overall_f1": 0.7866323907455014,
"eval_overall_precision": 0.7166276346604216,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.9534,
"eval_samples_per_second": 196.149,
"eval_steps_per_second": 3.147,
"step": 1272
},
{
"epoch": 13.0,
"grad_norm": 1.1916617155075073,
"learning_rate": 4.35e-05,
"loss": 0.1517,
"step": 1378
},
{
"epoch": 13.0,
"eval_LOCATION_f1": 0.7924528301886793,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7325581395348837,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6538461538461537,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5604395604395604,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8589341692789968,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8106508875739645,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.6666666666666666,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.575,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8378378378378379,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.775,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.15383993089199066,
"eval_overall_accuracy": 0.9510214127492,
"eval_overall_f1": 0.785070785070785,
"eval_overall_precision": 0.715962441314554,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.957,
"eval_samples_per_second": 195.394,
"eval_steps_per_second": 3.135,
"step": 1378
},
{
"epoch": 14.0,
"grad_norm": 1.1742634773254395,
"learning_rate": 4.3e-05,
"loss": 0.1512,
"step": 1484
},
{
"epoch": 14.0,
"eval_LOCATION_f1": 0.7804878048780488,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7032967032967034,
"eval_LOCATION_recall": 0.8767123287671232,
"eval_ORGANIZATION_f1": 0.6219512195121952,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5151515151515151,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8535825545171339,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8011695906432749,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7142857142857144,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6097560975609756,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8051948051948051,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7209302325581395,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.15704582631587982,
"eval_overall_accuracy": 0.9500369185331036,
"eval_overall_f1": 0.7738693467336684,
"eval_overall_precision": 0.6921348314606741,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.9592,
"eval_samples_per_second": 194.955,
"eval_steps_per_second": 3.128,
"step": 1484
},
{
"epoch": 15.0,
"grad_norm": 1.3693042993545532,
"learning_rate": 4.25e-05,
"loss": 0.1456,
"step": 1590
},
{
"epoch": 15.0,
"eval_LOCATION_f1": 0.7636363636363637,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.6847826086956522,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6329113924050633,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5376344086021505,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8706624605678233,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8263473053892215,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6857142857142856,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5853658536585366,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.794871794871795,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7045454545454546,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.15755978226661682,
"eval_overall_accuracy": 0.9502830420871278,
"eval_overall_f1": 0.7766497461928934,
"eval_overall_precision": 0.700228832951945,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.9594,
"eval_samples_per_second": 194.913,
"eval_steps_per_second": 3.127,
"step": 1590
},
{
"epoch": 16.0,
"grad_norm": 1.6605894565582275,
"learning_rate": 4.2e-05,
"loss": 0.1386,
"step": 1696
},
{
"epoch": 16.0,
"eval_LOCATION_f1": 0.7590361445783131,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.6774193548387096,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6451612903225806,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5555555555555556,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8616352201257862,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8154761904761905,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.676056338028169,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5714285714285714,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.794871794871795,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7045454545454546,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1546044647693634,
"eval_overall_accuracy": 0.9510214127492,
"eval_overall_f1": 0.7741116751269036,
"eval_overall_precision": 0.6979405034324943,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.9626,
"eval_samples_per_second": 194.274,
"eval_steps_per_second": 3.117,
"step": 1696
},
{
"epoch": 17.0,
"grad_norm": 0.814884603023529,
"learning_rate": 4.15e-05,
"loss": 0.1366,
"step": 1802
},
{
"epoch": 17.0,
"eval_LOCATION_f1": 0.7974683544303799,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7411764705882353,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6496815286624205,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5543478260869565,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8753993610223643,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8404907975460123,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.6666666666666666,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.575,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8051948051948051,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7209302325581395,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.14499862492084503,
"eval_overall_accuracy": 0.9539748953974896,
"eval_overall_f1": 0.7881136950904393,
"eval_overall_precision": 0.7210401891252955,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.9628,
"eval_samples_per_second": 194.217,
"eval_steps_per_second": 3.116,
"step": 1802
},
{
"epoch": 18.0,
"grad_norm": 1.8611637353897095,
"learning_rate": 4.1e-05,
"loss": 0.1338,
"step": 1908
},
{
"epoch": 18.0,
"eval_LOCATION_f1": 0.7924528301886793,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7325581395348837,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6578947368421053,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5747126436781609,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8698412698412699,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8303030303030303,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.6567164179104478,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5789473684210527,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7619047619047619,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.14045144617557526,
"eval_overall_accuracy": 0.9552055131676102,
"eval_overall_f1": 0.7906371911573472,
"eval_overall_precision": 0.7272727272727273,
"eval_overall_recall": 0.8660968660968661,
"eval_runtime": 1.0246,
"eval_samples_per_second": 182.513,
"eval_steps_per_second": 2.928,
"step": 1908
},
{
"epoch": 19.0,
"grad_norm": 1.1466857194900513,
"learning_rate": 4.05e-05,
"loss": 0.1282,
"step": 2014
},
{
"epoch": 19.0,
"eval_LOCATION_f1": 0.7974683544303799,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7411764705882353,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6463414634146342,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5353535353535354,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8553459119496856,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8095238095238095,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6153846153846154,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8051948051948051,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7209302325581395,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1484779715538025,
"eval_overall_accuracy": 0.9524981540733448,
"eval_overall_f1": 0.7821656050955413,
"eval_overall_precision": 0.7073732718894009,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.9587,
"eval_samples_per_second": 195.054,
"eval_steps_per_second": 3.129,
"step": 2014
},
{
"epoch": 20.0,
"grad_norm": 1.398795247077942,
"learning_rate": 4e-05,
"loss": 0.1253,
"step": 2120
},
{
"epoch": 20.0,
"eval_LOCATION_f1": 0.802547770700637,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6622516556291391,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5813953488372093,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8726114649681529,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8353658536585366,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7246376811594203,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.625,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8157894736842106,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7380952380952381,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13943925499916077,
"eval_overall_accuracy": 0.9556977602756583,
"eval_overall_f1": 0.7979139504563233,
"eval_overall_precision": 0.7355769230769231,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.9521,
"eval_samples_per_second": 196.41,
"eval_steps_per_second": 3.151,
"step": 2120
},
{
"epoch": 21.0,
"grad_norm": 1.8820486068725586,
"learning_rate": 3.9500000000000005e-05,
"loss": 0.1245,
"step": 2226
},
{
"epoch": 21.0,
"eval_LOCATION_f1": 0.8129032258064516,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7682926829268293,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6578947368421053,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5747126436781609,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8726114649681529,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8353658536585366,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7384615384615385,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8533333333333334,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7804878048780488,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.13452573120594025,
"eval_overall_accuracy": 0.9586512429239479,
"eval_overall_f1": 0.8042049934296978,
"eval_overall_precision": 0.7463414634146341,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.9556,
"eval_samples_per_second": 195.683,
"eval_steps_per_second": 3.139,
"step": 2226
},
{
"epoch": 22.0,
"grad_norm": 1.1895145177841187,
"learning_rate": 3.9000000000000006e-05,
"loss": 0.12,
"step": 2332
},
{
"epoch": 22.0,
"eval_LOCATION_f1": 0.779874213836478,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7209302325581395,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6583850931677019,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5520833333333334,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8714733542319748,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8224852071005917,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7246376811594203,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.625,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.7894736842105262,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.150462806224823,
"eval_overall_accuracy": 0.9522520305193207,
"eval_overall_f1": 0.788265306122449,
"eval_overall_precision": 0.7136258660508084,
"eval_overall_recall": 0.8803418803418803,
"eval_runtime": 0.9605,
"eval_samples_per_second": 194.682,
"eval_steps_per_second": 3.123,
"step": 2332
},
{
"epoch": 23.0,
"grad_norm": 2.248535633087158,
"learning_rate": 3.85e-05,
"loss": 0.1191,
"step": 2438
},
{
"epoch": 23.0,
"eval_LOCATION_f1": 0.8076923076923077,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7590361445783133,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6538461538461537,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5604395604395604,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8753993610223643,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8404907975460123,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7246376811594203,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.625,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8533333333333334,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7804878048780488,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.13763977587223053,
"eval_overall_accuracy": 0.9561900073837066,
"eval_overall_f1": 0.8010403120936281,
"eval_overall_precision": 0.7368421052631579,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.9781,
"eval_samples_per_second": 191.185,
"eval_steps_per_second": 3.067,
"step": 2438
},
{
"epoch": 24.0,
"grad_norm": 1.4806087017059326,
"learning_rate": 3.8e-05,
"loss": 0.1188,
"step": 2544
},
{
"epoch": 24.0,
"eval_LOCATION_f1": 0.7924528301886793,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7325581395348837,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6753246753246754,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5842696629213483,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8698412698412699,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8303030303030303,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.6376811594202898,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.55,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8533333333333334,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7804878048780488,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.14500263333320618,
"eval_overall_accuracy": 0.9559438838296825,
"eval_overall_f1": 0.7927461139896372,
"eval_overall_precision": 0.7268408551068883,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.9648,
"eval_samples_per_second": 193.813,
"eval_steps_per_second": 3.109,
"step": 2544
},
{
"epoch": 25.0,
"grad_norm": 1.1676396131515503,
"learning_rate": 3.7500000000000003e-05,
"loss": 0.1158,
"step": 2650
},
{
"epoch": 25.0,
"eval_LOCATION_f1": 0.7848101265822783,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7294117647058823,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6666666666666666,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5714285714285714,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8734177215189873,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8313253012048193,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6857142857142856,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5853658536585366,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.7894736842105262,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.14524681866168976,
"eval_overall_accuracy": 0.9544671425055378,
"eval_overall_f1": 0.788659793814433,
"eval_overall_precision": 0.72,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.9488,
"eval_samples_per_second": 197.084,
"eval_steps_per_second": 3.162,
"step": 2650
},
{
"epoch": 26.0,
"grad_norm": 2.0401439666748047,
"learning_rate": 3.7e-05,
"loss": 0.1162,
"step": 2756
},
{
"epoch": 26.0,
"eval_LOCATION_f1": 0.7848101265822783,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7294117647058823,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.675496688741722,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5930232558139535,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8810289389067525,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6153846153846154,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8108108108108107,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.13445432484149933,
"eval_overall_accuracy": 0.9581589958158996,
"eval_overall_f1": 0.7979002624671917,
"eval_overall_precision": 0.7396593673965937,
"eval_overall_recall": 0.8660968660968661,
"eval_runtime": 0.9577,
"eval_samples_per_second": 195.269,
"eval_steps_per_second": 3.133,
"step": 2756
},
{
"epoch": 27.0,
"grad_norm": 0.6006813645362854,
"learning_rate": 3.65e-05,
"loss": 0.1118,
"step": 2862
},
{
"epoch": 27.0,
"eval_LOCATION_f1": 0.8181818181818182,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7777777777777778,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6666666666666667,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5795454545454546,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8846153846153846,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.746268656716418,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6578947368421053,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8157894736842106,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7380952380952381,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.131368950009346,
"eval_overall_accuracy": 0.9591434900319961,
"eval_overall_f1": 0.8083989501312336,
"eval_overall_precision": 0.7493917274939172,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.9543,
"eval_samples_per_second": 195.947,
"eval_steps_per_second": 3.144,
"step": 2862
},
{
"epoch": 28.0,
"grad_norm": 1.7794803380966187,
"learning_rate": 3.6e-05,
"loss": 0.1128,
"step": 2968
},
{
"epoch": 28.0,
"eval_LOCATION_f1": 0.7770700636942677,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.6666666666666667,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5882352941176471,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8753993610223643,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8404907975460123,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.716417910447761,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.631578947368421,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8493150684931507,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7948717948717948,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13416561484336853,
"eval_overall_accuracy": 0.9576667487078513,
"eval_overall_f1": 0.7973684210526317,
"eval_overall_precision": 0.7408312958435208,
"eval_overall_recall": 0.8632478632478633,
"eval_runtime": 0.953,
"eval_samples_per_second": 196.219,
"eval_steps_per_second": 3.148,
"step": 2968
},
{
"epoch": 29.0,
"grad_norm": 1.108047366142273,
"learning_rate": 3.55e-05,
"loss": 0.1089,
"step": 3074
},
{
"epoch": 29.0,
"eval_LOCATION_f1": 0.7848101265822783,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7294117647058823,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6538461538461537,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5604395604395604,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8761904761904761,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8363636363636363,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7384615384615385,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8533333333333334,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7804878048780488,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.13507266342639923,
"eval_overall_accuracy": 0.9584051193699237,
"eval_overall_f1": 0.7984395318595578,
"eval_overall_precision": 0.7344497607655502,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.9682,
"eval_samples_per_second": 193.134,
"eval_steps_per_second": 3.098,
"step": 3074
},
{
"epoch": 30.0,
"grad_norm": 1.1064585447311401,
"learning_rate": 3.5e-05,
"loss": 0.1054,
"step": 3180
},
{
"epoch": 30.0,
"eval_LOCATION_f1": 0.8076923076923077,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7590361445783133,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6756756756756758,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6024096385542169,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8726114649681529,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8353658536585366,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7272727272727273,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6486486486486487,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.861111111111111,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8157894736842105,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.12900210916996002,
"eval_overall_accuracy": 0.9598818606940684,
"eval_overall_f1": 0.8068783068783069,
"eval_overall_precision": 0.7530864197530864,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.9665,
"eval_samples_per_second": 193.482,
"eval_steps_per_second": 3.104,
"step": 3180
},
{
"epoch": 31.0,
"grad_norm": 0.547255277633667,
"learning_rate": 3.45e-05,
"loss": 0.1029,
"step": 3286
},
{
"epoch": 31.0,
"eval_LOCATION_f1": 0.8129032258064516,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7682926829268293,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6878980891719746,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5869565217391305,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8670886075949367,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8253012048192772,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7352941176470588,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6410256410256411,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.7837837837837837,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.725,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.13610094785690308,
"eval_overall_accuracy": 0.9571745015998031,
"eval_overall_f1": 0.8,
"eval_overall_precision": 0.7350835322195705,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.9586,
"eval_samples_per_second": 195.083,
"eval_steps_per_second": 3.13,
"step": 3286
},
{
"epoch": 32.0,
"grad_norm": 0.32147249579429626,
"learning_rate": 3.4000000000000007e-05,
"loss": 0.1023,
"step": 3392
},
{
"epoch": 32.0,
"eval_LOCATION_f1": 0.7848101265822783,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7294117647058823,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6794871794871795,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5824175824175825,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8734177215189873,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8313253012048193,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7352941176470588,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6410256410256411,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8493150684931507,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7948717948717948,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13857892155647278,
"eval_overall_accuracy": 0.9581589958158996,
"eval_overall_f1": 0.8015564202334631,
"eval_overall_precision": 0.7357142857142858,
"eval_overall_recall": 0.8803418803418803,
"eval_runtime": 0.963,
"eval_samples_per_second": 194.191,
"eval_steps_per_second": 3.115,
"step": 3392
},
{
"epoch": 33.0,
"grad_norm": 1.505850911140442,
"learning_rate": 3.35e-05,
"loss": 0.1028,
"step": 3498
},
{
"epoch": 33.0,
"eval_LOCATION_f1": 0.7820512820512822,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7006369426751592,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5978260869565217,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8734177215189873,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8313253012048193,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.716417910447761,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.631578947368421,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8333333333333333,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7894736842105263,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.1360621303319931,
"eval_overall_accuracy": 0.9576667487078513,
"eval_overall_f1": 0.8020833333333333,
"eval_overall_precision": 0.7386091127098321,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.9705,
"eval_samples_per_second": 192.685,
"eval_steps_per_second": 3.091,
"step": 3498
},
{
"epoch": 34.0,
"grad_norm": 1.6967480182647705,
"learning_rate": 3.3e-05,
"loss": 0.0991,
"step": 3604
},
{
"epoch": 34.0,
"eval_LOCATION_f1": 0.7770700636942677,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.6710526315789473,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5862068965517241,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8761904761904761,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8363636363636363,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.716417910447761,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.631578947368421,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8648648648648648,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.13175979256629944,
"eval_overall_accuracy": 0.9581589958158996,
"eval_overall_f1": 0.7999999999999999,
"eval_overall_precision": 0.7391304347826086,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.967,
"eval_samples_per_second": 193.389,
"eval_steps_per_second": 3.103,
"step": 3604
},
{
"epoch": 35.0,
"grad_norm": 1.3785823583602905,
"learning_rate": 3.2500000000000004e-05,
"loss": 0.0983,
"step": 3710
},
{
"epoch": 35.0,
"eval_LOCATION_f1": 0.7530864197530865,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.6853932584269663,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.6838709677419356,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5888888888888889,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8761904761904761,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8363636363636363,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6956521739130435,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8108108108108107,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.14071786403656006,
"eval_overall_accuracy": 0.9556977602756583,
"eval_overall_f1": 0.7896774193548387,
"eval_overall_precision": 0.7216981132075472,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.9573,
"eval_samples_per_second": 195.336,
"eval_steps_per_second": 3.134,
"step": 3710
},
{
"epoch": 36.0,
"grad_norm": 1.251754879951477,
"learning_rate": 3.2000000000000005e-05,
"loss": 0.0962,
"step": 3816
},
{
"epoch": 36.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7169811320754718,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6063829787234043,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8789808917197452,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8414634146341463,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6153846153846154,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8108108108108107,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.14177566766738892,
"eval_overall_accuracy": 0.956928378045779,
"eval_overall_f1": 0.8067444876783397,
"eval_overall_precision": 0.7404761904761905,
"eval_overall_recall": 0.886039886039886,
"eval_runtime": 0.962,
"eval_samples_per_second": 194.386,
"eval_steps_per_second": 3.118,
"step": 3816
},
{
"epoch": 37.0,
"grad_norm": 1.2584689855575562,
"learning_rate": 3.15e-05,
"loss": 0.0986,
"step": 3922
},
{
"epoch": 37.0,
"eval_LOCATION_f1": 0.7848101265822783,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7294117647058823,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.708860759493671,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6021505376344086,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8734177215189873,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8313253012048193,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6956521739130435,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.7837837837837837,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.725,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.1421373039484024,
"eval_overall_accuracy": 0.9556977602756583,
"eval_overall_f1": 0.7974193548387097,
"eval_overall_precision": 0.7287735849056604,
"eval_overall_recall": 0.8803418803418803,
"eval_runtime": 0.9499,
"eval_samples_per_second": 196.858,
"eval_steps_per_second": 3.158,
"step": 3922
},
{
"epoch": 38.0,
"grad_norm": 0.9512435793876648,
"learning_rate": 3.1e-05,
"loss": 0.0971,
"step": 4028
},
{
"epoch": 38.0,
"eval_LOCATION_f1": 0.7770700636942677,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.684931506849315,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6172839506172839,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8734177215189873,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8313253012048193,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6666666666666666,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.575,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8493150684931507,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7948717948717948,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13257591426372528,
"eval_overall_accuracy": 0.9576667487078513,
"eval_overall_f1": 0.7963206307490145,
"eval_overall_precision": 0.7390243902439024,
"eval_overall_recall": 0.8632478632478633,
"eval_runtime": 0.9531,
"eval_samples_per_second": 196.208,
"eval_steps_per_second": 3.148,
"step": 4028
},
{
"epoch": 39.0,
"grad_norm": 1.808843731880188,
"learning_rate": 3.05e-05,
"loss": 0.0944,
"step": 4134
},
{
"epoch": 39.0,
"eval_LOCATION_f1": 0.7749999999999999,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7126436781609196,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7012987012987013,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6067415730337079,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8832807570977917,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8383233532934131,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.676470588235294,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5897435897435898,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.7837837837837837,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.725,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.1387697011232376,
"eval_overall_accuracy": 0.9564361309377307,
"eval_overall_f1": 0.7968952134540751,
"eval_overall_precision": 0.7298578199052133,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.9514,
"eval_samples_per_second": 196.544,
"eval_steps_per_second": 3.153,
"step": 4134
},
{
"epoch": 40.0,
"grad_norm": 1.092385172843933,
"learning_rate": 3e-05,
"loss": 0.093,
"step": 4240
},
{
"epoch": 40.0,
"eval_LOCATION_f1": 0.7999999999999999,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7368421052631579,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6436781609195402,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8670886075949367,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8253012048192772,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.6567164179104478,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5789473684210527,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8333333333333333,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7894736842105263,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.1326187252998352,
"eval_overall_accuracy": 0.958897366477972,
"eval_overall_f1": 0.8057742782152231,
"eval_overall_precision": 0.7469586374695864,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.9497,
"eval_samples_per_second": 196.897,
"eval_steps_per_second": 3.159,
"step": 4240
},
{
"epoch": 41.0,
"grad_norm": 0.6803504824638367,
"learning_rate": 2.95e-05,
"loss": 0.0911,
"step": 4346
},
{
"epoch": 41.0,
"eval_LOCATION_f1": 0.8026315789473685,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7368421052631579,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6436781609195402,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8761904761904761,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8363636363636363,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5945945945945946,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.861111111111111,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8157894736842105,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.12640033662319183,
"eval_overall_accuracy": 0.9603741078021166,
"eval_overall_f1": 0.8137384412153237,
"eval_overall_precision": 0.7586206896551724,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.955,
"eval_samples_per_second": 195.805,
"eval_steps_per_second": 3.141,
"step": 4346
},
{
"epoch": 42.0,
"grad_norm": 0.7038798928260803,
"learning_rate": 2.9e-05,
"loss": 0.0915,
"step": 4452
},
{
"epoch": 42.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7225806451612903,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6222222222222222,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8761904761904761,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8363636363636363,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6956521739130435,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8333333333333333,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7894736842105263,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.13610343635082245,
"eval_overall_accuracy": 0.9593896135860202,
"eval_overall_f1": 0.8104575163398693,
"eval_overall_precision": 0.748792270531401,
"eval_overall_recall": 0.8831908831908832,
"eval_runtime": 0.9531,
"eval_samples_per_second": 196.198,
"eval_steps_per_second": 3.148,
"step": 4452
},
{
"epoch": 43.0,
"grad_norm": 0.7236311435699463,
"learning_rate": 2.8499999999999998e-05,
"loss": 0.0896,
"step": 4558
},
{
"epoch": 43.0,
"eval_LOCATION_f1": 0.7870967741935484,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.6986301369863014,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6296296296296297,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8726114649681529,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8353658536585366,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8333333333333333,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7894736842105263,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.1266656517982483,
"eval_overall_accuracy": 0.9596357371400444,
"eval_overall_f1": 0.8031914893617021,
"eval_overall_precision": 0.7531172069825436,
"eval_overall_recall": 0.8603988603988604,
"eval_runtime": 0.9502,
"eval_samples_per_second": 196.803,
"eval_steps_per_second": 3.157,
"step": 4558
},
{
"epoch": 44.0,
"grad_norm": 1.4153372049331665,
"learning_rate": 2.8000000000000003e-05,
"loss": 0.0891,
"step": 4664
},
{
"epoch": 44.0,
"eval_LOCATION_f1": 0.8157894736842105,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7210884353741497,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6463414634146342,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8761904761904761,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8363636363636363,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6865671641791046,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6052631578947368,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8219178082191781,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7692307692307693,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.12547963857650757,
"eval_overall_accuracy": 0.9596357371400444,
"eval_overall_f1": 0.8116710875331565,
"eval_overall_precision": 0.7593052109181141,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.9553,
"eval_samples_per_second": 195.759,
"eval_steps_per_second": 3.141,
"step": 4664
},
{
"epoch": 45.0,
"grad_norm": 3.5179989337921143,
"learning_rate": 2.7500000000000004e-05,
"loss": 0.0882,
"step": 4770
},
{
"epoch": 45.0,
"eval_LOCATION_f1": 0.8157894736842105,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7320261437908497,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6363636363636364,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8761904761904761,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8363636363636363,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7272727272727273,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6486486486486487,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8493150684931507,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7948717948717948,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13158655166625977,
"eval_overall_accuracy": 0.9603741078021166,
"eval_overall_f1": 0.8194993412384717,
"eval_overall_precision": 0.7622549019607843,
"eval_overall_recall": 0.886039886039886,
"eval_runtime": 0.9562,
"eval_samples_per_second": 195.568,
"eval_steps_per_second": 3.137,
"step": 4770
},
{
"epoch": 46.0,
"grad_norm": 1.2313103675842285,
"learning_rate": 2.7000000000000002e-05,
"loss": 0.0853,
"step": 4876
},
{
"epoch": 46.0,
"eval_LOCATION_f1": 0.8157894736842105,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7333333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6470588235294118,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.888888888888889,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8484848484848485,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.6984126984126984,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6470588235294118,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8888888888888888,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8421052631578947,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.12368568032979965,
"eval_overall_accuracy": 0.9625892197883338,
"eval_overall_f1": 0.827127659574468,
"eval_overall_precision": 0.7755610972568578,
"eval_overall_recall": 0.886039886039886,
"eval_runtime": 0.9617,
"eval_samples_per_second": 194.451,
"eval_steps_per_second": 3.12,
"step": 4876
},
{
"epoch": 47.0,
"grad_norm": 1.974324107170105,
"learning_rate": 2.6500000000000004e-05,
"loss": 0.0874,
"step": 4982
},
{
"epoch": 47.0,
"eval_LOCATION_f1": 0.7924528301886793,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7325581395348837,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.7297297297297298,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6506024096385542,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8769716088328076,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8323353293413174,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7384615384615385,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8493150684931507,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7948717948717948,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1277364045381546,
"eval_overall_accuracy": 0.9608663549101649,
"eval_overall_f1": 0.8162729658792651,
"eval_overall_precision": 0.7566909975669099,
"eval_overall_recall": 0.886039886039886,
"eval_runtime": 0.9678,
"eval_samples_per_second": 193.219,
"eval_steps_per_second": 3.1,
"step": 4982
},
{
"epoch": 48.0,
"grad_norm": 2.900847911834717,
"learning_rate": 2.6000000000000002e-05,
"loss": 0.0863,
"step": 5088
},
{
"epoch": 48.0,
"eval_LOCATION_f1": 0.7974683544303799,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7411764705882353,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.728476821192053,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6395348837209303,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.879746835443038,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8373493975903614,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7384615384615385,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8219178082191781,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7692307692307693,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.13069714605808258,
"eval_overall_accuracy": 0.9598818606940684,
"eval_overall_f1": 0.8152031454783748,
"eval_overall_precision": 0.7548543689320388,
"eval_overall_recall": 0.886039886039886,
"eval_runtime": 0.9521,
"eval_samples_per_second": 196.413,
"eval_steps_per_second": 3.151,
"step": 5088
},
{
"epoch": 49.0,
"grad_norm": 0.5791418552398682,
"learning_rate": 2.5500000000000003e-05,
"loss": 0.0881,
"step": 5194
},
{
"epoch": 49.0,
"eval_LOCATION_f1": 0.779874213836478,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7209302325581395,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7142857142857143,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6179775280898876,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8706624605678233,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8263473053892215,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6956521739130435,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8108108108108107,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.1359923928976059,
"eval_overall_accuracy": 0.9579128722618755,
"eval_overall_f1": 0.7994825355756792,
"eval_overall_precision": 0.7322274881516587,
"eval_overall_recall": 0.8803418803418803,
"eval_runtime": 0.9488,
"eval_samples_per_second": 197.098,
"eval_steps_per_second": 3.162,
"step": 5194
},
{
"epoch": 50.0,
"grad_norm": 1.3018290996551514,
"learning_rate": 2.5e-05,
"loss": 0.0852,
"step": 5300
},
{
"epoch": 50.0,
"eval_LOCATION_f1": 0.779874213836478,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7209302325581395,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7105263157894737,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6206896551724138,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8734177215189873,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8313253012048193,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6153846153846154,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8219178082191781,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7692307692307693,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.13739532232284546,
"eval_overall_accuracy": 0.958897366477972,
"eval_overall_f1": 0.8020833333333333,
"eval_overall_precision": 0.7386091127098321,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.9606,
"eval_samples_per_second": 194.667,
"eval_steps_per_second": 3.123,
"step": 5300
},
{
"epoch": 51.0,
"grad_norm": 1.6092292070388794,
"learning_rate": 2.45e-05,
"loss": 0.0816,
"step": 5406
},
{
"epoch": 51.0,
"eval_LOCATION_f1": 0.7848101265822783,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7294117647058823,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7189542483660131,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.625,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8761904761904761,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8363636363636363,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.716417910447761,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.631578947368421,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8219178082191781,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7692307692307693,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.1346472203731537,
"eval_overall_accuracy": 0.9591434900319961,
"eval_overall_f1": 0.8067885117493472,
"eval_overall_precision": 0.744578313253012,
"eval_overall_recall": 0.8803418803418803,
"eval_runtime": 0.9667,
"eval_samples_per_second": 193.447,
"eval_steps_per_second": 3.103,
"step": 5406
},
{
"epoch": 52.0,
"grad_norm": 1.4530425071716309,
"learning_rate": 2.4e-05,
"loss": 0.084,
"step": 5512
},
{
"epoch": 52.0,
"eval_LOCATION_f1": 0.7922077922077922,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.728476821192053,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6395348837209303,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.879746835443038,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8373493975903614,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.6956521739130435,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8333333333333333,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7894736842105263,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.13276532292366028,
"eval_overall_accuracy": 0.9598818606940684,
"eval_overall_f1": 0.811023622047244,
"eval_overall_precision": 0.7518248175182481,
"eval_overall_recall": 0.8803418803418803,
"eval_runtime": 0.9609,
"eval_samples_per_second": 194.599,
"eval_steps_per_second": 3.122,
"step": 5512
},
{
"epoch": 53.0,
"grad_norm": 2.500049352645874,
"learning_rate": 2.35e-05,
"loss": 0.0806,
"step": 5618
},
{
"epoch": 53.0,
"eval_LOCATION_f1": 0.7721518987341772,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7176470588235294,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7189542483660131,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.625,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8679245283018867,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8214285714285714,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6956521739130435,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.7945205479452054,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7435897435897436,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.13982656598091125,
"eval_overall_accuracy": 0.9576667487078513,
"eval_overall_f1": 0.7963683527885862,
"eval_overall_precision": 0.7309523809523809,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.9688,
"eval_samples_per_second": 193.02,
"eval_steps_per_second": 3.097,
"step": 5618
},
{
"epoch": 54.0,
"grad_norm": 2.2398998737335205,
"learning_rate": 2.3000000000000003e-05,
"loss": 0.0827,
"step": 5724
},
{
"epoch": 54.0,
"eval_LOCATION_f1": 0.7770700636942677,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.6962025316455697,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5913978494623656,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8917197452229298,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8536585365853658,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7272727272727273,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6486486486486487,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8219178082191781,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7692307692307693,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.1386086791753769,
"eval_overall_accuracy": 0.9586512429239479,
"eval_overall_f1": 0.8072916666666667,
"eval_overall_precision": 0.7434052757793765,
"eval_overall_recall": 0.8831908831908832,
"eval_runtime": 0.9542,
"eval_samples_per_second": 195.97,
"eval_steps_per_second": 3.144,
"step": 5724
},
{
"epoch": 55.0,
"grad_norm": 0.9107390642166138,
"learning_rate": 2.25e-05,
"loss": 0.0816,
"step": 5830
},
{
"epoch": 55.0,
"eval_LOCATION_f1": 0.7870967741935484,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7189542483660131,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.625,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8853503184713376,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8475609756097561,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.6857142857142856,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5853658536585366,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8219178082191781,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7692307692307693,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.13677756488323212,
"eval_overall_accuracy": 0.958897366477972,
"eval_overall_f1": 0.807843137254902,
"eval_overall_precision": 0.7463768115942029,
"eval_overall_recall": 0.8803418803418803,
"eval_runtime": 0.9619,
"eval_samples_per_second": 194.412,
"eval_steps_per_second": 3.119,
"step": 5830
},
{
"epoch": 56.0,
"grad_norm": 2.796041965484619,
"learning_rate": 2.2000000000000003e-05,
"loss": 0.0828,
"step": 5936
},
{
"epoch": 56.0,
"eval_LOCATION_f1": 0.7922077922077922,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7189542483660131,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.625,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8742138364779874,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8273809523809523,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7692307692307692,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6944444444444444,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.861111111111111,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8157894736842105,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13076351583003998,
"eval_overall_accuracy": 0.9613586020182131,
"eval_overall_f1": 0.8162729658792651,
"eval_overall_precision": 0.7566909975669099,
"eval_overall_recall": 0.886039886039886,
"eval_runtime": 0.9668,
"eval_samples_per_second": 193.426,
"eval_steps_per_second": 3.103,
"step": 5936
},
{
"epoch": 57.0,
"grad_norm": 1.4414466619491577,
"learning_rate": 2.15e-05,
"loss": 0.0813,
"step": 6042
},
{
"epoch": 57.0,
"eval_LOCATION_f1": 0.8104575163398693,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.775,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7114093959731543,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6309523809523809,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8860759493670886,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8433734939759037,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7384615384615385,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8378378378378379,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.775,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.12566277384757996,
"eval_overall_accuracy": 0.961112478464189,
"eval_overall_f1": 0.8190224570673711,
"eval_overall_precision": 0.7635467980295566,
"eval_overall_recall": 0.8831908831908832,
"eval_runtime": 1.0243,
"eval_samples_per_second": 182.567,
"eval_steps_per_second": 2.929,
"step": 6042
},
{
"epoch": 58.0,
"grad_norm": 0.5744277834892273,
"learning_rate": 2.1e-05,
"loss": 0.0797,
"step": 6148
},
{
"epoch": 58.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7027027027027027,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6265060240963856,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8832807570977917,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8383233532934131,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.6956521739130435,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.7837837837837837,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.725,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.12857982516288757,
"eval_overall_accuracy": 0.958897366477972,
"eval_overall_f1": 0.8057742782152231,
"eval_overall_precision": 0.7469586374695864,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.9638,
"eval_samples_per_second": 194.014,
"eval_steps_per_second": 3.113,
"step": 6148
},
{
"epoch": 59.0,
"grad_norm": 2.238668203353882,
"learning_rate": 2.05e-05,
"loss": 0.0782,
"step": 6254
},
{
"epoch": 59.0,
"eval_LOCATION_f1": 0.7870967741935484,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7333333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6470588235294118,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8832807570977917,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8383233532934131,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7272727272727273,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6486486486486487,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8219178082191781,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7692307692307693,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.13031935691833496,
"eval_overall_accuracy": 0.9608663549101649,
"eval_overall_f1": 0.8147174770039421,
"eval_overall_precision": 0.7560975609756098,
"eval_overall_recall": 0.8831908831908832,
"eval_runtime": 0.9586,
"eval_samples_per_second": 195.077,
"eval_steps_per_second": 3.13,
"step": 6254
},
{
"epoch": 60.0,
"grad_norm": 1.372519612312317,
"learning_rate": 2e-05,
"loss": 0.0804,
"step": 6360
},
{
"epoch": 60.0,
"eval_LOCATION_f1": 0.8104575163398693,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.775,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7189542483660131,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.625,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8769716088328076,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8323353293413174,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7692307692307692,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6944444444444444,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.861111111111111,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8157894736842105,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.12692256271839142,
"eval_overall_accuracy": 0.961112478464189,
"eval_overall_f1": 0.8210526315789473,
"eval_overall_precision": 0.7628361858190709,
"eval_overall_recall": 0.8888888888888888,
"eval_runtime": 0.9613,
"eval_samples_per_second": 194.533,
"eval_steps_per_second": 3.121,
"step": 6360
},
{
"epoch": 61.0,
"grad_norm": 2.849003553390503,
"learning_rate": 1.9500000000000003e-05,
"loss": 0.0777,
"step": 6466
},
{
"epoch": 61.0,
"eval_LOCATION_f1": 0.7922077922077922,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7236842105263158,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.632183908045977,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8742138364779874,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8273809523809523,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.71875,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6571428571428571,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8732394366197184,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8378378378378378,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.12815138697624207,
"eval_overall_accuracy": 0.961112478464189,
"eval_overall_f1": 0.8142292490118577,
"eval_overall_precision": 0.7573529411764706,
"eval_overall_recall": 0.8803418803418803,
"eval_runtime": 0.9568,
"eval_samples_per_second": 195.448,
"eval_steps_per_second": 3.136,
"step": 6466
},
{
"epoch": 62.0,
"grad_norm": 1.4931484460830688,
"learning_rate": 1.9e-05,
"loss": 0.0769,
"step": 6572
},
{
"epoch": 62.0,
"eval_LOCATION_f1": 0.7922077922077922,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7236842105263158,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.632183908045977,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8825396825396825,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8424242424242424,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.6956521739130435,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8333333333333333,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7894736842105263,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.13441848754882812,
"eval_overall_accuracy": 0.961112478464189,
"eval_overall_f1": 0.811023622047244,
"eval_overall_precision": 0.7518248175182481,
"eval_overall_recall": 0.8803418803418803,
"eval_runtime": 0.9895,
"eval_samples_per_second": 188.992,
"eval_steps_per_second": 3.032,
"step": 6572
},
{
"epoch": 63.0,
"grad_norm": 7.7728190422058105,
"learning_rate": 1.85e-05,
"loss": 0.0766,
"step": 6678
},
{
"epoch": 63.0,
"eval_LOCATION_f1": 0.8104575163398693,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.775,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7189542483660131,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.625,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8832807570977917,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8383233532934131,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7384615384615385,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.861111111111111,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8157894736842105,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13149088621139526,
"eval_overall_accuracy": 0.9613586020182131,
"eval_overall_f1": 0.8210526315789473,
"eval_overall_precision": 0.7628361858190709,
"eval_overall_recall": 0.8888888888888888,
"eval_runtime": 0.9572,
"eval_samples_per_second": 195.358,
"eval_steps_per_second": 3.134,
"step": 6678
},
{
"epoch": 64.0,
"grad_norm": 1.2526227235794067,
"learning_rate": 1.8e-05,
"loss": 0.0768,
"step": 6784
},
{
"epoch": 64.0,
"eval_LOCATION_f1": 0.8104575163398693,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.775,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7123287671232877,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6419753086419753,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8825396825396825,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8424242424242424,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7619047619047619,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.7058823529411765,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.861111111111111,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8157894736842105,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.12420864403247833,
"eval_overall_accuracy": 0.9618508491262614,
"eval_overall_f1": 0.822429906542056,
"eval_overall_precision": 0.7738693467336684,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.9596,
"eval_samples_per_second": 194.871,
"eval_steps_per_second": 3.126,
"step": 6784
},
{
"epoch": 65.0,
"grad_norm": 1.5504401922225952,
"learning_rate": 1.75e-05,
"loss": 0.0772,
"step": 6890
},
{
"epoch": 65.0,
"eval_LOCATION_f1": 0.7999999999999999,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.738255033557047,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6547619047619048,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8789808917197452,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8414634146341463,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.716417910447761,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.631578947368421,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.861111111111111,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8157894736842105,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.12913870811462402,
"eval_overall_accuracy": 0.9613586020182131,
"eval_overall_f1": 0.8190224570673711,
"eval_overall_precision": 0.7635467980295566,
"eval_overall_recall": 0.8831908831908832,
"eval_runtime": 0.9536,
"eval_samples_per_second": 196.097,
"eval_steps_per_second": 3.146,
"step": 6890
},
{
"epoch": 66.0,
"grad_norm": 1.0265319347381592,
"learning_rate": 1.7000000000000003e-05,
"loss": 0.0738,
"step": 6996
},
{
"epoch": 66.0,
"eval_LOCATION_f1": 0.7820512820512822,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7236842105263158,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.632183908045977,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8714733542319748,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8224852071005917,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.746268656716418,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6578947368421053,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8493150684931507,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7948717948717948,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13372032344341278,
"eval_overall_accuracy": 0.9601279842480925,
"eval_overall_f1": 0.8109517601043025,
"eval_overall_precision": 0.7475961538461539,
"eval_overall_recall": 0.886039886039886,
"eval_runtime": 0.955,
"eval_samples_per_second": 195.812,
"eval_steps_per_second": 3.141,
"step": 6996
},
{
"epoch": 67.0,
"grad_norm": 1.6299247741699219,
"learning_rate": 1.65e-05,
"loss": 0.0752,
"step": 7102
},
{
"epoch": 67.0,
"eval_LOCATION_f1": 0.7999999999999999,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7297297297297298,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6506024096385542,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8917197452229298,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8536585365853658,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7272727272727273,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6486486486486487,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8493150684931507,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7948717948717948,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.12958921492099762,
"eval_overall_accuracy": 0.9613586020182131,
"eval_overall_f1": 0.8227513227513228,
"eval_overall_precision": 0.7679012345679013,
"eval_overall_recall": 0.886039886039886,
"eval_runtime": 0.955,
"eval_samples_per_second": 195.809,
"eval_steps_per_second": 3.141,
"step": 7102
},
{
"epoch": 68.0,
"grad_norm": 1.4963232278823853,
"learning_rate": 1.6000000000000003e-05,
"loss": 0.0743,
"step": 7208
},
{
"epoch": 68.0,
"eval_LOCATION_f1": 0.7870967741935484,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7074829931972789,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6341463414634146,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8945686900958466,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.696969696969697,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6216216216216216,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8219178082191781,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7692307692307693,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.13297563791275024,
"eval_overall_accuracy": 0.9606202313561408,
"eval_overall_f1": 0.8116710875331565,
"eval_overall_precision": 0.7593052109181141,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.9533,
"eval_samples_per_second": 196.168,
"eval_steps_per_second": 3.147,
"step": 7208
},
{
"epoch": 69.0,
"grad_norm": 1.4221112728118896,
"learning_rate": 1.55e-05,
"loss": 0.0758,
"step": 7314
},
{
"epoch": 69.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.728476821192053,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6395348837209303,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8825396825396825,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8424242424242424,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.71875,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6571428571428571,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8493150684931507,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7948717948717948,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1320372223854065,
"eval_overall_accuracy": 0.9613586020182131,
"eval_overall_f1": 0.8190224570673711,
"eval_overall_precision": 0.7635467980295566,
"eval_overall_recall": 0.8831908831908832,
"eval_runtime": 0.9574,
"eval_samples_per_second": 195.314,
"eval_steps_per_second": 3.133,
"step": 7314
},
{
"epoch": 70.0,
"grad_norm": 0.8428576588630676,
"learning_rate": 1.5e-05,
"loss": 0.0729,
"step": 7420
},
{
"epoch": 70.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7210884353741497,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6463414634146342,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.879746835443038,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8373493975903614,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7272727272727273,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6486486486486487,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8493150684931507,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7948717948717948,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1279895156621933,
"eval_overall_accuracy": 0.9613586020182131,
"eval_overall_f1": 0.8174603174603174,
"eval_overall_precision": 0.762962962962963,
"eval_overall_recall": 0.8803418803418803,
"eval_runtime": 0.9596,
"eval_samples_per_second": 194.864,
"eval_steps_per_second": 3.126,
"step": 7420
},
{
"epoch": 71.0,
"grad_norm": 2.0319900512695312,
"learning_rate": 1.45e-05,
"loss": 0.0728,
"step": 7526
},
{
"epoch": 71.0,
"eval_LOCATION_f1": 0.7922077922077922,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7096774193548387,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6111111111111112,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8910256410256411,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8580246913580247,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.696969696969697,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6216216216216216,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8219178082191781,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7692307692307693,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.1363026648759842,
"eval_overall_accuracy": 0.9598818606940684,
"eval_overall_f1": 0.8105263157894738,
"eval_overall_precision": 0.7530562347188264,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.9593,
"eval_samples_per_second": 194.942,
"eval_steps_per_second": 3.127,
"step": 7526
},
{
"epoch": 72.0,
"grad_norm": 1.2698560953140259,
"learning_rate": 1.4000000000000001e-05,
"loss": 0.0725,
"step": 7632
},
{
"epoch": 72.0,
"eval_LOCATION_f1": 0.7721518987341772,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7176470588235294,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7333333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6470588235294118,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8910256410256411,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8580246913580247,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8493150684931507,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7948717948717948,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1346251517534256,
"eval_overall_accuracy": 0.9603741078021166,
"eval_overall_f1": 0.8153034300791556,
"eval_overall_precision": 0.7592137592137592,
"eval_overall_recall": 0.8803418803418803,
"eval_runtime": 0.9608,
"eval_samples_per_second": 194.624,
"eval_steps_per_second": 3.122,
"step": 7632
},
{
"epoch": 73.0,
"grad_norm": 0.6609696745872498,
"learning_rate": 1.3500000000000001e-05,
"loss": 0.0713,
"step": 7738
},
{
"epoch": 73.0,
"eval_LOCATION_f1": 0.7922077922077922,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7189542483660131,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.625,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8910256410256411,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8580246913580247,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7272727272727273,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6486486486486487,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8493150684931507,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7948717948717948,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13484306633472443,
"eval_overall_accuracy": 0.961112478464189,
"eval_overall_f1": 0.8179419525065963,
"eval_overall_precision": 0.7616707616707616,
"eval_overall_recall": 0.8831908831908832,
"eval_runtime": 0.9626,
"eval_samples_per_second": 194.273,
"eval_steps_per_second": 3.117,
"step": 7738
},
{
"epoch": 74.0,
"grad_norm": 2.321972131729126,
"learning_rate": 1.3000000000000001e-05,
"loss": 0.0717,
"step": 7844
},
{
"epoch": 74.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7074829931972789,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6341463414634146,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.888178913738019,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.852760736196319,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.75,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6857142857142857,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.861111111111111,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8157894736842105,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13028575479984283,
"eval_overall_accuracy": 0.9616047255722373,
"eval_overall_f1": 0.8213333333333335,
"eval_overall_precision": 0.7719298245614035,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.9468,
"eval_samples_per_second": 197.515,
"eval_steps_per_second": 3.169,
"step": 7844
},
{
"epoch": 75.0,
"grad_norm": 1.0534641742706299,
"learning_rate": 1.25e-05,
"loss": 0.074,
"step": 7950
},
{
"epoch": 75.0,
"eval_LOCATION_f1": 0.7870967741935484,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7333333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6470588235294118,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8938906752411575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.6666666666666666,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.575,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.861111111111111,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8157894736842105,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13667696714401245,
"eval_overall_accuracy": 0.9608663549101649,
"eval_overall_f1": 0.8163804491413474,
"eval_overall_precision": 0.7610837438423645,
"eval_overall_recall": 0.8803418803418803,
"eval_runtime": 0.9529,
"eval_samples_per_second": 196.237,
"eval_steps_per_second": 3.148,
"step": 7950
},
{
"epoch": 76.0,
"grad_norm": 2.212968111038208,
"learning_rate": 1.2e-05,
"loss": 0.073,
"step": 8056
},
{
"epoch": 76.0,
"eval_LOCATION_f1": 0.7870967741935484,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.728476821192053,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6395348837209303,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8938906752411575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.75,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6857142857142857,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.861111111111111,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8157894736842105,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1331731677055359,
"eval_overall_accuracy": 0.9623430962343096,
"eval_overall_f1": 0.8233731739707835,
"eval_overall_precision": 0.7711442786069652,
"eval_overall_recall": 0.8831908831908832,
"eval_runtime": 0.9553,
"eval_samples_per_second": 195.751,
"eval_steps_per_second": 3.14,
"step": 8056
},
{
"epoch": 77.0,
"grad_norm": 1.6397372484207153,
"learning_rate": 1.1500000000000002e-05,
"loss": 0.0714,
"step": 8162
},
{
"epoch": 77.0,
"eval_LOCATION_f1": 0.7870967741935484,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7333333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6470588235294118,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.888178913738019,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.852760736196319,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7384615384615385,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.861111111111111,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8157894736842105,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1331976056098938,
"eval_overall_accuracy": 0.9616047255722373,
"eval_overall_f1": 0.8211920529801325,
"eval_overall_precision": 0.7673267326732673,
"eval_overall_recall": 0.8831908831908832,
"eval_runtime": 0.9558,
"eval_samples_per_second": 195.645,
"eval_steps_per_second": 3.139,
"step": 8162
},
{
"epoch": 78.0,
"grad_norm": 2.294029474258423,
"learning_rate": 1.1000000000000001e-05,
"loss": 0.0705,
"step": 8268
},
{
"epoch": 78.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.728476821192053,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6395348837209303,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8945686900958466,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.746268656716418,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6578947368421053,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8493150684931507,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7948717948717948,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.135635107755661,
"eval_overall_accuracy": 0.9618508491262614,
"eval_overall_f1": 0.8258575197889182,
"eval_overall_precision": 0.769041769041769,
"eval_overall_recall": 0.8917378917378918,
"eval_runtime": 0.9599,
"eval_samples_per_second": 194.803,
"eval_steps_per_second": 3.125,
"step": 8268
},
{
"epoch": 79.0,
"grad_norm": 1.3058913946151733,
"learning_rate": 1.05e-05,
"loss": 0.072,
"step": 8374
},
{
"epoch": 79.0,
"eval_LOCATION_f1": 0.7870967741935484,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7189542483660131,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.625,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8945686900958466,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7384615384615385,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8493150684931507,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7948717948717948,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13674825429916382,
"eval_overall_accuracy": 0.9616047255722373,
"eval_overall_f1": 0.8194993412384717,
"eval_overall_precision": 0.7622549019607843,
"eval_overall_recall": 0.886039886039886,
"eval_runtime": 0.9529,
"eval_samples_per_second": 196.243,
"eval_steps_per_second": 3.148,
"step": 8374
},
{
"epoch": 80.0,
"grad_norm": 1.1319706439971924,
"learning_rate": 1e-05,
"loss": 0.0691,
"step": 8480
},
{
"epoch": 80.0,
"eval_LOCATION_f1": 0.7870967741935484,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7189542483660131,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.625,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8917197452229298,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8536585365853658,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7384615384615385,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8493150684931507,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7948717948717948,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1365245133638382,
"eval_overall_accuracy": 0.9616047255722373,
"eval_overall_f1": 0.8184210526315789,
"eval_overall_precision": 0.7603911980440098,
"eval_overall_recall": 0.886039886039886,
"eval_runtime": 0.9471,
"eval_samples_per_second": 197.451,
"eval_steps_per_second": 3.168,
"step": 8480
},
{
"epoch": 81.0,
"grad_norm": 1.053929090499878,
"learning_rate": 9.5e-06,
"loss": 0.0709,
"step": 8586
},
{
"epoch": 81.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7333333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6470588235294118,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8945686900958466,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.71875,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6571428571428571,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.861111111111111,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8157894736842105,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13273945450782776,
"eval_overall_accuracy": 0.963081466896382,
"eval_overall_f1": 0.8260292164674634,
"eval_overall_precision": 0.7736318407960199,
"eval_overall_recall": 0.886039886039886,
"eval_runtime": 0.9555,
"eval_samples_per_second": 195.717,
"eval_steps_per_second": 3.14,
"step": 8586
},
{
"epoch": 82.0,
"grad_norm": 1.5062341690063477,
"learning_rate": 9e-06,
"loss": 0.0702,
"step": 8692
},
{
"epoch": 82.0,
"eval_LOCATION_f1": 0.7922077922077922,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7333333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6470588235294118,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8945686900958466,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7272727272727273,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6486486486486487,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.861111111111111,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8157894736842105,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1342259794473648,
"eval_overall_accuracy": 0.9620969726802855,
"eval_overall_f1": 0.823841059602649,
"eval_overall_precision": 0.7698019801980198,
"eval_overall_recall": 0.886039886039886,
"eval_runtime": 0.9561,
"eval_samples_per_second": 195.594,
"eval_steps_per_second": 3.138,
"step": 8692
},
{
"epoch": 83.0,
"grad_norm": 1.0942083597183228,
"learning_rate": 8.500000000000002e-06,
"loss": 0.0703,
"step": 8798
},
{
"epoch": 83.0,
"eval_LOCATION_f1": 0.7922077922077922,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.728476821192053,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6395348837209303,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8945686900958466,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7272727272727273,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6486486486486487,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8219178082191781,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7692307692307693,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.13451319932937622,
"eval_overall_accuracy": 0.9620969726802855,
"eval_overall_f1": 0.8190224570673711,
"eval_overall_precision": 0.7635467980295566,
"eval_overall_recall": 0.8831908831908832,
"eval_runtime": 0.9561,
"eval_samples_per_second": 195.58,
"eval_steps_per_second": 3.138,
"step": 8798
},
{
"epoch": 84.0,
"grad_norm": 1.3639521598815918,
"learning_rate": 8.000000000000001e-06,
"loss": 0.0687,
"step": 8904
},
{
"epoch": 84.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7333333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6470588235294118,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8945686900958466,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.716417910447761,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.631578947368421,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8333333333333333,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7894736842105263,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.13550812005996704,
"eval_overall_accuracy": 0.9616047255722373,
"eval_overall_f1": 0.8227513227513228,
"eval_overall_precision": 0.7679012345679013,
"eval_overall_recall": 0.886039886039886,
"eval_runtime": 0.9603,
"eval_samples_per_second": 194.739,
"eval_steps_per_second": 3.124,
"step": 8904
},
{
"epoch": 85.0,
"grad_norm": 1.3763707876205444,
"learning_rate": 7.5e-06,
"loss": 0.0707,
"step": 9010
},
{
"epoch": 85.0,
"eval_LOCATION_f1": 0.7922077922077922,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7236842105263158,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.632183908045977,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8945686900958466,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7575757575757576,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6756756756756757,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8219178082191781,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7692307692307693,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.13885249197483063,
"eval_overall_accuracy": 0.9618508491262614,
"eval_overall_f1": 0.8205804749340371,
"eval_overall_precision": 0.7641277641277642,
"eval_overall_recall": 0.886039886039886,
"eval_runtime": 0.9502,
"eval_samples_per_second": 196.794,
"eval_steps_per_second": 3.157,
"step": 9010
},
{
"epoch": 86.0,
"grad_norm": 0.6508387923240662,
"learning_rate": 7.000000000000001e-06,
"loss": 0.069,
"step": 9116
},
{
"epoch": 86.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7333333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6470588235294118,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8945686900958466,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.746268656716418,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6578947368421053,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8333333333333333,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7894736842105263,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.13471482694149017,
"eval_overall_accuracy": 0.9620969726802855,
"eval_overall_f1": 0.8253968253968255,
"eval_overall_precision": 0.7703703703703704,
"eval_overall_recall": 0.8888888888888888,
"eval_runtime": 0.9478,
"eval_samples_per_second": 197.302,
"eval_steps_per_second": 3.165,
"step": 9116
},
{
"epoch": 87.0,
"grad_norm": 1.5169206857681274,
"learning_rate": 6.5000000000000004e-06,
"loss": 0.0699,
"step": 9222
},
{
"epoch": 87.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.728476821192053,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6395348837209303,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8945686900958466,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.75,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6857142857142857,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.861111111111111,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8157894736842105,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13515108823776245,
"eval_overall_accuracy": 0.9620969726802855,
"eval_overall_f1": 0.8275862068965517,
"eval_overall_precision": 0.7741935483870968,
"eval_overall_recall": 0.8888888888888888,
"eval_runtime": 0.9449,
"eval_samples_per_second": 197.905,
"eval_steps_per_second": 3.175,
"step": 9222
},
{
"epoch": 88.0,
"grad_norm": 0.8914301991462708,
"learning_rate": 6e-06,
"loss": 0.0668,
"step": 9328
},
{
"epoch": 88.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.728476821192053,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6395348837209303,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8945686900958466,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7272727272727273,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6486486486486487,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.861111111111111,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8157894736842105,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1347392499446869,
"eval_overall_accuracy": 0.9616047255722373,
"eval_overall_f1": 0.8253968253968255,
"eval_overall_precision": 0.7703703703703704,
"eval_overall_recall": 0.8888888888888888,
"eval_runtime": 0.9567,
"eval_samples_per_second": 195.462,
"eval_steps_per_second": 3.136,
"step": 9328
},
{
"epoch": 89.0,
"grad_norm": 3.5633649826049805,
"learning_rate": 5.500000000000001e-06,
"loss": 0.0702,
"step": 9434
},
{
"epoch": 89.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.738255033557047,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6547619047619048,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8917197452229298,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8536585365853658,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7384615384615385,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.861111111111111,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8157894736842105,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13250109553337097,
"eval_overall_accuracy": 0.9620969726802855,
"eval_overall_f1": 0.8275862068965517,
"eval_overall_precision": 0.7741935483870968,
"eval_overall_recall": 0.8888888888888888,
"eval_runtime": 0.9522,
"eval_samples_per_second": 196.391,
"eval_steps_per_second": 3.151,
"step": 9434
},
{
"epoch": 90.0,
"grad_norm": 4.408683776855469,
"learning_rate": 5e-06,
"loss": 0.0673,
"step": 9540
},
{
"epoch": 90.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.738255033557047,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6547619047619048,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8917197452229298,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8536585365853658,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.75,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6857142857142857,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.861111111111111,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8157894736842105,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1317829042673111,
"eval_overall_accuracy": 0.9623430962343096,
"eval_overall_f1": 0.8286852589641434,
"eval_overall_precision": 0.7761194029850746,
"eval_overall_recall": 0.8888888888888888,
"eval_runtime": 0.9498,
"eval_samples_per_second": 196.876,
"eval_steps_per_second": 3.158,
"step": 9540
},
{
"epoch": 91.0,
"grad_norm": 1.6093438863754272,
"learning_rate": 4.5e-06,
"loss": 0.0677,
"step": 9646
},
{
"epoch": 91.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7333333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6470588235294118,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8917197452229298,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8536585365853658,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7384615384615385,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.861111111111111,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8157894736842105,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1336798220872879,
"eval_overall_accuracy": 0.9623430962343096,
"eval_overall_f1": 0.8264900662251655,
"eval_overall_precision": 0.7722772277227723,
"eval_overall_recall": 0.8888888888888888,
"eval_runtime": 1.0231,
"eval_samples_per_second": 182.78,
"eval_steps_per_second": 2.932,
"step": 9646
},
{
"epoch": 92.0,
"grad_norm": 1.4977636337280273,
"learning_rate": 4.000000000000001e-06,
"loss": 0.068,
"step": 9752
},
{
"epoch": 92.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7333333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6470588235294118,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8917197452229298,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8536585365853658,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7384615384615385,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.861111111111111,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8157894736842105,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13396261632442474,
"eval_overall_accuracy": 0.9623430962343096,
"eval_overall_f1": 0.8264900662251655,
"eval_overall_precision": 0.7722772277227723,
"eval_overall_recall": 0.8888888888888888,
"eval_runtime": 0.96,
"eval_samples_per_second": 194.788,
"eval_steps_per_second": 3.125,
"step": 9752
},
{
"epoch": 93.0,
"grad_norm": 0.2478037327528,
"learning_rate": 3.5000000000000004e-06,
"loss": 0.0673,
"step": 9858
},
{
"epoch": 93.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7333333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6470588235294118,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8917197452229298,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8536585365853658,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7272727272727273,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6486486486486487,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.861111111111111,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8157894736842105,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13295292854309082,
"eval_overall_accuracy": 0.9618508491262614,
"eval_overall_f1": 0.8253968253968255,
"eval_overall_precision": 0.7703703703703704,
"eval_overall_recall": 0.8888888888888888,
"eval_runtime": 0.9596,
"eval_samples_per_second": 194.864,
"eval_steps_per_second": 3.126,
"step": 9858
},
{
"epoch": 94.0,
"grad_norm": 1.5132652521133423,
"learning_rate": 3e-06,
"loss": 0.0666,
"step": 9964
},
{
"epoch": 94.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7236842105263158,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.632183908045977,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8945686900958466,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7272727272727273,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6486486486486487,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.861111111111111,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8157894736842105,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1347019225358963,
"eval_overall_accuracy": 0.9618508491262614,
"eval_overall_f1": 0.8243064729194187,
"eval_overall_precision": 0.7684729064039408,
"eval_overall_recall": 0.8888888888888888,
"eval_runtime": 0.958,
"eval_samples_per_second": 195.195,
"eval_steps_per_second": 3.131,
"step": 9964
},
{
"epoch": 95.0,
"grad_norm": 0.8759310245513916,
"learning_rate": 2.5e-06,
"loss": 0.0669,
"step": 10070
},
{
"epoch": 95.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7333333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6470588235294118,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8945686900958466,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7272727272727273,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6486486486486487,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.861111111111111,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8157894736842105,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13462986052036285,
"eval_overall_accuracy": 0.9618508491262614,
"eval_overall_f1": 0.8264900662251655,
"eval_overall_precision": 0.7722772277227723,
"eval_overall_recall": 0.8888888888888888,
"eval_runtime": 0.9564,
"eval_samples_per_second": 195.523,
"eval_steps_per_second": 3.137,
"step": 10070
},
{
"epoch": 96.0,
"grad_norm": 1.3174265623092651,
"learning_rate": 2.0000000000000003e-06,
"loss": 0.0683,
"step": 10176
},
{
"epoch": 96.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.728476821192053,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6395348837209303,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8945686900958466,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7272727272727273,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6486486486486487,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.861111111111111,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8157894736842105,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13497987389564514,
"eval_overall_accuracy": 0.9625892197883338,
"eval_overall_f1": 0.8253968253968255,
"eval_overall_precision": 0.7703703703703704,
"eval_overall_recall": 0.8888888888888888,
"eval_runtime": 1.0176,
"eval_samples_per_second": 183.773,
"eval_steps_per_second": 2.948,
"step": 10176
},
{
"epoch": 97.0,
"grad_norm": 0.7363091111183167,
"learning_rate": 1.5e-06,
"loss": 0.0659,
"step": 10282
},
{
"epoch": 97.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7333333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6470588235294118,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8945686900958466,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7272727272727273,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6486486486486487,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.861111111111111,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8157894736842105,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13355118036270142,
"eval_overall_accuracy": 0.9618508491262614,
"eval_overall_f1": 0.8264900662251655,
"eval_overall_precision": 0.7722772277227723,
"eval_overall_recall": 0.8888888888888888,
"eval_runtime": 0.9627,
"eval_samples_per_second": 194.239,
"eval_steps_per_second": 3.116,
"step": 10282
},
{
"epoch": 98.0,
"grad_norm": 0.7795009613037109,
"learning_rate": 1.0000000000000002e-06,
"loss": 0.0679,
"step": 10388
},
{
"epoch": 98.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7333333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6470588235294118,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8945686900958466,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7272727272727273,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6486486486486487,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.861111111111111,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8157894736842105,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1339399665594101,
"eval_overall_accuracy": 0.9620969726802855,
"eval_overall_f1": 0.8264900662251655,
"eval_overall_precision": 0.7722772277227723,
"eval_overall_recall": 0.8888888888888888,
"eval_runtime": 0.9645,
"eval_samples_per_second": 193.887,
"eval_steps_per_second": 3.11,
"step": 10388
},
{
"epoch": 99.0,
"grad_norm": 0.9519725441932678,
"learning_rate": 5.000000000000001e-07,
"loss": 0.0674,
"step": 10494
},
{
"epoch": 99.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7333333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6470588235294118,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8945686900958466,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7272727272727273,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6486486486486487,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.861111111111111,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8157894736842105,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13475549221038818,
"eval_overall_accuracy": 0.9620969726802855,
"eval_overall_f1": 0.8264900662251655,
"eval_overall_precision": 0.7722772277227723,
"eval_overall_recall": 0.8888888888888888,
"eval_runtime": 0.9607,
"eval_samples_per_second": 194.64,
"eval_steps_per_second": 3.123,
"step": 10494
},
{
"epoch": 100.0,
"grad_norm": 0.5444777607917786,
"learning_rate": 0.0,
"loss": 0.0677,
"step": 10600
},
{
"epoch": 100.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7333333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6470588235294118,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8945686900958466,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7272727272727273,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6486486486486487,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.861111111111111,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8157894736842105,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1346171796321869,
"eval_overall_accuracy": 0.9620969726802855,
"eval_overall_f1": 0.8264900662251655,
"eval_overall_precision": 0.7722772277227723,
"eval_overall_recall": 0.8888888888888888,
"eval_runtime": 0.9671,
"eval_samples_per_second": 193.362,
"eval_steps_per_second": 3.102,
"step": 10600
},
{
"epoch": 100.0,
"step": 10600,
"total_flos": 4551589111445376.0,
"train_loss": 0.12355997449946854,
"train_runtime": 1233.063,
"train_samples_per_second": 136.895,
"train_steps_per_second": 8.596
}
],
"logging_steps": 500,
"max_steps": 10600,
"num_input_tokens_seen": 0,
"num_train_epochs": 100,
"save_steps": 500,
"total_flos": 4551589111445376.0,
"train_batch_size": 16,
"trial_name": null,
"trial_params": null
}