nerugm-unipelt-1 / trainer_state.json
apwic's picture
End of training
e557e9f verified
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 100.0,
"eval_steps": 500,
"global_step": 10600,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"grad_norm": 1.0568287372589111,
"learning_rate": 4.9500000000000004e-05,
"loss": 0.9528,
"step": 106
},
{
"epoch": 1.0,
"eval_LOCATION_f1": 0.0,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.0,
"eval_LOCATION_recall": 0.0,
"eval_ORGANIZATION_f1": 0.0,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.0,
"eval_ORGANIZATION_recall": 0.0,
"eval_PERSON_f1": 0.012738853503184716,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.25,
"eval_PERSON_recall": 0.006535947712418301,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.0,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.0,
"eval_TIME_recall": 0.0,
"eval_loss": 0.6222904920578003,
"eval_overall_accuracy": 0.8357691354966559,
"eval_overall_f1": 0.005698005698005698,
"eval_overall_precision": 0.2,
"eval_overall_recall": 0.002890173410404624,
"eval_runtime": 0.4063,
"eval_samples_per_second": 460.253,
"eval_steps_per_second": 7.384,
"step": 106
},
{
"epoch": 2.0,
"grad_norm": 1.066505789756775,
"learning_rate": 4.9e-05,
"loss": 0.5159,
"step": 212
},
{
"epoch": 2.0,
"eval_LOCATION_f1": 0.45312499999999994,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.4915254237288136,
"eval_LOCATION_recall": 0.42028985507246375,
"eval_ORGANIZATION_f1": 0.06060606060606061,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.07894736842105263,
"eval_ORGANIZATION_recall": 0.04918032786885246,
"eval_PERSON_f1": 0.5912596401028277,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.4872881355932203,
"eval_PERSON_recall": 0.7516339869281046,
"eval_QUANTITY_f1": 0.03773584905660377,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.047619047619047616,
"eval_QUANTITY_recall": 0.03125,
"eval_TIME_f1": 0.5405405405405406,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.46511627906976744,
"eval_TIME_recall": 0.6451612903225806,
"eval_loss": 0.36079517006874084,
"eval_overall_accuracy": 0.8981917265296012,
"eval_overall_f1": 0.45222072678331093,
"eval_overall_precision": 0.42317380352644834,
"eval_overall_recall": 0.48554913294797686,
"eval_runtime": 0.4072,
"eval_samples_per_second": 459.196,
"eval_steps_per_second": 7.367,
"step": 212
},
{
"epoch": 3.0,
"grad_norm": 1.205767273902893,
"learning_rate": 4.85e-05,
"loss": 0.297,
"step": 318
},
{
"epoch": 3.0,
"eval_LOCATION_f1": 0.6946107784431138,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.5918367346938775,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.513888888888889,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.4457831325301205,
"eval_ORGANIZATION_recall": 0.6065573770491803,
"eval_PERSON_f1": 0.8414634146341464,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.7885714285714286,
"eval_PERSON_recall": 0.9019607843137255,
"eval_QUANTITY_f1": 0.5866666666666667,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.5116279069767442,
"eval_QUANTITY_recall": 0.6875,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.19271065294742584,
"eval_overall_accuracy": 0.940797621996532,
"eval_overall_f1": 0.7249357326478149,
"eval_overall_precision": 0.6527777777777778,
"eval_overall_recall": 0.815028901734104,
"eval_runtime": 0.4062,
"eval_samples_per_second": 460.369,
"eval_steps_per_second": 7.386,
"step": 318
},
{
"epoch": 4.0,
"grad_norm": 1.6758396625518799,
"learning_rate": 4.8e-05,
"loss": 0.1907,
"step": 424
},
{
"epoch": 4.0,
"eval_LOCATION_f1": 0.7142857142857143,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.6060606060606061,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.624113475177305,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.55,
"eval_ORGANIZATION_recall": 0.7213114754098361,
"eval_PERSON_f1": 0.8685015290519879,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8160919540229885,
"eval_PERSON_recall": 0.9281045751633987,
"eval_QUANTITY_f1": 0.5952380952380952,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.4807692307692308,
"eval_QUANTITY_recall": 0.78125,
"eval_TIME_f1": 0.7123287671232876,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.6190476190476191,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.17424248158931732,
"eval_overall_accuracy": 0.9437701263314342,
"eval_overall_f1": 0.7490542244640607,
"eval_overall_precision": 0.6644295302013423,
"eval_overall_recall": 0.8583815028901735,
"eval_runtime": 0.4062,
"eval_samples_per_second": 460.371,
"eval_steps_per_second": 7.386,
"step": 424
},
{
"epoch": 5.0,
"grad_norm": 1.1901781558990479,
"learning_rate": 4.75e-05,
"loss": 0.1593,
"step": 530
},
{
"epoch": 5.0,
"eval_LOCATION_f1": 0.728476821192053,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.6707317073170732,
"eval_LOCATION_recall": 0.7971014492753623,
"eval_ORGANIZATION_f1": 0.6573426573426574,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.573170731707317,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.8703703703703703,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8245614035087719,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7536231884057971,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7027027027027027,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8709677419354839,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8709677419354839,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.13567817211151123,
"eval_overall_accuracy": 0.9549170175873173,
"eval_overall_f1": 0.7903871829105475,
"eval_overall_precision": 0.7344913151364765,
"eval_overall_recall": 0.8554913294797688,
"eval_runtime": 0.4057,
"eval_samples_per_second": 460.888,
"eval_steps_per_second": 7.394,
"step": 530
},
{
"epoch": 6.0,
"grad_norm": 0.41255536675453186,
"learning_rate": 4.7e-05,
"loss": 0.1401,
"step": 636
},
{
"epoch": 6.0,
"eval_LOCATION_f1": 0.720496894409938,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.6304347826086957,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.6666666666666666,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.5783132530120482,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.8909657320872275,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8511904761904762,
"eval_PERSON_recall": 0.934640522875817,
"eval_QUANTITY_f1": 0.7397260273972602,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6585365853658537,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.7941176470588235,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7297297297297297,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1358344703912735,
"eval_overall_accuracy": 0.9554124349764677,
"eval_overall_f1": 0.7900912646675358,
"eval_overall_precision": 0.7197149643705463,
"eval_overall_recall": 0.8757225433526011,
"eval_runtime": 0.4073,
"eval_samples_per_second": 459.153,
"eval_steps_per_second": 7.366,
"step": 636
},
{
"epoch": 7.0,
"grad_norm": 0.6113700270652771,
"learning_rate": 4.6500000000000005e-05,
"loss": 0.1309,
"step": 742
},
{
"epoch": 7.0,
"eval_LOCATION_f1": 0.713375796178344,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.6363636363636364,
"eval_LOCATION_recall": 0.8115942028985508,
"eval_ORGANIZATION_f1": 0.6853146853146853,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.5975609756097561,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.8875000000000001,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8502994011976048,
"eval_PERSON_recall": 0.9281045751633987,
"eval_QUANTITY_f1": 0.7027027027027026,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6190476190476191,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.13016657531261444,
"eval_overall_accuracy": 0.9571463958384939,
"eval_overall_f1": 0.7915567282321899,
"eval_overall_precision": 0.7281553398058253,
"eval_overall_recall": 0.8670520231213873,
"eval_runtime": 0.4064,
"eval_samples_per_second": 460.124,
"eval_steps_per_second": 7.382,
"step": 742
},
{
"epoch": 8.0,
"grad_norm": 0.6097145080566406,
"learning_rate": 4.600000000000001e-05,
"loss": 0.1197,
"step": 848
},
{
"epoch": 8.0,
"eval_LOCATION_f1": 0.7866666666666667,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6950354609929078,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6125,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.8832807570977917,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8536585365853658,
"eval_PERSON_recall": 0.9150326797385621,
"eval_QUANTITY_f1": 0.7941176470588235,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.75,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.7536231884057972,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.6842105263157895,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.1251688003540039,
"eval_overall_accuracy": 0.9581372306167947,
"eval_overall_f1": 0.8080536912751678,
"eval_overall_precision": 0.7543859649122807,
"eval_overall_recall": 0.869942196531792,
"eval_runtime": 0.4062,
"eval_samples_per_second": 460.399,
"eval_steps_per_second": 7.386,
"step": 848
},
{
"epoch": 9.0,
"grad_norm": 1.3508681058883667,
"learning_rate": 4.55e-05,
"loss": 0.1102,
"step": 954
},
{
"epoch": 9.0,
"eval_LOCATION_f1": 0.7468354430379747,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.6629213483146067,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6969696969696969,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.647887323943662,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.8909657320872275,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8511904761904762,
"eval_PERSON_recall": 0.934640522875817,
"eval_QUANTITY_f1": 0.823529411764706,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7777777777777778,
"eval_QUANTITY_recall": 0.875,
"eval_TIME_f1": 0.782608695652174,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7105263157894737,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.13306157290935516,
"eval_overall_accuracy": 0.9588803567005202,
"eval_overall_f1": 0.8101604278074866,
"eval_overall_precision": 0.753731343283582,
"eval_overall_recall": 0.8757225433526011,
"eval_runtime": 0.4057,
"eval_samples_per_second": 460.913,
"eval_steps_per_second": 7.394,
"step": 954
},
{
"epoch": 10.0,
"grad_norm": 1.0420314073562622,
"learning_rate": 4.5e-05,
"loss": 0.1078,
"step": 1060
},
{
"epoch": 10.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7631578947368421,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.6466165413533835,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.5972222222222222,
"eval_ORGANIZATION_recall": 0.7049180327868853,
"eval_PERSON_f1": 0.9050632911392406,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8773006134969326,
"eval_PERSON_recall": 0.934640522875817,
"eval_QUANTITY_f1": 0.7941176470588235,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.75,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.787878787878788,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7428571428571429,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.11589627712965012,
"eval_overall_accuracy": 0.9608620262571216,
"eval_overall_f1": 0.815934065934066,
"eval_overall_precision": 0.7774869109947644,
"eval_overall_recall": 0.8583815028901735,
"eval_runtime": 0.4069,
"eval_samples_per_second": 459.57,
"eval_steps_per_second": 7.373,
"step": 1060
},
{
"epoch": 11.0,
"grad_norm": 0.47683292627334595,
"learning_rate": 4.4500000000000004e-05,
"loss": 0.1003,
"step": 1166
},
{
"epoch": 11.0,
"eval_LOCATION_f1": 0.7682119205298014,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7073170731707317,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.6865671641791045,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6301369863013698,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.89375,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8562874251497006,
"eval_PERSON_recall": 0.934640522875817,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.7714285714285716,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.6923076923076923,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.12274792045354843,
"eval_overall_accuracy": 0.9591280653950953,
"eval_overall_f1": 0.8080536912751678,
"eval_overall_precision": 0.7543859649122807,
"eval_overall_recall": 0.869942196531792,
"eval_runtime": 0.4044,
"eval_samples_per_second": 462.406,
"eval_steps_per_second": 7.418,
"step": 1166
},
{
"epoch": 12.0,
"grad_norm": 1.9095113277435303,
"learning_rate": 4.4000000000000006e-05,
"loss": 0.0953,
"step": 1272
},
{
"epoch": 12.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7631578947368421,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.6515151515151515,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6056338028169014,
"eval_ORGANIZATION_recall": 0.7049180327868853,
"eval_PERSON_f1": 0.9009584664536741,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.88125,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.742857142857143,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6842105263157895,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.12356565147638321,
"eval_overall_accuracy": 0.9581372306167947,
"eval_overall_f1": 0.8110344827586207,
"eval_overall_precision": 0.7757255936675461,
"eval_overall_recall": 0.8497109826589595,
"eval_runtime": 0.4041,
"eval_samples_per_second": 462.759,
"eval_steps_per_second": 7.424,
"step": 1272
},
{
"epoch": 13.0,
"grad_norm": 0.6649303436279297,
"learning_rate": 4.35e-05,
"loss": 0.0906,
"step": 1378
},
{
"epoch": 13.0,
"eval_LOCATION_f1": 0.7549668874172186,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.6951219512195121,
"eval_LOCATION_recall": 0.8260869565217391,
"eval_ORGANIZATION_f1": 0.7272727272727272,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6341463414634146,
"eval_ORGANIZATION_recall": 0.8524590163934426,
"eval_PERSON_f1": 0.9034267912772587,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8630952380952381,
"eval_PERSON_recall": 0.9477124183006536,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8059701492537312,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.12967564165592194,
"eval_overall_accuracy": 0.9608620262571216,
"eval_overall_f1": 0.822429906542056,
"eval_overall_precision": 0.7642679900744417,
"eval_overall_recall": 0.8901734104046243,
"eval_runtime": 0.4045,
"eval_samples_per_second": 462.351,
"eval_steps_per_second": 7.417,
"step": 1378
},
{
"epoch": 14.0,
"grad_norm": 1.123289704322815,
"learning_rate": 4.3e-05,
"loss": 0.0875,
"step": 1484
},
{
"epoch": 14.0,
"eval_LOCATION_f1": 0.7891156462585034,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7435897435897436,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.6928104575163399,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.5760869565217391,
"eval_ORGANIZATION_recall": 0.8688524590163934,
"eval_PERSON_f1": 0.9090909090909091,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8734939759036144,
"eval_PERSON_recall": 0.9477124183006536,
"eval_QUANTITY_f1": 0.75,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.675,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.7222222222222222,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.6341463414634146,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.1440243422985077,
"eval_overall_accuracy": 0.9546693088927422,
"eval_overall_f1": 0.8099606815203145,
"eval_overall_precision": 0.7410071942446043,
"eval_overall_recall": 0.8930635838150289,
"eval_runtime": 0.4035,
"eval_samples_per_second": 463.475,
"eval_steps_per_second": 7.435,
"step": 1484
},
{
"epoch": 15.0,
"grad_norm": 0.35692471265792847,
"learning_rate": 4.25e-05,
"loss": 0.0851,
"step": 1590
},
{
"epoch": 15.0,
"eval_LOCATION_f1": 0.7972972972972974,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7468354430379747,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6715328467153285,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6052631578947368,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.8930817610062893,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8606060606060606,
"eval_PERSON_recall": 0.9281045751633987,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.13237613439559937,
"eval_overall_accuracy": 0.9573941045330691,
"eval_overall_f1": 0.8130081300813009,
"eval_overall_precision": 0.7653061224489796,
"eval_overall_recall": 0.8670520231213873,
"eval_runtime": 0.4054,
"eval_samples_per_second": 461.222,
"eval_steps_per_second": 7.399,
"step": 1590
},
{
"epoch": 16.0,
"grad_norm": 0.7279097437858582,
"learning_rate": 4.2e-05,
"loss": 0.0757,
"step": 1696
},
{
"epoch": 16.0,
"eval_LOCATION_f1": 0.7919463087248322,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7375,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7142857142857143,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6329113924050633,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.9022082018927446,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8719512195121951,
"eval_PERSON_recall": 0.934640522875817,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.1373172551393509,
"eval_overall_accuracy": 0.9593757740896706,
"eval_overall_f1": 0.8232118758434549,
"eval_overall_precision": 0.7721518987341772,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.4031,
"eval_samples_per_second": 463.937,
"eval_steps_per_second": 7.443,
"step": 1696
},
{
"epoch": 17.0,
"grad_norm": 0.11543399840593338,
"learning_rate": 4.15e-05,
"loss": 0.0752,
"step": 1802
},
{
"epoch": 17.0,
"eval_LOCATION_f1": 0.7483870967741935,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.6744186046511628,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.6811594202898551,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6103896103896104,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.9015873015873016,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8765432098765432,
"eval_PERSON_recall": 0.9281045751633987,
"eval_QUANTITY_f1": 0.7826086956521738,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7297297297297297,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.835820895522388,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7777777777777778,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.12998123466968536,
"eval_overall_accuracy": 0.9603666088679713,
"eval_overall_f1": 0.8118279569892471,
"eval_overall_precision": 0.7587939698492462,
"eval_overall_recall": 0.8728323699421965,
"eval_runtime": 0.4006,
"eval_samples_per_second": 466.782,
"eval_steps_per_second": 7.488,
"step": 1802
},
{
"epoch": 18.0,
"grad_norm": 0.6546134948730469,
"learning_rate": 4.1e-05,
"loss": 0.0707,
"step": 1908
},
{
"epoch": 18.0,
"eval_LOCATION_f1": 0.7972972972972974,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7468354430379747,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6666666666666666,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6461538461538462,
"eval_ORGANIZATION_recall": 0.6885245901639344,
"eval_PERSON_f1": 0.9022082018927446,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8719512195121951,
"eval_PERSON_recall": 0.934640522875817,
"eval_QUANTITY_f1": 0.7826086956521738,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7297297297297297,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.787878787878788,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7428571428571429,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.1343889832496643,
"eval_overall_accuracy": 0.9591280653950953,
"eval_overall_f1": 0.8181818181818181,
"eval_overall_precision": 0.781578947368421,
"eval_overall_recall": 0.8583815028901735,
"eval_runtime": 0.4031,
"eval_samples_per_second": 463.911,
"eval_steps_per_second": 7.442,
"step": 1908
},
{
"epoch": 19.0,
"grad_norm": 1.4081445932388306,
"learning_rate": 4.05e-05,
"loss": 0.0692,
"step": 2014
},
{
"epoch": 19.0,
"eval_LOCATION_f1": 0.7945205479452054,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7532467532467533,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.7058823529411764,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.64,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.8930817610062893,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8606060606060606,
"eval_PERSON_recall": 0.9281045751633987,
"eval_QUANTITY_f1": 0.8115942028985507,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7567567567567568,
"eval_QUANTITY_recall": 0.875,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.1338239461183548,
"eval_overall_accuracy": 0.9601189001733961,
"eval_overall_f1": 0.8228882833787465,
"eval_overall_precision": 0.7783505154639175,
"eval_overall_recall": 0.8728323699421965,
"eval_runtime": 0.4025,
"eval_samples_per_second": 464.628,
"eval_steps_per_second": 7.454,
"step": 2014
},
{
"epoch": 20.0,
"grad_norm": 0.6560825705528259,
"learning_rate": 4e-05,
"loss": 0.0647,
"step": 2120
},
{
"epoch": 20.0,
"eval_LOCATION_f1": 0.8082191780821918,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7662337662337663,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7058823529411764,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.64,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9056603773584905,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8727272727272727,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1284184455871582,
"eval_overall_accuracy": 0.9618528610354223,
"eval_overall_f1": 0.8333333333333334,
"eval_overall_precision": 0.7901554404145078,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.4032,
"eval_samples_per_second": 463.739,
"eval_steps_per_second": 7.44,
"step": 2120
},
{
"epoch": 21.0,
"grad_norm": 1.2687212228775024,
"learning_rate": 3.9500000000000005e-05,
"loss": 0.0611,
"step": 2226
},
{
"epoch": 21.0,
"eval_LOCATION_f1": 0.7549668874172186,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.6951219512195121,
"eval_LOCATION_recall": 0.8260869565217391,
"eval_ORGANIZATION_f1": 0.689655172413793,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.5952380952380952,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.8902821316614421,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8554216867469879,
"eval_PERSON_recall": 0.9281045751633987,
"eval_QUANTITY_f1": 0.7123287671232876,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6341463414634146,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.7647058823529411,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7027027027027027,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.15563081204891205,
"eval_overall_accuracy": 0.9521922219469904,
"eval_overall_f1": 0.7962962962962963,
"eval_overall_precision": 0.7341463414634146,
"eval_overall_recall": 0.869942196531792,
"eval_runtime": 0.4026,
"eval_samples_per_second": 464.462,
"eval_steps_per_second": 7.451,
"step": 2226
},
{
"epoch": 22.0,
"grad_norm": 0.9706618189811707,
"learning_rate": 3.9000000000000006e-05,
"loss": 0.0626,
"step": 2332
},
{
"epoch": 22.0,
"eval_LOCATION_f1": 0.7763157894736842,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7108433734939759,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7083333333333334,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6144578313253012,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.9119496855345912,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8787878787878788,
"eval_PERSON_recall": 0.9477124183006536,
"eval_QUANTITY_f1": 0.7536231884057971,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7027027027027027,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.7647058823529411,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7027027027027027,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.1527089774608612,
"eval_overall_accuracy": 0.9583849393113698,
"eval_overall_f1": 0.8175765645805592,
"eval_overall_precision": 0.7580246913580246,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.4032,
"eval_samples_per_second": 463.751,
"eval_steps_per_second": 7.44,
"step": 2332
},
{
"epoch": 23.0,
"grad_norm": 0.8338723182678223,
"learning_rate": 3.85e-05,
"loss": 0.0588,
"step": 2438
},
{
"epoch": 23.0,
"eval_LOCATION_f1": 0.8082191780821918,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7662337662337663,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6906474820143885,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6153846153846154,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9137380191693291,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.89375,
"eval_PERSON_recall": 0.934640522875817,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8125,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.13671712577342987,
"eval_overall_accuracy": 0.9611097349516968,
"eval_overall_f1": 0.831275720164609,
"eval_overall_precision": 0.7911227154046997,
"eval_overall_recall": 0.8757225433526011,
"eval_runtime": 0.4037,
"eval_samples_per_second": 463.194,
"eval_steps_per_second": 7.431,
"step": 2438
},
{
"epoch": 24.0,
"grad_norm": 1.8579022884368896,
"learning_rate": 3.8e-05,
"loss": 0.0549,
"step": 2544
},
{
"epoch": 24.0,
"eval_LOCATION_f1": 0.7866666666666667,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7164179104477612,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6575342465753424,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9009584664536741,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.88125,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.8358208955223881,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.8,
"eval_QUANTITY_recall": 0.875,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.14114215970039368,
"eval_overall_accuracy": 0.961357443646272,
"eval_overall_f1": 0.8324175824175825,
"eval_overall_precision": 0.7931937172774869,
"eval_overall_recall": 0.8757225433526011,
"eval_runtime": 0.4057,
"eval_samples_per_second": 460.959,
"eval_steps_per_second": 7.395,
"step": 2544
},
{
"epoch": 25.0,
"grad_norm": 0.7675341963768005,
"learning_rate": 3.7500000000000003e-05,
"loss": 0.0524,
"step": 2650
},
{
"epoch": 25.0,
"eval_LOCATION_f1": 0.7682119205298014,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7073170731707317,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.7050359712230215,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6282051282051282,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.9056603773584905,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8727272727272727,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8181818181818182,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7714285714285715,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1436871439218521,
"eval_overall_accuracy": 0.9616051523408472,
"eval_overall_f1": 0.8232118758434549,
"eval_overall_precision": 0.7721518987341772,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.4021,
"eval_samples_per_second": 465.093,
"eval_steps_per_second": 7.461,
"step": 2650
},
{
"epoch": 26.0,
"grad_norm": 0.9390576481819153,
"learning_rate": 3.7e-05,
"loss": 0.0526,
"step": 2756
},
{
"epoch": 26.0,
"eval_LOCATION_f1": 0.802721088435374,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7564102564102564,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6666666666666667,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6081081081081081,
"eval_ORGANIZATION_recall": 0.7377049180327869,
"eval_PERSON_f1": 0.9056603773584905,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8727272727272727,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.7761194029850748,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7428571428571429,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.13506074249744415,
"eval_overall_accuracy": 0.9616051523408472,
"eval_overall_f1": 0.8224043715846995,
"eval_overall_precision": 0.7797927461139896,
"eval_overall_recall": 0.869942196531792,
"eval_runtime": 0.4036,
"eval_samples_per_second": 463.371,
"eval_steps_per_second": 7.434,
"step": 2756
},
{
"epoch": 27.0,
"grad_norm": 0.5190781354904175,
"learning_rate": 3.65e-05,
"loss": 0.0487,
"step": 2862
},
{
"epoch": 27.0,
"eval_LOCATION_f1": 0.7866666666666667,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6911764705882353,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6266666666666667,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.9050632911392406,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8773006134969326,
"eval_PERSON_recall": 0.934640522875817,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.14294296503067017,
"eval_overall_accuracy": 0.9611097349516968,
"eval_overall_f1": 0.8256130790190735,
"eval_overall_precision": 0.7809278350515464,
"eval_overall_recall": 0.8757225433526011,
"eval_runtime": 0.4031,
"eval_samples_per_second": 463.951,
"eval_steps_per_second": 7.443,
"step": 2862
},
{
"epoch": 28.0,
"grad_norm": 1.7428516149520874,
"learning_rate": 3.6e-05,
"loss": 0.0476,
"step": 2968
},
{
"epoch": 28.0,
"eval_LOCATION_f1": 0.7843137254901961,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7142857142857143,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7022900763358779,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6571428571428571,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9022082018927446,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8719512195121951,
"eval_PERSON_recall": 0.934640522875817,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.7941176470588235,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7297297297297297,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.14721077680587769,
"eval_overall_accuracy": 0.9606143175625464,
"eval_overall_f1": 0.8233695652173912,
"eval_overall_precision": 0.7769230769230769,
"eval_overall_recall": 0.8757225433526011,
"eval_runtime": 0.4015,
"eval_samples_per_second": 465.726,
"eval_steps_per_second": 7.472,
"step": 2968
},
{
"epoch": 29.0,
"grad_norm": 1.087302803993225,
"learning_rate": 3.55e-05,
"loss": 0.0462,
"step": 3074
},
{
"epoch": 29.0,
"eval_LOCATION_f1": 0.7733333333333333,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7160493827160493,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.7083333333333334,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6144578313253012,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.9216300940438872,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8855421686746988,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8059701492537312,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.16020502150058746,
"eval_overall_accuracy": 0.9616051523408472,
"eval_overall_f1": 0.8299866131191432,
"eval_overall_precision": 0.773067331670823,
"eval_overall_recall": 0.8959537572254336,
"eval_runtime": 0.4026,
"eval_samples_per_second": 464.429,
"eval_steps_per_second": 7.451,
"step": 3074
},
{
"epoch": 30.0,
"grad_norm": 0.6619191765785217,
"learning_rate": 3.5e-05,
"loss": 0.0444,
"step": 3180
},
{
"epoch": 30.0,
"eval_LOCATION_f1": 0.8137931034482757,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7763157894736842,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.620253164556962,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.9216300940438872,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8855421686746988,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.15210027992725372,
"eval_overall_accuracy": 0.9625959871191478,
"eval_overall_f1": 0.8408163265306122,
"eval_overall_precision": 0.794344473007712,
"eval_overall_recall": 0.8930635838150289,
"eval_runtime": 0.4053,
"eval_samples_per_second": 461.371,
"eval_steps_per_second": 7.402,
"step": 3180
},
{
"epoch": 31.0,
"grad_norm": 0.4051073491573334,
"learning_rate": 3.45e-05,
"loss": 0.0446,
"step": 3286
},
{
"epoch": 31.0,
"eval_LOCATION_f1": 0.7702702702702703,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7215189873417721,
"eval_LOCATION_recall": 0.8260869565217391,
"eval_ORGANIZATION_f1": 0.7,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.620253164556962,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.9119496855345912,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8787878787878788,
"eval_PERSON_recall": 0.9477124183006536,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.15809132158756256,
"eval_overall_accuracy": 0.9608620262571216,
"eval_overall_f1": 0.8276797829036635,
"eval_overall_precision": 0.7800511508951407,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.403,
"eval_samples_per_second": 464.077,
"eval_steps_per_second": 7.445,
"step": 3286
},
{
"epoch": 32.0,
"grad_norm": 0.33254846930503845,
"learning_rate": 3.4000000000000007e-05,
"loss": 0.0406,
"step": 3392
},
{
"epoch": 32.0,
"eval_LOCATION_f1": 0.8243243243243245,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.6766917293233082,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.625,
"eval_ORGANIZATION_recall": 0.7377049180327869,
"eval_PERSON_f1": 0.9269841269841269,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9012345679012346,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.15239284932613373,
"eval_overall_accuracy": 0.9623482784245727,
"eval_overall_f1": 0.8418156808803301,
"eval_overall_precision": 0.8031496062992126,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.4004,
"eval_samples_per_second": 466.996,
"eval_steps_per_second": 7.492,
"step": 3392
},
{
"epoch": 33.0,
"grad_norm": 0.20717833936214447,
"learning_rate": 3.35e-05,
"loss": 0.0411,
"step": 3498
},
{
"epoch": 33.0,
"eval_LOCATION_f1": 0.821917808219178,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7792207792207793,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6956521739130435,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6233766233766234,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9142857142857143,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8888888888888888,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.14470325410366058,
"eval_overall_accuracy": 0.9638345305920237,
"eval_overall_f1": 0.8372093023255814,
"eval_overall_precision": 0.7948051948051948,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.409,
"eval_samples_per_second": 457.261,
"eval_steps_per_second": 7.336,
"step": 3498
},
{
"epoch": 34.0,
"grad_norm": 1.046993613243103,
"learning_rate": 3.3e-05,
"loss": 0.0376,
"step": 3604
},
{
"epoch": 34.0,
"eval_LOCATION_f1": 0.7733333333333333,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7160493827160493,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.684931506849315,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.5882352941176471,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.9177215189873417,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8895705521472392,
"eval_PERSON_recall": 0.9477124183006536,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.17131732404232025,
"eval_overall_accuracy": 0.9606143175625464,
"eval_overall_f1": 0.8252688172043011,
"eval_overall_precision": 0.7713567839195979,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.4026,
"eval_samples_per_second": 464.46,
"eval_steps_per_second": 7.451,
"step": 3604
},
{
"epoch": 35.0,
"grad_norm": 1.2515838146209717,
"learning_rate": 3.2500000000000004e-05,
"loss": 0.0386,
"step": 3710
},
{
"epoch": 35.0,
"eval_LOCATION_f1": 0.7866666666666667,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6911764705882353,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6266666666666667,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.9085173501577287,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8780487804878049,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.15111976861953735,
"eval_overall_accuracy": 0.9630914045082982,
"eval_overall_f1": 0.8283378746594006,
"eval_overall_precision": 0.7835051546391752,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.4042,
"eval_samples_per_second": 462.608,
"eval_steps_per_second": 7.422,
"step": 3710
},
{
"epoch": 36.0,
"grad_norm": 1.2548344135284424,
"learning_rate": 3.2000000000000005e-05,
"loss": 0.0357,
"step": 3816
},
{
"epoch": 36.0,
"eval_LOCATION_f1": 0.8194444444444444,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7866666666666666,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7092198581560285,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.625,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.9182389937106918,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8848484848484849,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.8484848484848485,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.8235294117647058,
"eval_QUANTITY_recall": 0.875,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1648045778274536,
"eval_overall_accuracy": 0.9628436958137231,
"eval_overall_f1": 0.8458390177353343,
"eval_overall_precision": 0.8010335917312662,
"eval_overall_recall": 0.8959537572254336,
"eval_runtime": 0.4042,
"eval_samples_per_second": 462.674,
"eval_steps_per_second": 7.423,
"step": 3816
},
{
"epoch": 37.0,
"grad_norm": 2.816448450088501,
"learning_rate": 3.15e-05,
"loss": 0.0347,
"step": 3922
},
{
"epoch": 37.0,
"eval_LOCATION_f1": 0.7891156462585034,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7435897435897436,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.7222222222222222,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6265060240963856,
"eval_ORGANIZATION_recall": 0.8524590163934426,
"eval_PERSON_f1": 0.9303797468354431,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.901840490797546,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.84375,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.170131117105484,
"eval_overall_accuracy": 0.9635868218974486,
"eval_overall_f1": 0.8439620081411127,
"eval_overall_precision": 0.7953964194373402,
"eval_overall_recall": 0.8988439306358381,
"eval_runtime": 0.4012,
"eval_samples_per_second": 466.072,
"eval_steps_per_second": 7.477,
"step": 3922
},
{
"epoch": 38.0,
"grad_norm": 1.0050489902496338,
"learning_rate": 3.1e-05,
"loss": 0.0354,
"step": 4028
},
{
"epoch": 38.0,
"eval_LOCATION_f1": 0.7808219178082192,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7402597402597403,
"eval_LOCATION_recall": 0.8260869565217391,
"eval_ORGANIZATION_f1": 0.6666666666666666,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6197183098591549,
"eval_ORGANIZATION_recall": 0.7213114754098361,
"eval_PERSON_f1": 0.9240506329113924,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8957055214723927,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.7761194029850748,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7428571428571429,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.14870800077915192,
"eval_overall_accuracy": 0.964082239286599,
"eval_overall_f1": 0.8275862068965517,
"eval_overall_precision": 0.7915567282321899,
"eval_overall_recall": 0.8670520231213873,
"eval_runtime": 0.4006,
"eval_samples_per_second": 466.802,
"eval_steps_per_second": 7.489,
"step": 4028
},
{
"epoch": 39.0,
"grad_norm": 0.5996510982513428,
"learning_rate": 3.05e-05,
"loss": 0.0337,
"step": 4134
},
{
"epoch": 39.0,
"eval_LOCATION_f1": 0.8275862068965517,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7894736842105263,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7172413793103448,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6190476190476191,
"eval_ORGANIZATION_recall": 0.8524590163934426,
"eval_PERSON_f1": 0.9090909090909091,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8734939759036144,
"eval_PERSON_recall": 0.9477124183006536,
"eval_QUANTITY_f1": 0.7941176470588235,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.75,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.16299550235271454,
"eval_overall_accuracy": 0.9625959871191478,
"eval_overall_f1": 0.8394062078272604,
"eval_overall_precision": 0.7873417721518987,
"eval_overall_recall": 0.8988439306358381,
"eval_runtime": 0.4063,
"eval_samples_per_second": 460.239,
"eval_steps_per_second": 7.384,
"step": 4134
},
{
"epoch": 40.0,
"grad_norm": 2.1595568656921387,
"learning_rate": 3e-05,
"loss": 0.031,
"step": 4240
},
{
"epoch": 40.0,
"eval_LOCATION_f1": 0.7651006711409397,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7125,
"eval_LOCATION_recall": 0.8260869565217391,
"eval_ORGANIZATION_f1": 0.7014925373134328,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6438356164383562,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.9182389937106918,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8848484848484849,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.7941176470588235,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.75,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1605391651391983,
"eval_overall_accuracy": 0.9630914045082982,
"eval_overall_f1": 0.829467939972715,
"eval_overall_precision": 0.7855297157622739,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.4029,
"eval_samples_per_second": 464.118,
"eval_steps_per_second": 7.446,
"step": 4240
},
{
"epoch": 41.0,
"grad_norm": 0.07246937602758408,
"learning_rate": 2.95e-05,
"loss": 0.0305,
"step": 4346
},
{
"epoch": 41.0,
"eval_LOCATION_f1": 0.7755102040816326,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7307692307692307,
"eval_LOCATION_recall": 0.8260869565217391,
"eval_ORGANIZATION_f1": 0.676056338028169,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.5925925925925926,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9119496855345912,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8787878787878788,
"eval_PERSON_recall": 0.9477124183006536,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1640830785036087,
"eval_overall_accuracy": 0.9616051523408472,
"eval_overall_f1": 0.8238482384823848,
"eval_overall_precision": 0.7755102040816326,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.4046,
"eval_samples_per_second": 462.202,
"eval_steps_per_second": 7.415,
"step": 4346
},
{
"epoch": 42.0,
"grad_norm": 1.7377935647964478,
"learning_rate": 2.9e-05,
"loss": 0.0292,
"step": 4452
},
{
"epoch": 42.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7631578947368421,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.7092198581560285,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.625,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.9269841269841269,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9012345679012346,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.16985991597175598,
"eval_overall_accuracy": 0.9635868218974486,
"eval_overall_f1": 0.8415300546448088,
"eval_overall_precision": 0.7979274611398963,
"eval_overall_recall": 0.8901734104046243,
"eval_runtime": 0.4032,
"eval_samples_per_second": 463.799,
"eval_steps_per_second": 7.441,
"step": 4452
},
{
"epoch": 43.0,
"grad_norm": 0.08767852932214737,
"learning_rate": 2.8499999999999998e-05,
"loss": 0.0296,
"step": 4558
},
{
"epoch": 43.0,
"eval_LOCATION_f1": 0.7702702702702703,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7215189873417721,
"eval_LOCATION_recall": 0.8260869565217391,
"eval_ORGANIZATION_f1": 0.6984126984126984,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.676923076923077,
"eval_ORGANIZATION_recall": 0.7213114754098361,
"eval_PERSON_f1": 0.9269841269841269,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9012345679012346,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.787878787878788,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.16103391349315643,
"eval_overall_accuracy": 0.9660639088432004,
"eval_overall_f1": 0.8344923504867872,
"eval_overall_precision": 0.8042895442359249,
"eval_overall_recall": 0.8670520231213873,
"eval_runtime": 0.4057,
"eval_samples_per_second": 460.877,
"eval_steps_per_second": 7.394,
"step": 4558
},
{
"epoch": 44.0,
"grad_norm": 0.5797997117042542,
"learning_rate": 2.8000000000000003e-05,
"loss": 0.0271,
"step": 4664
},
{
"epoch": 44.0,
"eval_LOCATION_f1": 0.802721088435374,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7564102564102564,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6969696969696969,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.647887323943662,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9182389937106918,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8848484848484849,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1736581176519394,
"eval_overall_accuracy": 0.9625959871191478,
"eval_overall_f1": 0.837912087912088,
"eval_overall_precision": 0.7984293193717278,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.4141,
"eval_samples_per_second": 451.532,
"eval_steps_per_second": 7.244,
"step": 4664
},
{
"epoch": 45.0,
"grad_norm": 0.5857752561569214,
"learning_rate": 2.7500000000000004e-05,
"loss": 0.0257,
"step": 4770
},
{
"epoch": 45.0,
"eval_LOCATION_f1": 0.7945205479452054,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7532467532467533,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.6716417910447762,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6164383561643836,
"eval_ORGANIZATION_recall": 0.7377049180327869,
"eval_PERSON_f1": 0.9216300940438872,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8855421686746988,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.84375,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.16865137219429016,
"eval_overall_accuracy": 0.964082239286599,
"eval_overall_f1": 0.8340192043895747,
"eval_overall_precision": 0.793733681462141,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.4037,
"eval_samples_per_second": 463.213,
"eval_steps_per_second": 7.431,
"step": 4770
},
{
"epoch": 46.0,
"grad_norm": 0.6415446400642395,
"learning_rate": 2.7000000000000002e-05,
"loss": 0.0267,
"step": 4876
},
{
"epoch": 46.0,
"eval_LOCATION_f1": 0.7945205479452054,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7532467532467533,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.676470588235294,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6133333333333333,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9299363057324841,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.906832298136646,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.8181818181818182,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.84375,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.16720764338970184,
"eval_overall_accuracy": 0.9638345305920237,
"eval_overall_f1": 0.8386206896551723,
"eval_overall_precision": 0.8021108179419525,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.405,
"eval_samples_per_second": 461.732,
"eval_steps_per_second": 7.407,
"step": 4876
},
{
"epoch": 47.0,
"grad_norm": 4.307225704193115,
"learning_rate": 2.6500000000000004e-05,
"loss": 0.0243,
"step": 4982
},
{
"epoch": 47.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7631578947368421,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.7050359712230215,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6282051282051282,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.9274447949526814,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8963414634146342,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.7761194029850748,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7428571428571429,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.84375,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.17239607870578766,
"eval_overall_accuracy": 0.9643299479811741,
"eval_overall_f1": 0.8399452804377565,
"eval_overall_precision": 0.7974025974025974,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.4036,
"eval_samples_per_second": 463.275,
"eval_steps_per_second": 7.432,
"step": 4982
},
{
"epoch": 48.0,
"grad_norm": 2.830711841583252,
"learning_rate": 2.6000000000000002e-05,
"loss": 0.0245,
"step": 5088
},
{
"epoch": 48.0,
"eval_LOCATION_f1": 0.8082191780821918,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7662337662337663,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6814814814814815,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6216216216216216,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9240506329113924,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8957055214723927,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.17494605481624603,
"eval_overall_accuracy": 0.9630914045082982,
"eval_overall_f1": 0.837912087912088,
"eval_overall_precision": 0.7984293193717278,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.4037,
"eval_samples_per_second": 463.262,
"eval_steps_per_second": 7.432,
"step": 5088
},
{
"epoch": 49.0,
"grad_norm": 0.654138445854187,
"learning_rate": 2.5500000000000003e-05,
"loss": 0.0248,
"step": 5194
},
{
"epoch": 49.0,
"eval_LOCATION_f1": 0.8137931034482757,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7763157894736842,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6917293233082706,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6388888888888888,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9240506329113924,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8957055214723927,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.7761194029850748,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7428571428571429,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1652275174856186,
"eval_overall_accuracy": 0.9643299479811741,
"eval_overall_f1": 0.8386206896551723,
"eval_overall_precision": 0.8021108179419525,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.4028,
"eval_samples_per_second": 464.213,
"eval_steps_per_second": 7.447,
"step": 5194
},
{
"epoch": 50.0,
"grad_norm": 0.5925632119178772,
"learning_rate": 2.5e-05,
"loss": 0.024,
"step": 5300
},
{
"epoch": 50.0,
"eval_LOCATION_f1": 0.7972027972027972,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7702702702702703,
"eval_LOCATION_recall": 0.8260869565217391,
"eval_ORGANIZATION_f1": 0.6717557251908397,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6285714285714286,
"eval_ORGANIZATION_recall": 0.7213114754098361,
"eval_PERSON_f1": 0.9142857142857143,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8888888888888888,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.787878787878788,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1688040941953659,
"eval_overall_accuracy": 0.9621005697299975,
"eval_overall_f1": 0.8289290681502086,
"eval_overall_precision": 0.7989276139410187,
"eval_overall_recall": 0.861271676300578,
"eval_runtime": 0.4031,
"eval_samples_per_second": 463.874,
"eval_steps_per_second": 7.442,
"step": 5300
},
{
"epoch": 51.0,
"grad_norm": 0.48497816920280457,
"learning_rate": 2.45e-05,
"loss": 0.0218,
"step": 5406
},
{
"epoch": 51.0,
"eval_LOCATION_f1": 0.8356164383561644,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7922077922077922,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.704225352112676,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6172839506172839,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.9367088607594937,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9079754601226994,
"eval_PERSON_recall": 0.9673202614379085,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1846623569726944,
"eval_overall_accuracy": 0.9643299479811741,
"eval_overall_f1": 0.8505434782608696,
"eval_overall_precision": 0.8025641025641026,
"eval_overall_recall": 0.9046242774566474,
"eval_runtime": 0.4053,
"eval_samples_per_second": 461.373,
"eval_steps_per_second": 7.402,
"step": 5406
},
{
"epoch": 52.0,
"grad_norm": 1.1621553897857666,
"learning_rate": 2.4e-05,
"loss": 0.0213,
"step": 5512
},
{
"epoch": 52.0,
"eval_LOCATION_f1": 0.8356164383561644,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7922077922077922,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7123287671232876,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.611764705882353,
"eval_ORGANIZATION_recall": 0.8524590163934426,
"eval_PERSON_f1": 0.9396825396825397,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9135802469135802,
"eval_PERSON_recall": 0.9673202614379085,
"eval_QUANTITY_f1": 0.7761194029850748,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7428571428571429,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8181818181818182,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7714285714285715,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.180556520819664,
"eval_overall_accuracy": 0.9635868218974486,
"eval_overall_f1": 0.8486486486486486,
"eval_overall_precision": 0.7969543147208121,
"eval_overall_recall": 0.9075144508670521,
"eval_runtime": 0.4094,
"eval_samples_per_second": 456.723,
"eval_steps_per_second": 7.327,
"step": 5512
},
{
"epoch": 53.0,
"grad_norm": 0.4603475332260132,
"learning_rate": 2.35e-05,
"loss": 0.0201,
"step": 5618
},
{
"epoch": 53.0,
"eval_LOCATION_f1": 0.8055555555555556,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7733333333333333,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.7375886524822695,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.65,
"eval_ORGANIZATION_recall": 0.8524590163934426,
"eval_PERSON_f1": 0.9245283018867925,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8909090909090909,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.787878787878788,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.18687838315963745,
"eval_overall_accuracy": 0.9643299479811741,
"eval_overall_f1": 0.8458390177353343,
"eval_overall_precision": 0.8010335917312662,
"eval_overall_recall": 0.8959537572254336,
"eval_runtime": 0.4094,
"eval_samples_per_second": 456.771,
"eval_steps_per_second": 7.328,
"step": 5618
},
{
"epoch": 54.0,
"grad_norm": 0.3411925733089447,
"learning_rate": 2.3000000000000003e-05,
"loss": 0.02,
"step": 5724
},
{
"epoch": 54.0,
"eval_LOCATION_f1": 0.802721088435374,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7564102564102564,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.712121212121212,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6619718309859155,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.927899686520376,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.891566265060241,
"eval_PERSON_recall": 0.9673202614379085,
"eval_QUANTITY_f1": 0.8484848484848485,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.8235294117647058,
"eval_QUANTITY_recall": 0.875,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1793394833803177,
"eval_overall_accuracy": 0.9653207827594749,
"eval_overall_f1": 0.848901098901099,
"eval_overall_precision": 0.8089005235602095,
"eval_overall_recall": 0.8930635838150289,
"eval_runtime": 0.4098,
"eval_samples_per_second": 456.305,
"eval_steps_per_second": 7.32,
"step": 5724
},
{
"epoch": 55.0,
"grad_norm": 0.9535180330276489,
"learning_rate": 2.25e-05,
"loss": 0.0204,
"step": 5830
},
{
"epoch": 55.0,
"eval_LOCATION_f1": 0.8055555555555556,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7733333333333333,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.6715328467153285,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6052631578947368,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9022082018927446,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8719512195121951,
"eval_PERSON_recall": 0.934640522875817,
"eval_QUANTITY_f1": 0.7941176470588235,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.75,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8181818181818182,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7714285714285715,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1895986944437027,
"eval_overall_accuracy": 0.9603666088679713,
"eval_overall_f1": 0.8224043715846995,
"eval_overall_precision": 0.7797927461139896,
"eval_overall_recall": 0.869942196531792,
"eval_runtime": 0.4065,
"eval_samples_per_second": 459.994,
"eval_steps_per_second": 7.38,
"step": 5830
},
{
"epoch": 56.0,
"grad_norm": 0.5869280099868774,
"learning_rate": 2.2000000000000003e-05,
"loss": 0.0221,
"step": 5936
},
{
"epoch": 56.0,
"eval_LOCATION_f1": 0.8251748251748252,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7972972972972973,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6917293233082706,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6388888888888888,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.939297124600639,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.91875,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.7941176470588235,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.75,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.84375,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.17885428667068481,
"eval_overall_accuracy": 0.96556849145405,
"eval_overall_f1": 0.85,
"eval_overall_precision": 0.8181818181818182,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.4069,
"eval_samples_per_second": 459.619,
"eval_steps_per_second": 7.374,
"step": 5936
},
{
"epoch": 57.0,
"grad_norm": 1.007596492767334,
"learning_rate": 2.15e-05,
"loss": 0.0191,
"step": 6042
},
{
"epoch": 57.0,
"eval_LOCATION_f1": 0.8275862068965517,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7894736842105263,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6716417910447762,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6164383561643836,
"eval_ORGANIZATION_recall": 0.7377049180327869,
"eval_PERSON_f1": 0.9333333333333333,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9074074074074074,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.7761194029850748,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7428571428571429,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.84375,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.18730428814888,
"eval_overall_accuracy": 0.9633391132028735,
"eval_overall_f1": 0.8425414364640884,
"eval_overall_precision": 0.8068783068783069,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.4082,
"eval_samples_per_second": 458.124,
"eval_steps_per_second": 7.35,
"step": 6042
},
{
"epoch": 58.0,
"grad_norm": 0.05349158123135567,
"learning_rate": 2.1e-05,
"loss": 0.0184,
"step": 6148
},
{
"epoch": 58.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7631578947368421,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.6715328467153285,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6052631578947368,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9216300940438872,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8855421686746988,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.84375,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1908842921257019,
"eval_overall_accuracy": 0.9623482784245727,
"eval_overall_f1": 0.8344733242134064,
"eval_overall_precision": 0.7922077922077922,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.4093,
"eval_samples_per_second": 456.924,
"eval_steps_per_second": 7.33,
"step": 6148
},
{
"epoch": 59.0,
"grad_norm": 0.5943154692649841,
"learning_rate": 2.05e-05,
"loss": 0.0173,
"step": 6254
},
{
"epoch": 59.0,
"eval_LOCATION_f1": 0.8333333333333333,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6617647058823529,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6,
"eval_ORGANIZATION_recall": 0.7377049180327869,
"eval_PERSON_f1": 0.9211356466876972,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8902439024390244,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8181818181818182,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7714285714285715,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.19820117950439453,
"eval_overall_accuracy": 0.9618528610354223,
"eval_overall_f1": 0.8356164383561644,
"eval_overall_precision": 0.7942708333333334,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.4065,
"eval_samples_per_second": 460.074,
"eval_steps_per_second": 7.381,
"step": 6254
},
{
"epoch": 60.0,
"grad_norm": 0.6145533323287964,
"learning_rate": 2e-05,
"loss": 0.018,
"step": 6360
},
{
"epoch": 60.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7631578947368421,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.6853146853146853,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.5975609756097561,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.9125,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.874251497005988,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.8181818181818182,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.202591672539711,
"eval_overall_accuracy": 0.9623482784245727,
"eval_overall_f1": 0.8319783197831978,
"eval_overall_precision": 0.7831632653061225,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.4085,
"eval_samples_per_second": 457.796,
"eval_steps_per_second": 7.344,
"step": 6360
},
{
"epoch": 61.0,
"grad_norm": 1.8163769245147705,
"learning_rate": 1.9500000000000003e-05,
"loss": 0.0174,
"step": 6466
},
{
"epoch": 61.0,
"eval_LOCATION_f1": 0.8028169014084506,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7808219178082192,
"eval_LOCATION_recall": 0.8260869565217391,
"eval_ORGANIZATION_f1": 0.6929133858267716,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.7213114754098361,
"eval_PERSON_f1": 0.9201277955271565,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.18250833451747894,
"eval_overall_accuracy": 0.9653207827594749,
"eval_overall_f1": 0.8387096774193549,
"eval_overall_precision": 0.8147138964577657,
"eval_overall_recall": 0.8641618497109826,
"eval_runtime": 0.4055,
"eval_samples_per_second": 461.15,
"eval_steps_per_second": 7.398,
"step": 6466
},
{
"epoch": 62.0,
"grad_norm": 0.7063648104667664,
"learning_rate": 1.9e-05,
"loss": 0.0159,
"step": 6572
},
{
"epoch": 62.0,
"eval_LOCATION_f1": 0.8299319727891156,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.782051282051282,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.6713286713286712,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.5853658536585366,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.915360501567398,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8795180722891566,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.787878787878788,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.875,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8484848484848485,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.20766791701316833,
"eval_overall_accuracy": 0.9630914045082982,
"eval_overall_f1": 0.8362652232746955,
"eval_overall_precision": 0.7862595419847328,
"eval_overall_recall": 0.8930635838150289,
"eval_runtime": 0.4037,
"eval_samples_per_second": 463.189,
"eval_steps_per_second": 7.431,
"step": 6572
},
{
"epoch": 63.0,
"grad_norm": 0.06240615248680115,
"learning_rate": 1.85e-05,
"loss": 0.0159,
"step": 6678
},
{
"epoch": 63.0,
"eval_LOCATION_f1": 0.8251748251748252,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7972972972972973,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.676470588235294,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6133333333333333,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9274447949526814,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8963414634146342,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.7761194029850748,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7428571428571429,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8484848484848486,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.20551708340644836,
"eval_overall_accuracy": 0.9623482784245727,
"eval_overall_f1": 0.839506172839506,
"eval_overall_precision": 0.7989556135770235,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.4048,
"eval_samples_per_second": 461.929,
"eval_steps_per_second": 7.411,
"step": 6678
},
{
"epoch": 64.0,
"grad_norm": 3.2396926879882812,
"learning_rate": 1.8e-05,
"loss": 0.0151,
"step": 6784
},
{
"epoch": 64.0,
"eval_LOCATION_f1": 0.8356164383561644,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7922077922077922,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.6857142857142857,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6075949367088608,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9396825396825397,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9135802469135802,
"eval_PERSON_recall": 0.9673202614379085,
"eval_QUANTITY_f1": 0.7941176470588235,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.75,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.20788374543190002,
"eval_overall_accuracy": 0.9625959871191478,
"eval_overall_f1": 0.8485675306957707,
"eval_overall_precision": 0.8036175710594315,
"eval_overall_recall": 0.8988439306358381,
"eval_runtime": 0.4028,
"eval_samples_per_second": 464.3,
"eval_steps_per_second": 7.449,
"step": 6784
},
{
"epoch": 65.0,
"grad_norm": 0.9956832528114319,
"learning_rate": 1.75e-05,
"loss": 0.0162,
"step": 6890
},
{
"epoch": 65.0,
"eval_LOCATION_f1": 0.821917808219178,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7792207792207793,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6715328467153285,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6052631578947368,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9211356466876972,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8902439024390244,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.8181818181818182,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.19509576261043549,
"eval_overall_accuracy": 0.9643299479811741,
"eval_overall_f1": 0.8383561643835618,
"eval_overall_precision": 0.796875,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.4029,
"eval_samples_per_second": 464.164,
"eval_steps_per_second": 7.446,
"step": 6890
},
{
"epoch": 66.0,
"grad_norm": 0.5994267463684082,
"learning_rate": 1.7000000000000003e-05,
"loss": 0.0149,
"step": 6996
},
{
"epoch": 66.0,
"eval_LOCATION_f1": 0.8299319727891156,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.782051282051282,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.6865671641791045,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6301369863013698,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9274447949526814,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8963414634146342,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.787878787878788,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.835820895522388,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7777777777777778,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.20032353699207306,
"eval_overall_accuracy": 0.9650730740648997,
"eval_overall_f1": 0.8426812585499317,
"eval_overall_precision": 0.8,
"eval_overall_recall": 0.8901734104046243,
"eval_runtime": 0.4012,
"eval_samples_per_second": 466.119,
"eval_steps_per_second": 7.478,
"step": 6996
},
{
"epoch": 67.0,
"grad_norm": 0.22768262028694153,
"learning_rate": 1.65e-05,
"loss": 0.0155,
"step": 7102
},
{
"epoch": 67.0,
"eval_LOCATION_f1": 0.7945205479452054,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7532467532467533,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.6717557251908397,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6285714285714286,
"eval_ORGANIZATION_recall": 0.7213114754098361,
"eval_PERSON_f1": 0.9337539432176657,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9024390243902439,
"eval_PERSON_recall": 0.9673202614379085,
"eval_QUANTITY_f1": 0.7761194029850748,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7428571428571429,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.2013421654701233,
"eval_overall_accuracy": 0.9625959871191478,
"eval_overall_f1": 0.8347107438016529,
"eval_overall_precision": 0.7973684210526316,
"eval_overall_recall": 0.8757225433526011,
"eval_runtime": 0.4059,
"eval_samples_per_second": 460.723,
"eval_steps_per_second": 7.391,
"step": 7102
},
{
"epoch": 68.0,
"grad_norm": 0.4733757972717285,
"learning_rate": 1.6000000000000003e-05,
"loss": 0.0147,
"step": 7208
},
{
"epoch": 68.0,
"eval_LOCATION_f1": 0.8082191780821918,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7662337662337663,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6769230769230768,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6376811594202898,
"eval_ORGANIZATION_recall": 0.7213114754098361,
"eval_PERSON_f1": 0.9216300940438872,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8855421686746988,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.8181818181818182,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.20686639845371246,
"eval_overall_accuracy": 0.9628436958137231,
"eval_overall_f1": 0.8386206896551723,
"eval_overall_precision": 0.8021108179419525,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.4015,
"eval_samples_per_second": 465.784,
"eval_steps_per_second": 7.472,
"step": 7208
},
{
"epoch": 69.0,
"grad_norm": 0.21161212027072906,
"learning_rate": 1.55e-05,
"loss": 0.0139,
"step": 7314
},
{
"epoch": 69.0,
"eval_LOCATION_f1": 0.8275862068965517,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7894736842105263,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6917293233082706,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6388888888888888,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9269841269841269,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9012345679012346,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.787878787878788,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.19644662737846375,
"eval_overall_accuracy": 0.9653207827594749,
"eval_overall_f1": 0.8437067773167358,
"eval_overall_precision": 0.8090185676392573,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.4039,
"eval_samples_per_second": 462.998,
"eval_steps_per_second": 7.428,
"step": 7314
},
{
"epoch": 70.0,
"grad_norm": 1.607442021369934,
"learning_rate": 1.5e-05,
"loss": 0.0141,
"step": 7420
},
{
"epoch": 70.0,
"eval_LOCATION_f1": 0.8082191780821918,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7662337662337663,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6976744186046512,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6617647058823529,
"eval_ORGANIZATION_recall": 0.7377049180327869,
"eval_PERSON_f1": 0.9211356466876972,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8902439024390244,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.8484848484848485,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.8235294117647058,
"eval_QUANTITY_recall": 0.875,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.84375,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.20234768092632294,
"eval_overall_accuracy": 0.9643299479811741,
"eval_overall_f1": 0.8460471567267683,
"eval_overall_precision": 0.8133333333333334,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.4064,
"eval_samples_per_second": 460.185,
"eval_steps_per_second": 7.383,
"step": 7420
},
{
"epoch": 71.0,
"grad_norm": 0.20785416662693024,
"learning_rate": 1.45e-05,
"loss": 0.0136,
"step": 7526
},
{
"epoch": 71.0,
"eval_LOCATION_f1": 0.802721088435374,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7564102564102564,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6917293233082706,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6388888888888888,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9182389937106918,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8848484848484849,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.8181818181818182,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.20758448541164398,
"eval_overall_accuracy": 0.9643299479811741,
"eval_overall_f1": 0.837912087912088,
"eval_overall_precision": 0.7984293193717278,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.4107,
"eval_samples_per_second": 455.343,
"eval_steps_per_second": 7.305,
"step": 7526
},
{
"epoch": 72.0,
"grad_norm": 1.7999894618988037,
"learning_rate": 1.4000000000000001e-05,
"loss": 0.0135,
"step": 7632
},
{
"epoch": 72.0,
"eval_LOCATION_f1": 0.802721088435374,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7564102564102564,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6818181818181818,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6338028169014085,
"eval_ORGANIZATION_recall": 0.7377049180327869,
"eval_PERSON_f1": 0.9240506329113924,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8957055214723927,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.8484848484848485,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.8235294117647058,
"eval_QUANTITY_recall": 0.875,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.20112010836601257,
"eval_overall_accuracy": 0.9645776566757494,
"eval_overall_f1": 0.8413793103448276,
"eval_overall_precision": 0.8047493403693932,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.409,
"eval_samples_per_second": 457.258,
"eval_steps_per_second": 7.336,
"step": 7632
},
{
"epoch": 73.0,
"grad_norm": 0.046665601432323456,
"learning_rate": 1.3500000000000001e-05,
"loss": 0.0114,
"step": 7738
},
{
"epoch": 73.0,
"eval_LOCATION_f1": 0.821917808219178,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7792207792207793,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6923076923076924,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6521739130434783,
"eval_ORGANIZATION_recall": 0.7377049180327869,
"eval_PERSON_f1": 0.9303797468354431,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.901840490797546,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.8484848484848485,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.8235294117647058,
"eval_QUANTITY_recall": 0.875,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.20439833402633667,
"eval_overall_accuracy": 0.966807034926926,
"eval_overall_f1": 0.850415512465374,
"eval_overall_precision": 0.8164893617021277,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.4081,
"eval_samples_per_second": 458.248,
"eval_steps_per_second": 7.352,
"step": 7738
},
{
"epoch": 74.0,
"grad_norm": 0.4319368600845337,
"learning_rate": 1.3000000000000001e-05,
"loss": 0.0124,
"step": 7844
},
{
"epoch": 74.0,
"eval_LOCATION_f1": 0.821917808219178,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7792207792207793,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6766917293233082,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.625,
"eval_ORGANIZATION_recall": 0.7377049180327869,
"eval_PERSON_f1": 0.9303797468354431,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.901840490797546,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.8181818181818182,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8615384615384616,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8235294117647058,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.2058665156364441,
"eval_overall_accuracy": 0.9658162001486252,
"eval_overall_f1": 0.8457300275482094,
"eval_overall_precision": 0.8078947368421052,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.4093,
"eval_samples_per_second": 456.88,
"eval_steps_per_second": 7.33,
"step": 7844
},
{
"epoch": 75.0,
"grad_norm": 0.46784916520118713,
"learning_rate": 1.25e-05,
"loss": 0.0113,
"step": 7950
},
{
"epoch": 75.0,
"eval_LOCATION_f1": 0.8163265306122449,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7692307692307693,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6716417910447762,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6164383561643836,
"eval_ORGANIZATION_recall": 0.7377049180327869,
"eval_PERSON_f1": 0.9211356466876972,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8902439024390244,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.8181818181818182,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.21380963921546936,
"eval_overall_accuracy": 0.9648253653703245,
"eval_overall_f1": 0.8367626886145405,
"eval_overall_precision": 0.7963446475195822,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.4037,
"eval_samples_per_second": 463.253,
"eval_steps_per_second": 7.432,
"step": 7950
},
{
"epoch": 76.0,
"grad_norm": 0.5961441397666931,
"learning_rate": 1.2e-05,
"loss": 0.0126,
"step": 8056
},
{
"epoch": 76.0,
"eval_LOCATION_f1": 0.8243243243243245,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.6766917293233082,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.625,
"eval_ORGANIZATION_recall": 0.7377049180327869,
"eval_PERSON_f1": 0.9211356466876972,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8902439024390244,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.8484848484848485,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.8235294117647058,
"eval_QUANTITY_recall": 0.875,
"eval_TIME_f1": 0.8484848484848486,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.21406003832817078,
"eval_overall_accuracy": 0.9638345305920237,
"eval_overall_f1": 0.8438356164383563,
"eval_overall_precision": 0.8020833333333334,
"eval_overall_recall": 0.8901734104046243,
"eval_runtime": 0.4046,
"eval_samples_per_second": 462.204,
"eval_steps_per_second": 7.415,
"step": 8056
},
{
"epoch": 77.0,
"grad_norm": 0.5828773975372314,
"learning_rate": 1.1500000000000002e-05,
"loss": 0.0116,
"step": 8162
},
{
"epoch": 77.0,
"eval_LOCATION_f1": 0.8194444444444444,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7866666666666666,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6870229007633588,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6428571428571429,
"eval_ORGANIZATION_recall": 0.7377049180327869,
"eval_PERSON_f1": 0.9333333333333333,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9074074074074074,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.8484848484848485,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.8235294117647058,
"eval_QUANTITY_recall": 0.875,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.21130701899528503,
"eval_overall_accuracy": 0.9653207827594749,
"eval_overall_f1": 0.8488210818307905,
"eval_overall_precision": 0.816,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.404,
"eval_samples_per_second": 462.856,
"eval_steps_per_second": 7.426,
"step": 8162
},
{
"epoch": 78.0,
"grad_norm": 0.6764857769012451,
"learning_rate": 1.1000000000000001e-05,
"loss": 0.0126,
"step": 8268
},
{
"epoch": 78.0,
"eval_LOCATION_f1": 0.8356164383561644,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7922077922077922,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.6962962962962963,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6351351351351351,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.9245283018867925,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8909090909090909,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.8484848484848485,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.8235294117647058,
"eval_QUANTITY_recall": 0.875,
"eval_TIME_f1": 0.7941176470588235,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7297297297297297,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.21255819499492645,
"eval_overall_accuracy": 0.9653207827594749,
"eval_overall_f1": 0.8458390177353343,
"eval_overall_precision": 0.8010335917312662,
"eval_overall_recall": 0.8959537572254336,
"eval_runtime": 0.4082,
"eval_samples_per_second": 458.124,
"eval_steps_per_second": 7.35,
"step": 8268
},
{
"epoch": 79.0,
"grad_norm": 0.38964611291885376,
"learning_rate": 1.05e-05,
"loss": 0.0123,
"step": 8374
},
{
"epoch": 79.0,
"eval_LOCATION_f1": 0.8251748251748252,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7972972972972973,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.682170542635659,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6470588235294118,
"eval_ORGANIZATION_recall": 0.7213114754098361,
"eval_PERSON_f1": 0.9303797468354431,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.901840490797546,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.8484848484848485,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.8235294117647058,
"eval_QUANTITY_recall": 0.875,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.20355309545993805,
"eval_overall_accuracy": 0.966807034926926,
"eval_overall_f1": 0.8495821727019499,
"eval_overall_precision": 0.8198924731182796,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.4033,
"eval_samples_per_second": 463.657,
"eval_steps_per_second": 7.438,
"step": 8374
},
{
"epoch": 80.0,
"grad_norm": 0.3479403257369995,
"learning_rate": 1e-05,
"loss": 0.0121,
"step": 8480
},
{
"epoch": 80.0,
"eval_LOCATION_f1": 0.8299319727891156,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.782051282051282,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.6715328467153285,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6052631578947368,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9269841269841269,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9012345679012346,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.8181818181818182,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.21020622551441193,
"eval_overall_accuracy": 0.9635868218974486,
"eval_overall_f1": 0.8422496570644717,
"eval_overall_precision": 0.8015665796344648,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.4048,
"eval_samples_per_second": 461.968,
"eval_steps_per_second": 7.411,
"step": 8480
},
{
"epoch": 81.0,
"grad_norm": 0.370176762342453,
"learning_rate": 9.5e-06,
"loss": 0.0104,
"step": 8586
},
{
"epoch": 81.0,
"eval_LOCATION_f1": 0.8356164383561644,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7922077922077922,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.6766917293233082,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.625,
"eval_ORGANIZATION_recall": 0.7377049180327869,
"eval_PERSON_f1": 0.9269841269841269,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9012345679012346,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.7941176470588235,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.75,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.21465693414211273,
"eval_overall_accuracy": 0.9633391132028735,
"eval_overall_f1": 0.8418156808803301,
"eval_overall_precision": 0.8031496062992126,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.4029,
"eval_samples_per_second": 464.107,
"eval_steps_per_second": 7.446,
"step": 8586
},
{
"epoch": 82.0,
"grad_norm": 0.28365227580070496,
"learning_rate": 9e-06,
"loss": 0.0108,
"step": 8692
},
{
"epoch": 82.0,
"eval_LOCATION_f1": 0.8356164383561644,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7922077922077922,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.6715328467153285,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6052631578947368,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9303797468354431,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.901840490797546,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.7941176470588235,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.75,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8181818181818182,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7714285714285715,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.22350215911865234,
"eval_overall_accuracy": 0.9618528610354223,
"eval_overall_f1": 0.8403819918144612,
"eval_overall_precision": 0.7958656330749354,
"eval_overall_recall": 0.8901734104046243,
"eval_runtime": 0.4037,
"eval_samples_per_second": 463.167,
"eval_steps_per_second": 7.43,
"step": 8692
},
{
"epoch": 83.0,
"grad_norm": 0.8675772547721863,
"learning_rate": 8.500000000000002e-06,
"loss": 0.0105,
"step": 8798
},
{
"epoch": 83.0,
"eval_LOCATION_f1": 0.8082191780821918,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7662337662337663,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6818181818181818,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6338028169014085,
"eval_ORGANIZATION_recall": 0.7377049180327869,
"eval_PERSON_f1": 0.9333333333333333,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9074074074074074,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.8181818181818182,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.21032676100730896,
"eval_overall_accuracy": 0.9645776566757494,
"eval_overall_f1": 0.8437067773167358,
"eval_overall_precision": 0.8090185676392573,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.4035,
"eval_samples_per_second": 463.458,
"eval_steps_per_second": 7.435,
"step": 8798
},
{
"epoch": 84.0,
"grad_norm": 2.7571957111358643,
"learning_rate": 8.000000000000001e-06,
"loss": 0.0107,
"step": 8904
},
{
"epoch": 84.0,
"eval_LOCATION_f1": 0.8082191780821918,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7662337662337663,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6870229007633588,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6428571428571429,
"eval_ORGANIZATION_recall": 0.7377049180327869,
"eval_PERSON_f1": 0.9363057324840764,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9130434782608695,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.7941176470588235,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.75,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.21551497280597687,
"eval_overall_accuracy": 0.9648253653703245,
"eval_overall_f1": 0.8425414364640884,
"eval_overall_precision": 0.8068783068783069,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.4034,
"eval_samples_per_second": 463.566,
"eval_steps_per_second": 7.437,
"step": 8904
},
{
"epoch": 85.0,
"grad_norm": 0.0661739706993103,
"learning_rate": 7.5e-06,
"loss": 0.0103,
"step": 9010
},
{
"epoch": 85.0,
"eval_LOCATION_f1": 0.8108108108108109,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.759493670886076,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6818181818181818,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6338028169014085,
"eval_ORGANIZATION_recall": 0.7377049180327869,
"eval_PERSON_f1": 0.9240506329113924,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8957055214723927,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.8181818181818182,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8181818181818182,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7714285714285715,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.2167329490184784,
"eval_overall_accuracy": 0.9643299479811741,
"eval_overall_f1": 0.837912087912088,
"eval_overall_precision": 0.7984293193717278,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.4057,
"eval_samples_per_second": 460.971,
"eval_steps_per_second": 7.395,
"step": 9010
},
{
"epoch": 86.0,
"grad_norm": 1.5372931957244873,
"learning_rate": 7.000000000000001e-06,
"loss": 0.01,
"step": 9116
},
{
"epoch": 86.0,
"eval_LOCATION_f1": 0.8243243243243245,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.676470588235294,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6133333333333333,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9211356466876972,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8902439024390244,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.8181818181818182,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8059701492537312,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.22136247158050537,
"eval_overall_accuracy": 0.964082239286599,
"eval_overall_f1": 0.8365122615803814,
"eval_overall_precision": 0.7912371134020618,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.4055,
"eval_samples_per_second": 461.202,
"eval_steps_per_second": 7.399,
"step": 9116
},
{
"epoch": 87.0,
"grad_norm": 0.7345579266548157,
"learning_rate": 6.5000000000000004e-06,
"loss": 0.0101,
"step": 9222
},
{
"epoch": 87.0,
"eval_LOCATION_f1": 0.8243243243243245,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.6865671641791045,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6301369863013698,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9240506329113924,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8957055214723927,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.8181818181818182,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8059701492537312,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.215372234582901,
"eval_overall_accuracy": 0.964082239286599,
"eval_overall_f1": 0.8399452804377565,
"eval_overall_precision": 0.7974025974025974,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.4065,
"eval_samples_per_second": 460.02,
"eval_steps_per_second": 7.38,
"step": 9222
},
{
"epoch": 88.0,
"grad_norm": 0.02773982100188732,
"learning_rate": 6e-06,
"loss": 0.0112,
"step": 9328
},
{
"epoch": 88.0,
"eval_LOCATION_f1": 0.8243243243243245,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.6814814814814815,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6216216216216216,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9333333333333333,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9074074074074074,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.8181818181818182,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8181818181818182,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7714285714285715,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.21471378207206726,
"eval_overall_accuracy": 0.9650730740648997,
"eval_overall_f1": 0.8438356164383563,
"eval_overall_precision": 0.8020833333333334,
"eval_overall_recall": 0.8901734104046243,
"eval_runtime": 0.4027,
"eval_samples_per_second": 464.317,
"eval_steps_per_second": 7.449,
"step": 9328
},
{
"epoch": 89.0,
"grad_norm": 1.2374390363693237,
"learning_rate": 5.500000000000001e-06,
"loss": 0.0111,
"step": 9434
},
{
"epoch": 89.0,
"eval_LOCATION_f1": 0.8243243243243245,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.6818181818181818,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6338028169014085,
"eval_ORGANIZATION_recall": 0.7377049180327869,
"eval_PERSON_f1": 0.9240506329113924,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8957055214723927,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.8181818181818182,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8181818181818182,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7714285714285715,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.21400561928749084,
"eval_overall_accuracy": 0.9648253653703245,
"eval_overall_f1": 0.8406593406593407,
"eval_overall_precision": 0.8010471204188482,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.4029,
"eval_samples_per_second": 464.12,
"eval_steps_per_second": 7.446,
"step": 9434
},
{
"epoch": 90.0,
"grad_norm": 0.09918837249279022,
"learning_rate": 5e-06,
"loss": 0.0098,
"step": 9540
},
{
"epoch": 90.0,
"eval_LOCATION_f1": 0.8108108108108109,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.759493670886076,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7014925373134328,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6438356164383562,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.9206349206349207,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8950617283950617,
"eval_PERSON_recall": 0.9477124183006536,
"eval_QUANTITY_f1": 0.8181818181818182,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8181818181818182,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7714285714285715,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.22259807586669922,
"eval_overall_accuracy": 0.9638345305920237,
"eval_overall_f1": 0.839506172839506,
"eval_overall_precision": 0.7989556135770235,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.4017,
"eval_samples_per_second": 465.48,
"eval_steps_per_second": 7.468,
"step": 9540
},
{
"epoch": 91.0,
"grad_norm": 0.10904386639595032,
"learning_rate": 4.5e-06,
"loss": 0.0099,
"step": 9646
},
{
"epoch": 91.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7631578947368421,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.712121212121212,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6619718309859155,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.9333333333333333,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9074074074074074,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.8181818181818182,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.21591398119926453,
"eval_overall_accuracy": 0.9658162001486252,
"eval_overall_f1": 0.8476454293628809,
"eval_overall_precision": 0.8138297872340425,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.4022,
"eval_samples_per_second": 464.95,
"eval_steps_per_second": 7.459,
"step": 9646
},
{
"epoch": 92.0,
"grad_norm": 3.4749605655670166,
"learning_rate": 4.000000000000001e-06,
"loss": 0.0102,
"step": 9752
},
{
"epoch": 92.0,
"eval_LOCATION_f1": 0.8163265306122449,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7692307692307693,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.712121212121212,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6619718309859155,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.9303797468354431,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.901840490797546,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.8181818181818182,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.22017474472522736,
"eval_overall_accuracy": 0.9665593262323507,
"eval_overall_f1": 0.8484848484848484,
"eval_overall_precision": 0.8105263157894737,
"eval_overall_recall": 0.8901734104046243,
"eval_runtime": 0.4038,
"eval_samples_per_second": 463.073,
"eval_steps_per_second": 7.429,
"step": 9752
},
{
"epoch": 93.0,
"grad_norm": 0.8946192860603333,
"learning_rate": 3.5000000000000004e-06,
"loss": 0.0096,
"step": 9858
},
{
"epoch": 93.0,
"eval_LOCATION_f1": 0.8163265306122449,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7692307692307693,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6969696969696969,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.647887323943662,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9240506329113924,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8957055214723927,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.8181818181818182,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8181818181818182,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7714285714285715,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.22221431136131287,
"eval_overall_accuracy": 0.9650730740648997,
"eval_overall_f1": 0.8418156808803301,
"eval_overall_precision": 0.8031496062992126,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.4021,
"eval_samples_per_second": 465.113,
"eval_steps_per_second": 7.462,
"step": 9858
},
{
"epoch": 94.0,
"grad_norm": 0.0954521968960762,
"learning_rate": 3e-06,
"loss": 0.0092,
"step": 9964
},
{
"epoch": 94.0,
"eval_LOCATION_f1": 0.8108108108108109,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.759493670886076,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6865671641791045,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6301369863013698,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9240506329113924,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8957055214723927,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.8181818181818182,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8181818181818182,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7714285714285715,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.22241780161857605,
"eval_overall_accuracy": 0.9645776566757494,
"eval_overall_f1": 0.8383561643835618,
"eval_overall_precision": 0.796875,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.4033,
"eval_samples_per_second": 463.727,
"eval_steps_per_second": 7.439,
"step": 9964
},
{
"epoch": 95.0,
"grad_norm": 1.271582007408142,
"learning_rate": 2.5e-06,
"loss": 0.0087,
"step": 10070
},
{
"epoch": 95.0,
"eval_LOCATION_f1": 0.8082191780821918,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7662337662337663,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6917293233082706,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6388888888888888,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9240506329113924,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8957055214723927,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.8181818181818182,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.22204293310642242,
"eval_overall_accuracy": 0.9650730740648997,
"eval_overall_f1": 0.8402203856749312,
"eval_overall_precision": 0.8026315789473685,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.4038,
"eval_samples_per_second": 463.133,
"eval_steps_per_second": 7.43,
"step": 10070
},
{
"epoch": 96.0,
"grad_norm": 0.26876676082611084,
"learning_rate": 2.0000000000000003e-06,
"loss": 0.0084,
"step": 10176
},
{
"epoch": 96.0,
"eval_LOCATION_f1": 0.8163265306122449,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7692307692307693,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6865671641791045,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6301369863013698,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9240506329113924,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8957055214723927,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.8181818181818182,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.2239730805158615,
"eval_overall_accuracy": 0.9650730740648997,
"eval_overall_f1": 0.8406593406593407,
"eval_overall_precision": 0.8010471204188482,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.4038,
"eval_samples_per_second": 463.148,
"eval_steps_per_second": 7.43,
"step": 10176
},
{
"epoch": 97.0,
"grad_norm": 1.1765313148498535,
"learning_rate": 1.5e-06,
"loss": 0.0087,
"step": 10282
},
{
"epoch": 97.0,
"eval_LOCATION_f1": 0.8163265306122449,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7692307692307693,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6917293233082706,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6388888888888888,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9240506329113924,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8957055214723927,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.8181818181818182,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.22398912906646729,
"eval_overall_accuracy": 0.9645776566757494,
"eval_overall_f1": 0.8418156808803301,
"eval_overall_precision": 0.8031496062992126,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.4018,
"eval_samples_per_second": 465.353,
"eval_steps_per_second": 7.466,
"step": 10282
},
{
"epoch": 98.0,
"grad_norm": 0.07008544355630875,
"learning_rate": 1.0000000000000002e-06,
"loss": 0.0088,
"step": 10388
},
{
"epoch": 98.0,
"eval_LOCATION_f1": 0.8163265306122449,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7692307692307693,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6917293233082706,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6388888888888888,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9240506329113924,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8957055214723927,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.8181818181818182,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8181818181818182,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7714285714285715,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.2226743996143341,
"eval_overall_accuracy": 0.9648253653703245,
"eval_overall_f1": 0.8406593406593407,
"eval_overall_precision": 0.8010471204188482,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.4033,
"eval_samples_per_second": 463.678,
"eval_steps_per_second": 7.439,
"step": 10388
},
{
"epoch": 99.0,
"grad_norm": 0.22727848589420319,
"learning_rate": 5.000000000000001e-07,
"loss": 0.0086,
"step": 10494
},
{
"epoch": 99.0,
"eval_LOCATION_f1": 0.821917808219178,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7792207792207793,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6865671641791045,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6301369863013698,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9240506329113924,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8957055214723927,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.8181818181818182,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.22218792140483856,
"eval_overall_accuracy": 0.9648253653703245,
"eval_overall_f1": 0.8418156808803301,
"eval_overall_precision": 0.8031496062992126,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.4019,
"eval_samples_per_second": 465.321,
"eval_steps_per_second": 7.465,
"step": 10494
},
{
"epoch": 100.0,
"grad_norm": 0.21861711144447327,
"learning_rate": 0.0,
"loss": 0.0084,
"step": 10600
},
{
"epoch": 100.0,
"eval_LOCATION_f1": 0.821917808219178,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7792207792207793,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6865671641791045,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6301369863013698,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9240506329113924,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8957055214723927,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.8181818181818182,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.22297325730323792,
"eval_overall_accuracy": 0.9650730740648997,
"eval_overall_f1": 0.8418156808803301,
"eval_overall_precision": 0.8031496062992126,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.4008,
"eval_samples_per_second": 466.564,
"eval_steps_per_second": 7.485,
"step": 10600
},
{
"epoch": 100.0,
"step": 10600,
"total_flos": 5154303869081070.0,
"train_loss": 0.05378503026827326,
"train_runtime": 976.0836,
"train_samples_per_second": 172.834,
"train_steps_per_second": 10.86
}
],
"logging_steps": 500,
"max_steps": 10600,
"num_input_tokens_seen": 0,
"num_train_epochs": 100,
"save_steps": 500,
"total_flos": 5154303869081070.0,
"train_batch_size": 16,
"trial_name": null,
"trial_params": null
}