nerugm-base-0 / trainer_state.json
apwic's picture
End of training
bc0c299 verified
raw
history blame
No virus
144 kB
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 100.0,
"eval_steps": 500,
"global_step": 10600,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"grad_norm": 3.8788857460021973,
"learning_rate": 4.9500000000000004e-05,
"loss": 0.3599,
"step": 106
},
{
"epoch": 1.0,
"eval_LOCATION_f1": 0.8356164383561644,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7922077922077922,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.512396694214876,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.49206349206349204,
"eval_ORGANIZATION_recall": 0.5344827586206896,
"eval_PERSON_f1": 0.8625,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8214285714285714,
"eval_PERSON_recall": 0.9078947368421053,
"eval_QUANTITY_f1": 0.6666666666666666,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6363636363636364,
"eval_QUANTITY_recall": 0.7,
"eval_TIME_f1": 0.8524590163934426,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.1317242681980133,
"eval_overall_accuracy": 0.9569782330345711,
"eval_overall_f1": 0.7791842475386779,
"eval_overall_precision": 0.7426273458445041,
"eval_overall_recall": 0.8195266272189349,
"eval_runtime": 0.659,
"eval_samples_per_second": 283.783,
"eval_steps_per_second": 4.553,
"step": 106
},
{
"epoch": 2.0,
"grad_norm": 2.0066733360290527,
"learning_rate": 4.9e-05,
"loss": 0.1201,
"step": 212
},
{
"epoch": 2.0,
"eval_LOCATION_f1": 0.8053691275167786,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7230769230769231,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6527777777777778,
"eval_ORGANIZATION_recall": 0.8103448275862069,
"eval_PERSON_f1": 0.8860759493670887,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8536585365853658,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.6,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.525,
"eval_QUANTITY_recall": 0.7,
"eval_TIME_f1": 0.75,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.6857142857142857,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.14421768486499786,
"eval_overall_accuracy": 0.9580025608194622,
"eval_overall_f1": 0.8010973936899862,
"eval_overall_precision": 0.7468030690537084,
"eval_overall_recall": 0.863905325443787,
"eval_runtime": 0.6779,
"eval_samples_per_second": 275.835,
"eval_steps_per_second": 4.425,
"step": 212
},
{
"epoch": 3.0,
"grad_norm": 4.826297760009766,
"learning_rate": 4.85e-05,
"loss": 0.0789,
"step": 318
},
{
"epoch": 3.0,
"eval_LOCATION_f1": 0.8051948051948051,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7294117647058823,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.7218045112781956,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.64,
"eval_ORGANIZATION_recall": 0.8275862068965517,
"eval_PERSON_f1": 0.852760736196319,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.7988505747126436,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.8307692307692307,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.9,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.15757465362548828,
"eval_overall_accuracy": 0.954673495518566,
"eval_overall_f1": 0.819538670284939,
"eval_overall_precision": 0.7568922305764411,
"eval_overall_recall": 0.893491124260355,
"eval_runtime": 0.7577,
"eval_samples_per_second": 246.801,
"eval_steps_per_second": 3.959,
"step": 318
},
{
"epoch": 4.0,
"grad_norm": 1.5358341932296753,
"learning_rate": 4.8e-05,
"loss": 0.0497,
"step": 424
},
{
"epoch": 4.0,
"eval_LOCATION_f1": 0.8243243243243245,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.765625,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7,
"eval_ORGANIZATION_recall": 0.8448275862068966,
"eval_PERSON_f1": 0.8980891719745223,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8703703703703703,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.8125,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.75,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.6857142857142857,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.15764029324054718,
"eval_overall_accuracy": 0.9628681177976952,
"eval_overall_f1": 0.8384401114206129,
"eval_overall_precision": 0.7921052631578948,
"eval_overall_recall": 0.8905325443786982,
"eval_runtime": 0.6908,
"eval_samples_per_second": 270.686,
"eval_steps_per_second": 4.343,
"step": 424
},
{
"epoch": 5.0,
"grad_norm": 0.8067348003387451,
"learning_rate": 4.75e-05,
"loss": 0.0304,
"step": 530
},
{
"epoch": 5.0,
"eval_LOCATION_f1": 0.8591549295774648,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8356164383561644,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.6554621848739496,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.639344262295082,
"eval_ORGANIZATION_recall": 0.6724137931034483,
"eval_PERSON_f1": 0.8681672025723474,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8490566037735849,
"eval_PERSON_recall": 0.8881578947368421,
"eval_QUANTITY_f1": 0.8125,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8620689655172413,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.18078266084194183,
"eval_overall_accuracy": 0.9603072983354674,
"eval_overall_f1": 0.8242074927953891,
"eval_overall_precision": 0.8033707865168539,
"eval_overall_recall": 0.8461538461538461,
"eval_runtime": 0.7144,
"eval_samples_per_second": 261.763,
"eval_steps_per_second": 4.199,
"step": 530
},
{
"epoch": 6.0,
"grad_norm": 2.896883010864258,
"learning_rate": 4.7e-05,
"loss": 0.0258,
"step": 636
},
{
"epoch": 6.0,
"eval_LOCATION_f1": 0.8289473684210527,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7590361445783133,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6166666666666667,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.5967741935483871,
"eval_ORGANIZATION_recall": 0.6379310344827587,
"eval_PERSON_f1": 0.8867313915857605,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8726114649681529,
"eval_PERSON_recall": 0.9013157894736842,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8253968253968255,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.18976914882659912,
"eval_overall_accuracy": 0.9590268886043534,
"eval_overall_f1": 0.8175388967468176,
"eval_overall_precision": 0.7831978319783198,
"eval_overall_recall": 0.8550295857988166,
"eval_runtime": 0.7567,
"eval_samples_per_second": 247.118,
"eval_steps_per_second": 3.964,
"step": 636
},
{
"epoch": 7.0,
"grad_norm": 0.08857329934835434,
"learning_rate": 4.6500000000000005e-05,
"loss": 0.0151,
"step": 742
},
{
"epoch": 7.0,
"eval_LOCATION_f1": 0.84,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7777777777777778,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6491228070175439,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6607142857142857,
"eval_ORGANIZATION_recall": 0.6379310344827587,
"eval_PERSON_f1": 0.8789808917197451,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.9078947368421053,
"eval_QUANTITY_f1": 0.84375,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.9,
"eval_TIME_f1": 0.7692307692307692,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.6944444444444444,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.22696857154369354,
"eval_overall_accuracy": 0.9587708066581306,
"eval_overall_f1": 0.8203677510608204,
"eval_overall_precision": 0.7859078590785907,
"eval_overall_recall": 0.8579881656804734,
"eval_runtime": 0.7647,
"eval_samples_per_second": 244.536,
"eval_steps_per_second": 3.923,
"step": 742
},
{
"epoch": 8.0,
"grad_norm": 0.24211041629314423,
"learning_rate": 4.600000000000001e-05,
"loss": 0.0124,
"step": 848
},
{
"epoch": 8.0,
"eval_LOCATION_f1": 0.8493150684931507,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8051948051948052,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.706766917293233,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6266666666666667,
"eval_ORGANIZATION_recall": 0.8103448275862069,
"eval_PERSON_f1": 0.8761904761904762,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8466257668711656,
"eval_PERSON_recall": 0.9078947368421053,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8196721311475409,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.2596437335014343,
"eval_overall_accuracy": 0.9569782330345711,
"eval_overall_f1": 0.83008356545961,
"eval_overall_precision": 0.7842105263157895,
"eval_overall_recall": 0.8816568047337278,
"eval_runtime": 0.7892,
"eval_samples_per_second": 236.961,
"eval_steps_per_second": 3.802,
"step": 848
},
{
"epoch": 9.0,
"grad_norm": 0.5304147005081177,
"learning_rate": 4.55e-05,
"loss": 0.0088,
"step": 954
},
{
"epoch": 9.0,
"eval_LOCATION_f1": 0.8571428571428572,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8076923076923077,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7401574803149606,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6811594202898551,
"eval_ORGANIZATION_recall": 0.8103448275862069,
"eval_PERSON_f1": 0.8535825545171339,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8106508875739645,
"eval_PERSON_recall": 0.9013157894736842,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.26296016573905945,
"eval_overall_accuracy": 0.9562099871959027,
"eval_overall_f1": 0.83008356545961,
"eval_overall_precision": 0.7842105263157895,
"eval_overall_recall": 0.8816568047337278,
"eval_runtime": 0.8059,
"eval_samples_per_second": 232.037,
"eval_steps_per_second": 3.723,
"step": 954
},
{
"epoch": 10.0,
"grad_norm": 1.2787593603134155,
"learning_rate": 4.5e-05,
"loss": 0.0083,
"step": 1060
},
{
"epoch": 10.0,
"eval_LOCATION_f1": 0.8513513513513514,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7974683544303798,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7703703703703704,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6753246753246753,
"eval_ORGANIZATION_recall": 0.896551724137931,
"eval_PERSON_f1": 0.9079365079365079,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8773006134969326,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.7500000000000001,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7058823529411765,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.23285891115665436,
"eval_overall_accuracy": 0.963124199743918,
"eval_overall_f1": 0.8488210818307906,
"eval_overall_precision": 0.7989556135770235,
"eval_overall_recall": 0.9053254437869822,
"eval_runtime": 0.8566,
"eval_samples_per_second": 218.314,
"eval_steps_per_second": 3.502,
"step": 1060
},
{
"epoch": 11.0,
"grad_norm": 2.0766656398773193,
"learning_rate": 4.4500000000000004e-05,
"loss": 0.0088,
"step": 1166
},
{
"epoch": 11.0,
"eval_LOCATION_f1": 0.8571428571428572,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8076923076923077,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7154471544715447,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.676923076923077,
"eval_ORGANIZATION_recall": 0.7586206896551724,
"eval_PERSON_f1": 0.875,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8333333333333334,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.78125,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7352941176470589,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.8387096774193549,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.23979602754116058,
"eval_overall_accuracy": 0.9610755441741358,
"eval_overall_f1": 0.8324022346368716,
"eval_overall_precision": 0.7883597883597884,
"eval_overall_recall": 0.8816568047337278,
"eval_runtime": 0.7972,
"eval_samples_per_second": 234.561,
"eval_steps_per_second": 3.763,
"step": 1166
},
{
"epoch": 12.0,
"grad_norm": 0.004628497175872326,
"learning_rate": 4.4000000000000006e-05,
"loss": 0.007,
"step": 1272
},
{
"epoch": 12.0,
"eval_LOCATION_f1": 0.8243243243243245,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7704918032786885,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.734375,
"eval_ORGANIZATION_recall": 0.8103448275862069,
"eval_PERSON_f1": 0.8758169934640522,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8701298701298701,
"eval_PERSON_recall": 0.881578947368421,
"eval_QUANTITY_f1": 0.7936507936507938,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7575757575757576,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.23579084873199463,
"eval_overall_accuracy": 0.9623559539052496,
"eval_overall_f1": 0.8395415472779371,
"eval_overall_precision": 0.8138888888888889,
"eval_overall_recall": 0.8668639053254438,
"eval_runtime": 0.8766,
"eval_samples_per_second": 213.313,
"eval_steps_per_second": 3.422,
"step": 1272
},
{
"epoch": 13.0,
"grad_norm": 0.023974481970071793,
"learning_rate": 4.35e-05,
"loss": 0.0061,
"step": 1378
},
{
"epoch": 13.0,
"eval_LOCATION_f1": 0.851063829787234,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8333333333333334,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6019417475728155,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6888888888888889,
"eval_ORGANIZATION_recall": 0.5344827586206896,
"eval_PERSON_f1": 0.8932038834951456,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8789808917197452,
"eval_PERSON_recall": 0.9078947368421053,
"eval_QUANTITY_f1": 0.8,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7428571428571429,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.24468651413917542,
"eval_overall_accuracy": 0.9613316261203585,
"eval_overall_f1": 0.8301329394387003,
"eval_overall_precision": 0.8289085545722714,
"eval_overall_recall": 0.8313609467455622,
"eval_runtime": 0.8154,
"eval_samples_per_second": 229.344,
"eval_steps_per_second": 3.679,
"step": 1378
},
{
"epoch": 14.0,
"grad_norm": 0.16095533967018127,
"learning_rate": 4.3e-05,
"loss": 0.0073,
"step": 1484
},
{
"epoch": 14.0,
"eval_LOCATION_f1": 0.8551724137931034,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8157894736842105,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.7500000000000001,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7258064516129032,
"eval_ORGANIZATION_recall": 0.7758620689655172,
"eval_PERSON_f1": 0.8996763754045308,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8853503184713376,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.8307692307692307,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.9,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.23856018483638763,
"eval_overall_accuracy": 0.9641485275288092,
"eval_overall_f1": 0.855507868383405,
"eval_overall_precision": 0.8282548476454293,
"eval_overall_recall": 0.8846153846153846,
"eval_runtime": 0.7969,
"eval_samples_per_second": 234.66,
"eval_steps_per_second": 3.765,
"step": 1484
},
{
"epoch": 15.0,
"grad_norm": 3.3597922325134277,
"learning_rate": 4.25e-05,
"loss": 0.0046,
"step": 1590
},
{
"epoch": 15.0,
"eval_LOCATION_f1": 0.8493150684931507,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8051948051948052,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.75,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6857142857142857,
"eval_ORGANIZATION_recall": 0.8275862068965517,
"eval_PERSON_f1": 0.9055374592833876,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.896774193548387,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.8571428571428572,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8181818181818182,
"eval_QUANTITY_recall": 0.9,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.23872800171375275,
"eval_overall_accuracy": 0.9651728553137003,
"eval_overall_f1": 0.8579545454545454,
"eval_overall_precision": 0.825136612021858,
"eval_overall_recall": 0.893491124260355,
"eval_runtime": 0.8079,
"eval_samples_per_second": 231.459,
"eval_steps_per_second": 3.713,
"step": 1590
},
{
"epoch": 16.0,
"grad_norm": 4.114704608917236,
"learning_rate": 4.2e-05,
"loss": 0.003,
"step": 1696
},
{
"epoch": 16.0,
"eval_LOCATION_f1": 0.8493150684931507,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8051948051948052,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.6363636363636364,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6730769230769231,
"eval_ORGANIZATION_recall": 0.603448275862069,
"eval_PERSON_f1": 0.9042904290429044,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.9072847682119205,
"eval_PERSON_recall": 0.9013157894736842,
"eval_QUANTITY_f1": 0.8571428571428572,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8181818181818182,
"eval_QUANTITY_recall": 0.9,
"eval_TIME_f1": 0.847457627118644,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.2643202841281891,
"eval_overall_accuracy": 0.9610755441741358,
"eval_overall_f1": 0.8399412628487519,
"eval_overall_precision": 0.8338192419825073,
"eval_overall_recall": 0.8461538461538461,
"eval_runtime": 0.7994,
"eval_samples_per_second": 233.932,
"eval_steps_per_second": 3.753,
"step": 1696
},
{
"epoch": 17.0,
"grad_norm": 0.06794843822717667,
"learning_rate": 4.15e-05,
"loss": 0.0027,
"step": 1802
},
{
"epoch": 17.0,
"eval_LOCATION_f1": 0.8724832214765101,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8125,
"eval_LOCATION_recall": 0.9420289855072463,
"eval_ORGANIZATION_f1": 0.7538461538461538,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6805555555555556,
"eval_ORGANIZATION_recall": 0.8448275862068966,
"eval_PERSON_f1": 0.8701298701298701,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8589743589743589,
"eval_PERSON_recall": 0.881578947368421,
"eval_QUANTITY_f1": 0.84375,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.9,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.279176265001297,
"eval_overall_accuracy": 0.9613316261203585,
"eval_overall_f1": 0.8466947960618846,
"eval_overall_precision": 0.806970509383378,
"eval_overall_recall": 0.8905325443786982,
"eval_runtime": 0.8067,
"eval_samples_per_second": 231.813,
"eval_steps_per_second": 3.719,
"step": 1802
},
{
"epoch": 18.0,
"grad_norm": 0.005153521429747343,
"learning_rate": 4.1e-05,
"loss": 0.0037,
"step": 1908
},
{
"epoch": 18.0,
"eval_LOCATION_f1": 0.8366013071895425,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7619047619047619,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7154471544715447,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.676923076923077,
"eval_ORGANIZATION_recall": 0.7586206896551724,
"eval_PERSON_f1": 0.8945686900958467,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8695652173913043,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8571428571428572,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8181818181818182,
"eval_QUANTITY_recall": 0.9,
"eval_TIME_f1": 0.8524590163934426,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.27270039916038513,
"eval_overall_accuracy": 0.9620998719590269,
"eval_overall_f1": 0.8443197755960729,
"eval_overall_precision": 0.8026666666666666,
"eval_overall_recall": 0.8905325443786982,
"eval_runtime": 0.8021,
"eval_samples_per_second": 233.132,
"eval_steps_per_second": 3.74,
"step": 1908
},
{
"epoch": 19.0,
"grad_norm": 0.6481520533561707,
"learning_rate": 4.05e-05,
"loss": 0.0046,
"step": 2014
},
{
"epoch": 19.0,
"eval_LOCATION_f1": 0.8378378378378378,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.7258064516129032,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6818181818181818,
"eval_ORGANIZATION_recall": 0.7758620689655172,
"eval_PERSON_f1": 0.9155844155844156,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.9038461538461539,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.8571428571428572,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8181818181818182,
"eval_QUANTITY_recall": 0.9,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8620689655172413,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.24588538706302643,
"eval_overall_accuracy": 0.9636363636363636,
"eval_overall_f1": 0.855920114122682,
"eval_overall_precision": 0.8264462809917356,
"eval_overall_recall": 0.8875739644970414,
"eval_runtime": 0.8194,
"eval_samples_per_second": 228.23,
"eval_steps_per_second": 3.661,
"step": 2014
},
{
"epoch": 20.0,
"grad_norm": 0.020622072741389275,
"learning_rate": 4e-05,
"loss": 0.0048,
"step": 2120
},
{
"epoch": 20.0,
"eval_LOCATION_f1": 0.8289473684210527,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7590361445783133,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7317073170731708,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6923076923076923,
"eval_ORGANIZATION_recall": 0.7758620689655172,
"eval_PERSON_f1": 0.9003215434083601,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8805031446540881,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8571428571428572,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8181818181818182,
"eval_QUANTITY_recall": 0.9,
"eval_TIME_f1": 0.8125,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7428571428571429,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.2616201937198639,
"eval_overall_accuracy": 0.9613316261203585,
"eval_overall_f1": 0.8443197755960729,
"eval_overall_precision": 0.8026666666666666,
"eval_overall_recall": 0.8905325443786982,
"eval_runtime": 0.8054,
"eval_samples_per_second": 232.17,
"eval_steps_per_second": 3.725,
"step": 2120
},
{
"epoch": 21.0,
"grad_norm": 3.6123130321502686,
"learning_rate": 3.9500000000000005e-05,
"loss": 0.0047,
"step": 2226
},
{
"epoch": 21.0,
"eval_LOCATION_f1": 0.8666666666666666,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8024691358024691,
"eval_LOCATION_recall": 0.9420289855072463,
"eval_ORGANIZATION_f1": 0.736,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6865671641791045,
"eval_ORGANIZATION_recall": 0.7931034482758621,
"eval_PERSON_f1": 0.8932038834951456,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8789808917197452,
"eval_PERSON_recall": 0.9078947368421053,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.9310344827586207,
"eval_loss": 0.24132052063941956,
"eval_overall_accuracy": 0.9646606914212548,
"eval_overall_f1": 0.848314606741573,
"eval_overall_precision": 0.8074866310160428,
"eval_overall_recall": 0.893491124260355,
"eval_runtime": 0.8121,
"eval_samples_per_second": 230.255,
"eval_steps_per_second": 3.694,
"step": 2226
},
{
"epoch": 22.0,
"grad_norm": 0.009204844012856483,
"learning_rate": 3.9000000000000006e-05,
"loss": 0.0041,
"step": 2332
},
{
"epoch": 22.0,
"eval_LOCATION_f1": 0.8476821192052981,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7804878048780488,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7384615384615385,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8275862068965517,
"eval_PERSON_f1": 0.9032258064516129,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8860759493670886,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.78125,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7352941176470589,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.8125,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7428571428571429,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.2953908145427704,
"eval_overall_accuracy": 0.9620998719590269,
"eval_overall_f1": 0.8428372739916552,
"eval_overall_precision": 0.7952755905511811,
"eval_overall_recall": 0.8964497041420119,
"eval_runtime": 0.8088,
"eval_samples_per_second": 231.216,
"eval_steps_per_second": 3.709,
"step": 2332
},
{
"epoch": 23.0,
"grad_norm": 0.007008604239672422,
"learning_rate": 3.85e-05,
"loss": 0.0034,
"step": 2438
},
{
"epoch": 23.0,
"eval_LOCATION_f1": 0.8435374149659864,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.765625,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7,
"eval_ORGANIZATION_recall": 0.8448275862068966,
"eval_PERSON_f1": 0.9131832797427653,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8930817610062893,
"eval_PERSON_recall": 0.9342105263157895,
"eval_QUANTITY_f1": 0.819672131147541,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8064516129032258,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.8125,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7428571428571429,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.26445022225379944,
"eval_overall_accuracy": 0.9661971830985916,
"eval_overall_f1": 0.8551336146272854,
"eval_overall_precision": 0.8150134048257373,
"eval_overall_recall": 0.8994082840236687,
"eval_runtime": 0.797,
"eval_samples_per_second": 234.637,
"eval_steps_per_second": 3.764,
"step": 2438
},
{
"epoch": 24.0,
"grad_norm": 0.31136611104011536,
"learning_rate": 3.8e-05,
"loss": 0.0021,
"step": 2544
},
{
"epoch": 24.0,
"eval_LOCATION_f1": 0.8493150684931507,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8051948051948052,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.7874015748031497,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7246376811594203,
"eval_ORGANIZATION_recall": 0.8620689655172413,
"eval_PERSON_f1": 0.9067524115755626,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8867924528301887,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.8135593220338982,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8275862068965517,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.8387096774193549,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.27145740389823914,
"eval_overall_accuracy": 0.9654289372599232,
"eval_overall_f1": 0.8595744680851063,
"eval_overall_precision": 0.8256130790190735,
"eval_overall_recall": 0.8964497041420119,
"eval_runtime": 0.8132,
"eval_samples_per_second": 229.963,
"eval_steps_per_second": 3.689,
"step": 2544
},
{
"epoch": 25.0,
"grad_norm": 0.07211441546678543,
"learning_rate": 3.7500000000000003e-05,
"loss": 0.0022,
"step": 2650
},
{
"epoch": 25.0,
"eval_LOCATION_f1": 0.8551724137931034,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8157894736842105,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.7500000000000001,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7258064516129032,
"eval_ORGANIZATION_recall": 0.7758620689655172,
"eval_PERSON_f1": 0.9084967320261438,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.9025974025974026,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.8064516129032259,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.78125,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.8387096774193549,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.26712566614151,
"eval_overall_accuracy": 0.9638924455825865,
"eval_overall_f1": 0.8546762589928059,
"eval_overall_precision": 0.8319327731092437,
"eval_overall_recall": 0.878698224852071,
"eval_runtime": 0.8059,
"eval_samples_per_second": 232.043,
"eval_steps_per_second": 3.723,
"step": 2650
},
{
"epoch": 26.0,
"grad_norm": 6.344851970672607,
"learning_rate": 3.7e-05,
"loss": 0.0021,
"step": 2756
},
{
"epoch": 26.0,
"eval_LOCATION_f1": 0.8311688311688311,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7529411764705882,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7419354838709677,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.696969696969697,
"eval_ORGANIZATION_recall": 0.7931034482758621,
"eval_PERSON_f1": 0.9025974025974026,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8910256410256411,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.8333333333333334,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8333333333333334,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.8524590163934426,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.30937761068344116,
"eval_overall_accuracy": 0.9623559539052496,
"eval_overall_f1": 0.8486562942008485,
"eval_overall_precision": 0.8130081300813008,
"eval_overall_recall": 0.8875739644970414,
"eval_runtime": 0.8324,
"eval_samples_per_second": 224.639,
"eval_steps_per_second": 3.604,
"step": 2756
},
{
"epoch": 27.0,
"grad_norm": 0.9656301736831665,
"learning_rate": 3.65e-05,
"loss": 0.0033,
"step": 2862
},
{
"epoch": 27.0,
"eval_LOCATION_f1": 0.8299319727891156,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.782051282051282,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7603305785123967,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7301587301587301,
"eval_ORGANIZATION_recall": 0.7931034482758621,
"eval_PERSON_f1": 0.9137380191693291,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8881987577639752,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8253968253968255,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.2710714638233185,
"eval_overall_accuracy": 0.9651728553137003,
"eval_overall_f1": 0.8555240793201133,
"eval_overall_precision": 0.8206521739130435,
"eval_overall_recall": 0.893491124260355,
"eval_runtime": 0.802,
"eval_samples_per_second": 233.165,
"eval_steps_per_second": 3.741,
"step": 2862
},
{
"epoch": 28.0,
"grad_norm": 0.023881729692220688,
"learning_rate": 3.6e-05,
"loss": 0.003,
"step": 2968
},
{
"epoch": 28.0,
"eval_LOCATION_f1": 0.8344370860927153,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7682926829268293,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7804878048780489,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7384615384615385,
"eval_ORGANIZATION_recall": 0.8275862068965517,
"eval_PERSON_f1": 0.9161290322580645,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8987341772151899,
"eval_PERSON_recall": 0.9342105263157895,
"eval_QUANTITY_f1": 0.78125,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7352941176470589,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.8387096774193549,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.2883354723453522,
"eval_overall_accuracy": 0.964404609475032,
"eval_overall_f1": 0.8563380281690142,
"eval_overall_precision": 0.8172043010752689,
"eval_overall_recall": 0.8994082840236687,
"eval_runtime": 0.8155,
"eval_samples_per_second": 229.295,
"eval_steps_per_second": 3.679,
"step": 2968
},
{
"epoch": 29.0,
"grad_norm": 0.004700132180005312,
"learning_rate": 3.55e-05,
"loss": 0.0021,
"step": 3074
},
{
"epoch": 29.0,
"eval_LOCATION_f1": 0.8571428571428572,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8076923076923077,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7317073170731708,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6923076923076923,
"eval_ORGANIZATION_recall": 0.7758620689655172,
"eval_PERSON_f1": 0.8996763754045308,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8853503184713376,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.2531093657016754,
"eval_overall_accuracy": 0.9651728553137003,
"eval_overall_f1": 0.8530670470756063,
"eval_overall_precision": 0.8236914600550964,
"eval_overall_recall": 0.8846153846153846,
"eval_runtime": 0.8176,
"eval_samples_per_second": 228.73,
"eval_steps_per_second": 3.669,
"step": 3074
},
{
"epoch": 30.0,
"grad_norm": 0.1790827363729477,
"learning_rate": 3.5e-05,
"loss": 0.0016,
"step": 3180
},
{
"epoch": 30.0,
"eval_LOCATION_f1": 0.8289473684210527,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7590361445783133,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6434782608695653,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6491228070175439,
"eval_ORGANIZATION_recall": 0.6379310344827587,
"eval_PERSON_f1": 0.910828025477707,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8827160493827161,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8253968253968255,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.29236629605293274,
"eval_overall_accuracy": 0.9626120358514725,
"eval_overall_f1": 0.8356940509915014,
"eval_overall_precision": 0.8016304347826086,
"eval_overall_recall": 0.8727810650887574,
"eval_runtime": 0.8083,
"eval_samples_per_second": 231.339,
"eval_steps_per_second": 3.711,
"step": 3180
},
{
"epoch": 31.0,
"grad_norm": 0.0017360023921355605,
"learning_rate": 3.45e-05,
"loss": 0.0048,
"step": 3286
},
{
"epoch": 31.0,
"eval_LOCATION_f1": 0.8724832214765101,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8125,
"eval_LOCATION_recall": 0.9420289855072463,
"eval_ORGANIZATION_f1": 0.6885245901639345,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.65625,
"eval_ORGANIZATION_recall": 0.7241379310344828,
"eval_PERSON_f1": 0.9003215434083601,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8805031446540881,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8253968253968255,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.2867705523967743,
"eval_overall_accuracy": 0.9626120358514725,
"eval_overall_f1": 0.8446327683615819,
"eval_overall_precision": 0.8081081081081081,
"eval_overall_recall": 0.8846153846153846,
"eval_runtime": 0.8033,
"eval_samples_per_second": 232.803,
"eval_steps_per_second": 3.735,
"step": 3286
},
{
"epoch": 32.0,
"grad_norm": 0.009486394003033638,
"learning_rate": 3.4000000000000007e-05,
"loss": 0.0032,
"step": 3392
},
{
"epoch": 32.0,
"eval_LOCATION_f1": 0.8243243243243245,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7142857142857142,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6617647058823529,
"eval_ORGANIZATION_recall": 0.7758620689655172,
"eval_PERSON_f1": 0.8974358974358975,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.875,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.7878787878787877,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7222222222222222,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8125,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7428571428571429,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.2836323380470276,
"eval_overall_accuracy": 0.9605633802816902,
"eval_overall_f1": 0.8324022346368716,
"eval_overall_precision": 0.7883597883597884,
"eval_overall_recall": 0.8816568047337278,
"eval_runtime": 0.8087,
"eval_samples_per_second": 231.245,
"eval_steps_per_second": 3.71,
"step": 3392
},
{
"epoch": 33.0,
"grad_norm": 0.008940489031374454,
"learning_rate": 3.35e-05,
"loss": 0.004,
"step": 3498
},
{
"epoch": 33.0,
"eval_LOCATION_f1": 0.8611111111111112,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8266666666666667,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.735042735042735,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7288135593220338,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.896774193548387,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.879746835443038,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8253968253968255,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.25650379061698914,
"eval_overall_accuracy": 0.9656850192061459,
"eval_overall_f1": 0.8493543758967002,
"eval_overall_precision": 0.8245125348189415,
"eval_overall_recall": 0.8757396449704142,
"eval_runtime": 0.8037,
"eval_samples_per_second": 232.687,
"eval_steps_per_second": 3.733,
"step": 3498
},
{
"epoch": 34.0,
"grad_norm": 0.018895745277404785,
"learning_rate": 3.3e-05,
"loss": 0.0016,
"step": 3604
},
{
"epoch": 34.0,
"eval_LOCATION_f1": 0.8366013071895425,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7619047619047619,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.6896551724137931,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6896551724137931,
"eval_ORGANIZATION_recall": 0.6896551724137931,
"eval_PERSON_f1": 0.9015873015873016,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8711656441717791,
"eval_PERSON_recall": 0.9342105263157895,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8524590163934426,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.2746643126010895,
"eval_overall_accuracy": 0.9651728553137003,
"eval_overall_f1": 0.8429985855728428,
"eval_overall_precision": 0.8075880758807588,
"eval_overall_recall": 0.8816568047337278,
"eval_runtime": 0.8043,
"eval_samples_per_second": 232.493,
"eval_steps_per_second": 3.73,
"step": 3604
},
{
"epoch": 35.0,
"grad_norm": 0.0035857518669217825,
"learning_rate": 3.2500000000000004e-05,
"loss": 0.0018,
"step": 3710
},
{
"epoch": 35.0,
"eval_LOCATION_f1": 0.8590604026845639,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7479674796747967,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7076923076923077,
"eval_ORGANIZATION_recall": 0.7931034482758621,
"eval_PERSON_f1": 0.9096774193548387,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8924050632911392,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.870967741935484,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.84375,
"eval_QUANTITY_recall": 0.9,
"eval_TIME_f1": 0.8387096774193549,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.26389142870903015,
"eval_overall_accuracy": 0.9659411011523688,
"eval_overall_f1": 0.8611898016997167,
"eval_overall_precision": 0.8260869565217391,
"eval_overall_recall": 0.8994082840236687,
"eval_runtime": 0.822,
"eval_samples_per_second": 227.49,
"eval_steps_per_second": 3.65,
"step": 3710
},
{
"epoch": 36.0,
"grad_norm": 0.0013648144667968154,
"learning_rate": 3.2000000000000005e-05,
"loss": 0.0032,
"step": 3816
},
{
"epoch": 36.0,
"eval_LOCATION_f1": 0.8904109589041096,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8441558441558441,
"eval_LOCATION_recall": 0.9420289855072463,
"eval_ORGANIZATION_f1": 0.717948717948718,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.711864406779661,
"eval_ORGANIZATION_recall": 0.7241379310344828,
"eval_PERSON_f1": 0.919093851132686,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.9044585987261147,
"eval_PERSON_recall": 0.9342105263157895,
"eval_QUANTITY_f1": 0.8064516129032259,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.78125,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.8253968253968255,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.2595536410808563,
"eval_overall_accuracy": 0.9654289372599232,
"eval_overall_f1": 0.860832137733142,
"eval_overall_precision": 0.8356545961002786,
"eval_overall_recall": 0.8875739644970414,
"eval_runtime": 0.8156,
"eval_samples_per_second": 229.278,
"eval_steps_per_second": 3.678,
"step": 3816
},
{
"epoch": 37.0,
"grad_norm": 0.001226762542501092,
"learning_rate": 3.15e-05,
"loss": 0.0024,
"step": 3922
},
{
"epoch": 37.0,
"eval_LOCATION_f1": 0.882758620689655,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8421052631578947,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.728813559322034,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7166666666666667,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.9102564102564101,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8875,
"eval_PERSON_recall": 0.9342105263157895,
"eval_QUANTITY_f1": 0.8125,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.847457627118644,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.2782364785671234,
"eval_overall_accuracy": 0.9669654289372599,
"eval_overall_f1": 0.8595988538681948,
"eval_overall_precision": 0.8333333333333334,
"eval_overall_recall": 0.8875739644970414,
"eval_runtime": 0.8106,
"eval_samples_per_second": 230.693,
"eval_steps_per_second": 3.701,
"step": 3922
},
{
"epoch": 38.0,
"grad_norm": 0.0014669048832729459,
"learning_rate": 3.1e-05,
"loss": 0.002,
"step": 4028
},
{
"epoch": 38.0,
"eval_LOCATION_f1": 0.8590604026845639,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7704918032786885,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.734375,
"eval_ORGANIZATION_recall": 0.8103448275862069,
"eval_PERSON_f1": 0.9084967320261438,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.9025974025974026,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.8064516129032259,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.78125,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.8196721311475409,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.2879778742790222,
"eval_overall_accuracy": 0.9664532650448143,
"eval_overall_f1": 0.8571428571428571,
"eval_overall_precision": 0.8287292817679558,
"eval_overall_recall": 0.8875739644970414,
"eval_runtime": 0.8881,
"eval_samples_per_second": 210.566,
"eval_steps_per_second": 3.378,
"step": 4028
},
{
"epoch": 39.0,
"grad_norm": 0.008377453312277794,
"learning_rate": 3.05e-05,
"loss": 0.0027,
"step": 4134
},
{
"epoch": 39.0,
"eval_LOCATION_f1": 0.8724832214765101,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8125,
"eval_LOCATION_recall": 0.9420289855072463,
"eval_ORGANIZATION_f1": 0.71875,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6571428571428571,
"eval_ORGANIZATION_recall": 0.7931034482758621,
"eval_PERSON_f1": 0.8924050632911392,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8597560975609756,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.8000000000000002,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.8524590163934426,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.2859266996383667,
"eval_overall_accuracy": 0.9646606914212548,
"eval_overall_f1": 0.84593837535014,
"eval_overall_precision": 0.8031914893617021,
"eval_overall_recall": 0.893491124260355,
"eval_runtime": 0.8126,
"eval_samples_per_second": 230.123,
"eval_steps_per_second": 3.692,
"step": 4134
},
{
"epoch": 40.0,
"grad_norm": 6.265191078186035,
"learning_rate": 3e-05,
"loss": 0.0028,
"step": 4240
},
{
"epoch": 40.0,
"eval_LOCATION_f1": 0.8648648648648648,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.810126582278481,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7704918032786885,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.734375,
"eval_ORGANIZATION_recall": 0.8103448275862069,
"eval_PERSON_f1": 0.9166666666666667,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.89375,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.8064516129032259,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.78125,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.8387096774193549,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.27767661213874817,
"eval_overall_accuracy": 0.9674775928297055,
"eval_overall_f1": 0.8640226628895185,
"eval_overall_precision": 0.8288043478260869,
"eval_overall_recall": 0.9023668639053254,
"eval_runtime": 0.8112,
"eval_samples_per_second": 230.533,
"eval_steps_per_second": 3.698,
"step": 4240
},
{
"epoch": 41.0,
"grad_norm": 0.01230549905449152,
"learning_rate": 2.95e-05,
"loss": 0.0013,
"step": 4346
},
{
"epoch": 41.0,
"eval_LOCATION_f1": 0.8344370860927153,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7682926829268293,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7540983606557378,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.71875,
"eval_ORGANIZATION_recall": 0.7931034482758621,
"eval_PERSON_f1": 0.910828025477707,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8827160493827161,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8709677419354839,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.9310344827586207,
"eval_loss": 0.27420660853385925,
"eval_overall_accuracy": 0.9667093469910372,
"eval_overall_f1": 0.8579465541490858,
"eval_overall_precision": 0.8176943699731903,
"eval_overall_recall": 0.9023668639053254,
"eval_runtime": 0.804,
"eval_samples_per_second": 232.579,
"eval_steps_per_second": 3.731,
"step": 4346
},
{
"epoch": 42.0,
"grad_norm": 0.0334417000412941,
"learning_rate": 2.9e-05,
"loss": 0.0035,
"step": 4452
},
{
"epoch": 42.0,
"eval_LOCATION_f1": 0.8904109589041096,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8441558441558441,
"eval_LOCATION_recall": 0.9420289855072463,
"eval_ORGANIZATION_f1": 0.7603305785123967,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7301587301587301,
"eval_ORGANIZATION_recall": 0.7931034482758621,
"eval_PERSON_f1": 0.9050632911392406,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8719512195121951,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.7936507936507938,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7575757575757576,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.9310344827586207,
"eval_loss": 0.28786924481391907,
"eval_overall_accuracy": 0.9674775928297055,
"eval_overall_f1": 0.8631875881523273,
"eval_overall_precision": 0.8247978436657682,
"eval_overall_recall": 0.9053254437869822,
"eval_runtime": 0.9089,
"eval_samples_per_second": 205.735,
"eval_steps_per_second": 3.301,
"step": 4452
},
{
"epoch": 43.0,
"grad_norm": 0.27700409293174744,
"learning_rate": 2.8499999999999998e-05,
"loss": 0.0014,
"step": 4558
},
{
"epoch": 43.0,
"eval_LOCATION_f1": 0.8767123287671235,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8311688311688312,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7580645161290323,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7121212121212122,
"eval_ORGANIZATION_recall": 0.8103448275862069,
"eval_PERSON_f1": 0.877742946708464,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8383233532934131,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.7741935483870969,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.75,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.8387096774193549,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.2879803478717804,
"eval_overall_accuracy": 0.9651728553137003,
"eval_overall_f1": 0.8443197755960729,
"eval_overall_precision": 0.8026666666666666,
"eval_overall_recall": 0.8905325443786982,
"eval_runtime": 0.8107,
"eval_samples_per_second": 230.668,
"eval_steps_per_second": 3.701,
"step": 4558
},
{
"epoch": 44.0,
"grad_norm": 0.5553054213523865,
"learning_rate": 2.8000000000000003e-05,
"loss": 0.002,
"step": 4664
},
{
"epoch": 44.0,
"eval_LOCATION_f1": 0.8648648648648648,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.810126582278481,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.796875,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7285714285714285,
"eval_ORGANIZATION_recall": 0.8793103448275862,
"eval_PERSON_f1": 0.9161290322580645,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8987341772151899,
"eval_PERSON_recall": 0.9342105263157895,
"eval_QUANTITY_f1": 0.8064516129032259,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.78125,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.8387096774193549,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.2945367693901062,
"eval_overall_accuracy": 0.9661971830985916,
"eval_overall_f1": 0.867605633802817,
"eval_overall_precision": 0.8279569892473119,
"eval_overall_recall": 0.9112426035502958,
"eval_runtime": 0.8052,
"eval_samples_per_second": 232.233,
"eval_steps_per_second": 3.726,
"step": 4664
},
{
"epoch": 45.0,
"grad_norm": 0.12713950872421265,
"learning_rate": 2.7500000000000004e-05,
"loss": 0.003,
"step": 4770
},
{
"epoch": 45.0,
"eval_LOCATION_f1": 0.8311688311688311,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7529411764705882,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7226890756302522,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7049180327868853,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.9155844155844156,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.9038461538461539,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.819672131147541,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8064516129032258,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.2897718548774719,
"eval_overall_accuracy": 0.9646606914212548,
"eval_overall_f1": 0.8530670470756063,
"eval_overall_precision": 0.8236914600550964,
"eval_overall_recall": 0.8846153846153846,
"eval_runtime": 0.8046,
"eval_samples_per_second": 232.414,
"eval_steps_per_second": 3.729,
"step": 4770
},
{
"epoch": 46.0,
"grad_norm": 0.0031549884006381035,
"learning_rate": 2.7000000000000002e-05,
"loss": 0.0029,
"step": 4876
},
{
"epoch": 46.0,
"eval_LOCATION_f1": 0.8441558441558441,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7647058823529411,
"eval_LOCATION_recall": 0.9420289855072463,
"eval_ORGANIZATION_f1": 0.8125,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7428571428571429,
"eval_ORGANIZATION_recall": 0.896551724137931,
"eval_PERSON_f1": 0.9067524115755626,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8867924528301887,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.870967741935484,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.84375,
"eval_QUANTITY_recall": 0.9,
"eval_TIME_f1": 0.8125,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7428571428571429,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.310619056224823,
"eval_overall_accuracy": 0.9654289372599232,
"eval_overall_f1": 0.8650904033379694,
"eval_overall_precision": 0.8162729658792651,
"eval_overall_recall": 0.9201183431952663,
"eval_runtime": 0.8131,
"eval_samples_per_second": 229.995,
"eval_steps_per_second": 3.69,
"step": 4876
},
{
"epoch": 47.0,
"grad_norm": 0.037439510226249695,
"learning_rate": 2.6500000000000004e-05,
"loss": 0.0033,
"step": 4982
},
{
"epoch": 47.0,
"eval_LOCATION_f1": 0.8840579710144928,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8840579710144928,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.6788990825688075,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7254901960784313,
"eval_ORGANIZATION_recall": 0.6379310344827587,
"eval_PERSON_f1": 0.9215686274509804,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.9155844155844156,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.8524590163934426,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8387096774193549,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8620689655172413,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.26650553941726685,
"eval_overall_accuracy": 0.9638924455825865,
"eval_overall_f1": 0.8630952380952381,
"eval_overall_precision": 0.8682634730538922,
"eval_overall_recall": 0.8579881656804734,
"eval_runtime": 0.8111,
"eval_samples_per_second": 230.541,
"eval_steps_per_second": 3.699,
"step": 4982
},
{
"epoch": 48.0,
"grad_norm": 0.005395154468715191,
"learning_rate": 2.6000000000000002e-05,
"loss": 0.0027,
"step": 5088
},
{
"epoch": 48.0,
"eval_LOCATION_f1": 0.8311688311688311,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7529411764705882,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7538461538461538,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6805555555555556,
"eval_ORGANIZATION_recall": 0.8448275862068966,
"eval_PERSON_f1": 0.896774193548387,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.879746835443038,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8387096774193549,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.3204702138900757,
"eval_overall_accuracy": 0.9605633802816902,
"eval_overall_f1": 0.8467966573816157,
"eval_overall_precision": 0.8,
"eval_overall_recall": 0.8994082840236687,
"eval_runtime": 0.8068,
"eval_samples_per_second": 231.778,
"eval_steps_per_second": 3.718,
"step": 5088
},
{
"epoch": 49.0,
"grad_norm": 0.010527399368584156,
"learning_rate": 2.5500000000000003e-05,
"loss": 0.0014,
"step": 5194
},
{
"epoch": 49.0,
"eval_LOCATION_f1": 0.8724832214765101,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8125,
"eval_LOCATION_recall": 0.9420289855072463,
"eval_ORGANIZATION_f1": 0.7419354838709677,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.696969696969697,
"eval_ORGANIZATION_recall": 0.7931034482758621,
"eval_PERSON_f1": 0.9131832797427653,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8930817610062893,
"eval_PERSON_recall": 0.9342105263157895,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.28002333641052246,
"eval_overall_accuracy": 0.9656850192061459,
"eval_overall_f1": 0.8640226628895185,
"eval_overall_precision": 0.8288043478260869,
"eval_overall_recall": 0.9023668639053254,
"eval_runtime": 0.8074,
"eval_samples_per_second": 231.603,
"eval_steps_per_second": 3.716,
"step": 5194
},
{
"epoch": 50.0,
"grad_norm": 0.0005556904943659902,
"learning_rate": 2.5e-05,
"loss": 0.0005,
"step": 5300
},
{
"epoch": 50.0,
"eval_LOCATION_f1": 0.8590604026845639,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7441860465116279,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.676056338028169,
"eval_ORGANIZATION_recall": 0.8275862068965517,
"eval_PERSON_f1": 0.9067524115755626,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8867924528301887,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.30621612071990967,
"eval_overall_accuracy": 0.9633802816901409,
"eval_overall_f1": 0.8579465541490858,
"eval_overall_precision": 0.8176943699731903,
"eval_overall_recall": 0.9023668639053254,
"eval_runtime": 0.8061,
"eval_samples_per_second": 231.983,
"eval_steps_per_second": 3.722,
"step": 5300
},
{
"epoch": 51.0,
"grad_norm": 0.002213704166933894,
"learning_rate": 2.45e-05,
"loss": 0.0009,
"step": 5406
},
{
"epoch": 51.0,
"eval_LOCATION_f1": 0.8356164383561644,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7922077922077922,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7200000000000001,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6716417910447762,
"eval_ORGANIZATION_recall": 0.7758620689655172,
"eval_PERSON_f1": 0.8974358974358975,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.875,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8387096774193549,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.3094327747821808,
"eval_overall_accuracy": 0.9615877080665813,
"eval_overall_f1": 0.8429985855728428,
"eval_overall_precision": 0.8075880758807588,
"eval_overall_recall": 0.8816568047337278,
"eval_runtime": 0.8118,
"eval_samples_per_second": 230.354,
"eval_steps_per_second": 3.696,
"step": 5406
},
{
"epoch": 52.0,
"grad_norm": 0.12124722450971603,
"learning_rate": 2.4e-05,
"loss": 0.0007,
"step": 5512
},
{
"epoch": 52.0,
"eval_LOCATION_f1": 0.8493150684931507,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8051948051948052,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.7226890756302522,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7049180327868853,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.9003215434083601,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8805031446540881,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.870967741935484,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.84375,
"eval_QUANTITY_recall": 0.9,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.2926962077617645,
"eval_overall_accuracy": 0.9651728553137003,
"eval_overall_f1": 0.8538681948424068,
"eval_overall_precision": 0.8277777777777777,
"eval_overall_recall": 0.8816568047337278,
"eval_runtime": 0.8047,
"eval_samples_per_second": 232.378,
"eval_steps_per_second": 3.728,
"step": 5512
},
{
"epoch": 53.0,
"grad_norm": 0.007010570261627436,
"learning_rate": 2.35e-05,
"loss": 0.0005,
"step": 5618
},
{
"epoch": 53.0,
"eval_LOCATION_f1": 0.8413793103448277,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8026315789473685,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7166666666666668,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6935483870967742,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.9038461538461539,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.88125,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.3106415271759033,
"eval_overall_accuracy": 0.9638924455825865,
"eval_overall_f1": 0.8497854077253219,
"eval_overall_precision": 0.8227146814404432,
"eval_overall_recall": 0.878698224852071,
"eval_runtime": 0.8081,
"eval_samples_per_second": 231.4,
"eval_steps_per_second": 3.712,
"step": 5618
},
{
"epoch": 54.0,
"grad_norm": 0.0005368912825360894,
"learning_rate": 2.3000000000000003e-05,
"loss": 0.0006,
"step": 5724
},
{
"epoch": 54.0,
"eval_LOCATION_f1": 0.8472222222222223,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8133333333333334,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7241379310344829,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7241379310344828,
"eval_ORGANIZATION_recall": 0.7241379310344828,
"eval_PERSON_f1": 0.9102564102564101,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8875,
"eval_PERSON_recall": 0.9342105263157895,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8524590163934426,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.3165185749530792,
"eval_overall_accuracy": 0.9649167733674776,
"eval_overall_f1": 0.8546762589928059,
"eval_overall_precision": 0.8319327731092437,
"eval_overall_recall": 0.878698224852071,
"eval_runtime": 0.8064,
"eval_samples_per_second": 231.905,
"eval_steps_per_second": 3.72,
"step": 5724
},
{
"epoch": 55.0,
"grad_norm": 0.0005507151363417506,
"learning_rate": 2.25e-05,
"loss": 0.0008,
"step": 5830
},
{
"epoch": 55.0,
"eval_LOCATION_f1": 0.8920863309352518,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8857142857142857,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.6915887850467289,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7551020408163265,
"eval_ORGANIZATION_recall": 0.6379310344827587,
"eval_PERSON_f1": 0.9061488673139159,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.89171974522293,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8064516129032259,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.78125,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.28772225975990295,
"eval_overall_accuracy": 0.9677336747759283,
"eval_overall_f1": 0.8579881656804734,
"eval_overall_precision": 0.8579881656804734,
"eval_overall_recall": 0.8579881656804734,
"eval_runtime": 0.8028,
"eval_samples_per_second": 232.926,
"eval_steps_per_second": 3.737,
"step": 5830
},
{
"epoch": 56.0,
"grad_norm": 0.004189824219793081,
"learning_rate": 2.2000000000000003e-05,
"loss": 0.0013,
"step": 5936
},
{
"epoch": 56.0,
"eval_LOCATION_f1": 0.8965517241379309,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8552631578947368,
"eval_LOCATION_recall": 0.9420289855072463,
"eval_ORGANIZATION_f1": 0.6956521739130435,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7017543859649122,
"eval_ORGANIZATION_recall": 0.6896551724137931,
"eval_PERSON_f1": 0.9126213592233009,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8980891719745223,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.8524590163934426,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8387096774193549,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8387096774193549,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.2933734357357025,
"eval_overall_accuracy": 0.9646606914212548,
"eval_overall_f1": 0.861271676300578,
"eval_overall_precision": 0.8418079096045198,
"eval_overall_recall": 0.8816568047337278,
"eval_runtime": 0.8184,
"eval_samples_per_second": 228.501,
"eval_steps_per_second": 3.666,
"step": 5936
},
{
"epoch": 57.0,
"grad_norm": 0.00032704288605600595,
"learning_rate": 2.15e-05,
"loss": 0.0003,
"step": 6042
},
{
"epoch": 57.0,
"eval_LOCATION_f1": 0.8904109589041096,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8441558441558441,
"eval_LOCATION_recall": 0.9420289855072463,
"eval_ORGANIZATION_f1": 0.6956521739130435,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7017543859649122,
"eval_ORGANIZATION_recall": 0.6896551724137931,
"eval_PERSON_f1": 0.9096774193548387,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8924050632911392,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8387096774193549,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.31640374660491943,
"eval_overall_accuracy": 0.9638924455825865,
"eval_overall_f1": 0.8563218390804598,
"eval_overall_precision": 0.8324022346368715,
"eval_overall_recall": 0.8816568047337278,
"eval_runtime": 0.8095,
"eval_samples_per_second": 231.007,
"eval_steps_per_second": 3.706,
"step": 6042
},
{
"epoch": 58.0,
"grad_norm": 0.0005215631099417806,
"learning_rate": 2.1e-05,
"loss": 0.0004,
"step": 6148
},
{
"epoch": 58.0,
"eval_LOCATION_f1": 0.8843537414965987,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8333333333333334,
"eval_LOCATION_recall": 0.9420289855072463,
"eval_ORGANIZATION_f1": 0.7107438016528926,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6825396825396826,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.9096774193548387,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8924050632911392,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8387096774193549,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.32982975244522095,
"eval_overall_accuracy": 0.9628681177976952,
"eval_overall_f1": 0.8575498575498575,
"eval_overall_precision": 0.8269230769230769,
"eval_overall_recall": 0.8905325443786982,
"eval_runtime": 0.8776,
"eval_samples_per_second": 213.09,
"eval_steps_per_second": 3.419,
"step": 6148
},
{
"epoch": 59.0,
"grad_norm": 0.13604550063610077,
"learning_rate": 2.05e-05,
"loss": 0.0006,
"step": 6254
},
{
"epoch": 59.0,
"eval_LOCATION_f1": 0.8965517241379309,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8552631578947368,
"eval_LOCATION_recall": 0.9420289855072463,
"eval_ORGANIZATION_f1": 0.6371681415929203,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6545454545454545,
"eval_ORGANIZATION_recall": 0.6206896551724138,
"eval_PERSON_f1": 0.9131832797427653,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8930817610062893,
"eval_PERSON_recall": 0.9342105263157895,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8524590163934426,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.3474750220775604,
"eval_overall_accuracy": 0.9618437900128041,
"eval_overall_f1": 0.8513708513708513,
"eval_overall_precision": 0.8309859154929577,
"eval_overall_recall": 0.8727810650887574,
"eval_runtime": 0.812,
"eval_samples_per_second": 230.289,
"eval_steps_per_second": 3.694,
"step": 6254
},
{
"epoch": 60.0,
"grad_norm": 0.0007290157955139875,
"learning_rate": 2e-05,
"loss": 0.0009,
"step": 6360
},
{
"epoch": 60.0,
"eval_LOCATION_f1": 0.8783783783783783,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8227848101265823,
"eval_LOCATION_recall": 0.9420289855072463,
"eval_ORGANIZATION_f1": 0.7731092436974789,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7540983606557377,
"eval_ORGANIZATION_recall": 0.7931034482758621,
"eval_PERSON_f1": 0.9096774193548387,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8924050632911392,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8524590163934426,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.3445851802825928,
"eval_overall_accuracy": 0.9646606914212548,
"eval_overall_f1": 0.8673323823109843,
"eval_overall_precision": 0.837465564738292,
"eval_overall_recall": 0.8994082840236687,
"eval_runtime": 0.8135,
"eval_samples_per_second": 229.871,
"eval_steps_per_second": 3.688,
"step": 6360
},
{
"epoch": 61.0,
"grad_norm": 0.01683318056166172,
"learning_rate": 1.9500000000000003e-05,
"loss": 0.0005,
"step": 6466
},
{
"epoch": 61.0,
"eval_LOCATION_f1": 0.8666666666666666,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8024691358024691,
"eval_LOCATION_recall": 0.9420289855072463,
"eval_ORGANIZATION_f1": 0.7200000000000001,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6716417910447762,
"eval_ORGANIZATION_recall": 0.7758620689655172,
"eval_PERSON_f1": 0.9003215434083601,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8805031446540881,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8524590163934426,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.3661682605743408,
"eval_overall_accuracy": 0.9610755441741358,
"eval_overall_f1": 0.8519040902679831,
"eval_overall_precision": 0.8140161725067385,
"eval_overall_recall": 0.893491124260355,
"eval_runtime": 0.8073,
"eval_samples_per_second": 231.639,
"eval_steps_per_second": 3.716,
"step": 6466
},
{
"epoch": 62.0,
"grad_norm": 0.0029261417221277952,
"learning_rate": 1.9e-05,
"loss": 0.002,
"step": 6572
},
{
"epoch": 62.0,
"eval_LOCATION_f1": 0.8965517241379309,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8552631578947368,
"eval_LOCATION_recall": 0.9420289855072463,
"eval_ORGANIZATION_f1": 0.7377049180327868,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.703125,
"eval_ORGANIZATION_recall": 0.7758620689655172,
"eval_PERSON_f1": 0.9067524115755626,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8867924528301887,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.7936507936507938,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7575757575757576,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.31876397132873535,
"eval_overall_accuracy": 0.9664532650448143,
"eval_overall_f1": 0.861626248216833,
"eval_overall_precision": 0.8319559228650137,
"eval_overall_recall": 0.893491124260355,
"eval_runtime": 0.8044,
"eval_samples_per_second": 232.462,
"eval_steps_per_second": 3.729,
"step": 6572
},
{
"epoch": 63.0,
"grad_norm": 0.0014877787325531244,
"learning_rate": 1.85e-05,
"loss": 0.0005,
"step": 6678
},
{
"epoch": 63.0,
"eval_LOCATION_f1": 0.8951048951048951,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8648648648648649,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7603305785123967,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7301587301587301,
"eval_ORGANIZATION_recall": 0.7931034482758621,
"eval_PERSON_f1": 0.9003215434083601,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8805031446540881,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.819672131147541,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8064516129032258,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.3222368061542511,
"eval_overall_accuracy": 0.9669654289372599,
"eval_overall_f1": 0.864942528735632,
"eval_overall_precision": 0.840782122905028,
"eval_overall_recall": 0.8905325443786982,
"eval_runtime": 0.8114,
"eval_samples_per_second": 230.457,
"eval_steps_per_second": 3.697,
"step": 6678
},
{
"epoch": 64.0,
"grad_norm": 0.000210550642805174,
"learning_rate": 1.8e-05,
"loss": 0.0003,
"step": 6784
},
{
"epoch": 64.0,
"eval_LOCATION_f1": 0.8767123287671235,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8311688311688312,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7642276422764227,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7230769230769231,
"eval_ORGANIZATION_recall": 0.8103448275862069,
"eval_PERSON_f1": 0.9003215434083601,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8805031446540881,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8064516129032259,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.78125,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.32881781458854675,
"eval_overall_accuracy": 0.9661971830985916,
"eval_overall_f1": 0.8603988603988605,
"eval_overall_precision": 0.8296703296703297,
"eval_overall_recall": 0.893491124260355,
"eval_runtime": 0.8114,
"eval_samples_per_second": 230.476,
"eval_steps_per_second": 3.697,
"step": 6784
},
{
"epoch": 65.0,
"grad_norm": 0.0021329650189727545,
"learning_rate": 1.75e-05,
"loss": 0.0003,
"step": 6890
},
{
"epoch": 65.0,
"eval_LOCATION_f1": 0.8767123287671235,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8311688311688312,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7704918032786885,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.734375,
"eval_ORGANIZATION_recall": 0.8103448275862069,
"eval_PERSON_f1": 0.8987341772151899,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8658536585365854,
"eval_PERSON_recall": 0.9342105263157895,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8524590163934426,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.33311548829078674,
"eval_overall_accuracy": 0.9661971830985916,
"eval_overall_f1": 0.8628005657708628,
"eval_overall_precision": 0.8265582655826558,
"eval_overall_recall": 0.9023668639053254,
"eval_runtime": 0.8037,
"eval_samples_per_second": 232.685,
"eval_steps_per_second": 3.733,
"step": 6890
},
{
"epoch": 66.0,
"grad_norm": 0.0006951324758119881,
"learning_rate": 1.7000000000000003e-05,
"loss": 0.0003,
"step": 6996
},
{
"epoch": 66.0,
"eval_LOCATION_f1": 0.881118881118881,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8513513513513513,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6666666666666667,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6981132075471698,
"eval_ORGANIZATION_recall": 0.6379310344827587,
"eval_PERSON_f1": 0.9090909090909091,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8974358974358975,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.31618252396583557,
"eval_overall_accuracy": 0.9661971830985916,
"eval_overall_f1": 0.8525547445255474,
"eval_overall_precision": 0.8414985590778098,
"eval_overall_recall": 0.863905325443787,
"eval_runtime": 0.8125,
"eval_samples_per_second": 230.14,
"eval_steps_per_second": 3.692,
"step": 6996
},
{
"epoch": 67.0,
"grad_norm": 0.0028227961156517267,
"learning_rate": 1.65e-05,
"loss": 0.0024,
"step": 7102
},
{
"epoch": 67.0,
"eval_LOCATION_f1": 0.863013698630137,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8181818181818182,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7438016528925621,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7142857142857143,
"eval_ORGANIZATION_recall": 0.7758620689655172,
"eval_PERSON_f1": 0.9114754098360655,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.9084967320261438,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.8064516129032259,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.78125,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.8524590163934426,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.3060024380683899,
"eval_overall_accuracy": 0.9672215108834827,
"eval_overall_f1": 0.8575539568345324,
"eval_overall_precision": 0.834733893557423,
"eval_overall_recall": 0.8816568047337278,
"eval_runtime": 0.8036,
"eval_samples_per_second": 232.709,
"eval_steps_per_second": 3.733,
"step": 7102
},
{
"epoch": 68.0,
"grad_norm": 0.0007019271142780781,
"learning_rate": 1.6000000000000003e-05,
"loss": 0.002,
"step": 7208
},
{
"epoch": 68.0,
"eval_LOCATION_f1": 0.8904109589041096,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8441558441558441,
"eval_LOCATION_recall": 0.9420289855072463,
"eval_ORGANIZATION_f1": 0.6851851851851852,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.74,
"eval_ORGANIZATION_recall": 0.6379310344827587,
"eval_PERSON_f1": 0.9155844155844156,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.9038461538461539,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8387096774193549,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.3085281252861023,
"eval_overall_accuracy": 0.9651728553137003,
"eval_overall_f1": 0.8600583090379009,
"eval_overall_precision": 0.8477011494252874,
"eval_overall_recall": 0.8727810650887574,
"eval_runtime": 0.8099,
"eval_samples_per_second": 230.884,
"eval_steps_per_second": 3.704,
"step": 7208
},
{
"epoch": 69.0,
"grad_norm": 13.608760833740234,
"learning_rate": 1.55e-05,
"loss": 0.0014,
"step": 7314
},
{
"epoch": 69.0,
"eval_LOCATION_f1": 0.8904109589041096,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8441558441558441,
"eval_LOCATION_recall": 0.9420289855072463,
"eval_ORGANIZATION_f1": 0.7086614173228347,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6521739130434783,
"eval_ORGANIZATION_recall": 0.7758620689655172,
"eval_PERSON_f1": 0.89171974522293,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8641975308641975,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.888888888888889,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8484848484848485,
"eval_QUANTITY_recall": 0.9333333333333333,
"eval_TIME_f1": 0.8524590163934426,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.30335918068885803,
"eval_overall_accuracy": 0.9649167733674776,
"eval_overall_f1": 0.8551336146272854,
"eval_overall_precision": 0.8150134048257373,
"eval_overall_recall": 0.8994082840236687,
"eval_runtime": 0.8074,
"eval_samples_per_second": 231.614,
"eval_steps_per_second": 3.716,
"step": 7314
},
{
"epoch": 70.0,
"grad_norm": 0.00710656400769949,
"learning_rate": 1.5e-05,
"loss": 0.0006,
"step": 7420
},
{
"epoch": 70.0,
"eval_LOCATION_f1": 0.882758620689655,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8421052631578947,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7244094488188977,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.7931034482758621,
"eval_PERSON_f1": 0.888888888888889,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8064516129032258,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7575757575757576,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.3125246465206146,
"eval_overall_accuracy": 0.9646606914212548,
"eval_overall_f1": 0.8466947960618846,
"eval_overall_precision": 0.806970509383378,
"eval_overall_recall": 0.8905325443786982,
"eval_runtime": 0.8058,
"eval_samples_per_second": 232.071,
"eval_steps_per_second": 3.723,
"step": 7420
},
{
"epoch": 71.0,
"grad_norm": 0.00047848603571765125,
"learning_rate": 1.45e-05,
"loss": 0.0009,
"step": 7526
},
{
"epoch": 71.0,
"eval_LOCATION_f1": 0.8749999999999999,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.84,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7301587301587301,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6764705882352942,
"eval_ORGANIZATION_recall": 0.7931034482758621,
"eval_PERSON_f1": 0.8952380952380953,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8650306748466258,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.8125,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.7666666666666667,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7419354838709677,
"eval_TIME_recall": 0.7931034482758621,
"eval_loss": 0.3196626901626587,
"eval_overall_accuracy": 0.9638924455825865,
"eval_overall_f1": 0.843441466854725,
"eval_overall_precision": 0.8059299191374663,
"eval_overall_recall": 0.8846153846153846,
"eval_runtime": 0.8027,
"eval_samples_per_second": 232.972,
"eval_steps_per_second": 3.738,
"step": 7526
},
{
"epoch": 72.0,
"grad_norm": 0.002629638649523258,
"learning_rate": 1.4000000000000001e-05,
"loss": 0.0009,
"step": 7632
},
{
"epoch": 72.0,
"eval_LOCATION_f1": 0.882758620689655,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8421052631578947,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7317073170731708,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6923076923076923,
"eval_ORGANIZATION_recall": 0.7758620689655172,
"eval_PERSON_f1": 0.9073482428115016,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8819875776397516,
"eval_PERSON_recall": 0.9342105263157895,
"eval_QUANTITY_f1": 0.8125,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.7868852459016394,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.3206939697265625,
"eval_overall_accuracy": 0.9646606914212548,
"eval_overall_f1": 0.8526912181303117,
"eval_overall_precision": 0.8179347826086957,
"eval_overall_recall": 0.8905325443786982,
"eval_runtime": 0.8794,
"eval_samples_per_second": 212.64,
"eval_steps_per_second": 3.411,
"step": 7632
},
{
"epoch": 73.0,
"grad_norm": 0.0006528229569084942,
"learning_rate": 1.3500000000000001e-05,
"loss": 0.0006,
"step": 7738
},
{
"epoch": 73.0,
"eval_LOCATION_f1": 0.8767123287671235,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8311688311688312,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7049180327868853,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.671875,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.9061488673139159,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.89171974522293,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8196721311475409,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.32062897086143494,
"eval_overall_accuracy": 0.9646606914212548,
"eval_overall_f1": 0.8502139800285307,
"eval_overall_precision": 0.8209366391184573,
"eval_overall_recall": 0.8816568047337278,
"eval_runtime": 0.8113,
"eval_samples_per_second": 230.503,
"eval_steps_per_second": 3.698,
"step": 7738
},
{
"epoch": 74.0,
"grad_norm": 0.0003340624098200351,
"learning_rate": 1.3000000000000001e-05,
"loss": 0.0004,
"step": 7844
},
{
"epoch": 74.0,
"eval_LOCATION_f1": 0.8767123287671235,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8311688311688312,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7213114754098361,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6875,
"eval_ORGANIZATION_recall": 0.7586206896551724,
"eval_PERSON_f1": 0.8990228013029316,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8903225806451613,
"eval_PERSON_recall": 0.9078947368421053,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8196721311475409,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.32088541984558105,
"eval_overall_accuracy": 0.9641485275288092,
"eval_overall_f1": 0.8497854077253219,
"eval_overall_precision": 0.8227146814404432,
"eval_overall_recall": 0.878698224852071,
"eval_runtime": 0.8194,
"eval_samples_per_second": 228.212,
"eval_steps_per_second": 3.661,
"step": 7844
},
{
"epoch": 75.0,
"grad_norm": 0.0001975786144612357,
"learning_rate": 1.25e-05,
"loss": 0.0003,
"step": 7950
},
{
"epoch": 75.0,
"eval_LOCATION_f1": 0.8936170212765957,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.875,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6991869918699186,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6615384615384615,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.8996763754045308,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8853503184713376,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8196721311475409,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.32191890478134155,
"eval_overall_accuracy": 0.9636363636363636,
"eval_overall_f1": 0.8493543758967002,
"eval_overall_precision": 0.8245125348189415,
"eval_overall_recall": 0.8757396449704142,
"eval_runtime": 0.7893,
"eval_samples_per_second": 236.92,
"eval_steps_per_second": 3.801,
"step": 7950
},
{
"epoch": 76.0,
"grad_norm": 0.0004086096887476742,
"learning_rate": 1.2e-05,
"loss": 0.0003,
"step": 8056
},
{
"epoch": 76.0,
"eval_LOCATION_f1": 0.8767123287671235,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8311688311688312,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.732824427480916,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6575342465753424,
"eval_ORGANIZATION_recall": 0.8275862068965517,
"eval_PERSON_f1": 0.9038461538461539,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.88125,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8196721311475409,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.3355537950992584,
"eval_overall_accuracy": 0.963124199743918,
"eval_overall_f1": 0.85273492286115,
"eval_overall_precision": 0.8106666666666666,
"eval_overall_recall": 0.8994082840236687,
"eval_runtime": 0.8123,
"eval_samples_per_second": 230.209,
"eval_steps_per_second": 3.693,
"step": 8056
},
{
"epoch": 77.0,
"grad_norm": 0.000383577193133533,
"learning_rate": 1.1500000000000002e-05,
"loss": 0.0002,
"step": 8162
},
{
"epoch": 77.0,
"eval_LOCATION_f1": 0.8951048951048951,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8648648648648649,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7166666666666668,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6935483870967742,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.9003215434083601,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8805031446540881,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8196721311475409,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.3264581859111786,
"eval_overall_accuracy": 0.9656850192061459,
"eval_overall_f1": 0.8550932568149211,
"eval_overall_precision": 0.83008356545961,
"eval_overall_recall": 0.8816568047337278,
"eval_runtime": 0.8006,
"eval_samples_per_second": 233.575,
"eval_steps_per_second": 3.747,
"step": 8162
},
{
"epoch": 78.0,
"grad_norm": 0.0004785690689459443,
"learning_rate": 1.1000000000000001e-05,
"loss": 0.0002,
"step": 8268
},
{
"epoch": 78.0,
"eval_LOCATION_f1": 0.888888888888889,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8533333333333334,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7213114754098361,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6875,
"eval_ORGANIZATION_recall": 0.7586206896551724,
"eval_PERSON_f1": 0.9003215434083601,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8805031446540881,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8196721311475409,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.32919907569885254,
"eval_overall_accuracy": 0.9649167733674776,
"eval_overall_f1": 0.8530670470756063,
"eval_overall_precision": 0.8236914600550964,
"eval_overall_recall": 0.8846153846153846,
"eval_runtime": 0.7937,
"eval_samples_per_second": 235.609,
"eval_steps_per_second": 3.78,
"step": 8268
},
{
"epoch": 79.0,
"grad_norm": 0.8365729451179504,
"learning_rate": 1.05e-05,
"loss": 0.0003,
"step": 8374
},
{
"epoch": 79.0,
"eval_LOCATION_f1": 0.888888888888889,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8533333333333334,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7154471544715447,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.676923076923077,
"eval_ORGANIZATION_recall": 0.7586206896551724,
"eval_PERSON_f1": 0.891025641025641,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.86875,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8196721311475409,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.333362877368927,
"eval_overall_accuracy": 0.9646606914212548,
"eval_overall_f1": 0.8490028490028488,
"eval_overall_precision": 0.8186813186813187,
"eval_overall_recall": 0.8816568047337278,
"eval_runtime": 0.8323,
"eval_samples_per_second": 224.68,
"eval_steps_per_second": 3.604,
"step": 8374
},
{
"epoch": 80.0,
"grad_norm": 0.0004933515447191894,
"learning_rate": 1e-05,
"loss": 0.0006,
"step": 8480
},
{
"epoch": 80.0,
"eval_LOCATION_f1": 0.8951048951048951,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8648648648648649,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.6890756302521007,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6721311475409836,
"eval_ORGANIZATION_recall": 0.7068965517241379,
"eval_PERSON_f1": 0.9055374592833876,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.896774193548387,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.870967741935484,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.84375,
"eval_QUANTITY_recall": 0.9,
"eval_TIME_f1": 0.8196721311475409,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.33931657671928406,
"eval_overall_accuracy": 0.9646606914212548,
"eval_overall_f1": 0.8554913294797689,
"eval_overall_precision": 0.8361581920903954,
"eval_overall_recall": 0.8757396449704142,
"eval_runtime": 0.8001,
"eval_samples_per_second": 233.722,
"eval_steps_per_second": 3.75,
"step": 8480
},
{
"epoch": 81.0,
"grad_norm": 0.0009226278634741902,
"learning_rate": 9.5e-06,
"loss": 0.0002,
"step": 8586
},
{
"epoch": 81.0,
"eval_LOCATION_f1": 0.888888888888889,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8533333333333334,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7213114754098361,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6875,
"eval_ORGANIZATION_recall": 0.7586206896551724,
"eval_PERSON_f1": 0.8990228013029316,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8903225806451613,
"eval_PERSON_recall": 0.9078947368421053,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8196721311475409,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.3536657691001892,
"eval_overall_accuracy": 0.964404609475032,
"eval_overall_f1": 0.8522238163558107,
"eval_overall_precision": 0.8272980501392758,
"eval_overall_recall": 0.878698224852071,
"eval_runtime": 0.8023,
"eval_samples_per_second": 233.087,
"eval_steps_per_second": 3.739,
"step": 8586
},
{
"epoch": 82.0,
"grad_norm": 0.001014114823192358,
"learning_rate": 9e-06,
"loss": 0.0003,
"step": 8692
},
{
"epoch": 82.0,
"eval_LOCATION_f1": 0.888888888888889,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8533333333333334,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.719298245614035,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7321428571428571,
"eval_ORGANIZATION_recall": 0.7068965517241379,
"eval_PERSON_f1": 0.8961038961038961,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8846153846153846,
"eval_PERSON_recall": 0.9078947368421053,
"eval_QUANTITY_f1": 0.8064516129032259,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.78125,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.8196721311475409,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.3606484830379486,
"eval_overall_accuracy": 0.9638924455825865,
"eval_overall_f1": 0.8505079825834543,
"eval_overall_precision": 0.8347578347578347,
"eval_overall_recall": 0.8668639053254438,
"eval_runtime": 0.8129,
"eval_samples_per_second": 230.048,
"eval_steps_per_second": 3.691,
"step": 8692
},
{
"epoch": 83.0,
"grad_norm": 0.0005941664567217231,
"learning_rate": 8.500000000000002e-06,
"loss": 0.0006,
"step": 8798
},
{
"epoch": 83.0,
"eval_LOCATION_f1": 0.9090909090909092,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8783783783783784,
"eval_LOCATION_recall": 0.9420289855072463,
"eval_ORGANIZATION_f1": 0.6545454545454545,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6923076923076923,
"eval_ORGANIZATION_recall": 0.6206896551724138,
"eval_PERSON_f1": 0.9055374592833876,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.896774193548387,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.8064516129032259,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.78125,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.8196721311475409,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.35767465829849243,
"eval_overall_accuracy": 0.9641485275288092,
"eval_overall_f1": 0.8491947291361641,
"eval_overall_precision": 0.8405797101449275,
"eval_overall_recall": 0.8579881656804734,
"eval_runtime": 0.8106,
"eval_samples_per_second": 230.7,
"eval_steps_per_second": 3.701,
"step": 8798
},
{
"epoch": 84.0,
"grad_norm": 0.0007156149367801845,
"learning_rate": 8.000000000000001e-06,
"loss": 0.001,
"step": 8904
},
{
"epoch": 84.0,
"eval_LOCATION_f1": 0.9027777777777778,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8666666666666667,
"eval_LOCATION_recall": 0.9420289855072463,
"eval_ORGANIZATION_f1": 0.6548672566371682,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6727272727272727,
"eval_ORGANIZATION_recall": 0.6379310344827587,
"eval_PERSON_f1": 0.8961038961038961,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8846153846153846,
"eval_PERSON_recall": 0.9078947368421053,
"eval_QUANTITY_f1": 0.8064516129032259,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.78125,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.8196721311475409,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.36741259694099426,
"eval_overall_accuracy": 0.9618437900128041,
"eval_overall_f1": 0.8430232558139535,
"eval_overall_precision": 0.8285714285714286,
"eval_overall_recall": 0.8579881656804734,
"eval_runtime": 0.799,
"eval_samples_per_second": 234.039,
"eval_steps_per_second": 3.755,
"step": 8904
},
{
"epoch": 85.0,
"grad_norm": 0.00027448913897387683,
"learning_rate": 7.5e-06,
"loss": 0.0006,
"step": 9010
},
{
"epoch": 85.0,
"eval_LOCATION_f1": 0.9090909090909092,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8783783783783784,
"eval_LOCATION_recall": 0.9420289855072463,
"eval_ORGANIZATION_f1": 0.6725663716814159,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6909090909090909,
"eval_ORGANIZATION_recall": 0.6551724137931034,
"eval_PERSON_f1": 0.8932038834951456,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8789808917197452,
"eval_PERSON_recall": 0.9078947368421053,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8196721311475409,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.36387643218040466,
"eval_overall_accuracy": 0.9615877080665813,
"eval_overall_f1": 0.8488372093023255,
"eval_overall_precision": 0.8342857142857143,
"eval_overall_recall": 0.863905325443787,
"eval_runtime": 0.8034,
"eval_samples_per_second": 232.767,
"eval_steps_per_second": 3.734,
"step": 9010
},
{
"epoch": 86.0,
"grad_norm": 0.0002620484447106719,
"learning_rate": 7.000000000000001e-06,
"loss": 0.0004,
"step": 9116
},
{
"epoch": 86.0,
"eval_LOCATION_f1": 0.8936170212765957,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.875,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6851851851851852,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.74,
"eval_ORGANIZATION_recall": 0.6379310344827587,
"eval_PERSON_f1": 0.8996763754045308,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8853503184713376,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8196721311475409,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.3683052957057953,
"eval_overall_accuracy": 0.9633802816901409,
"eval_overall_f1": 0.8516886930983848,
"eval_overall_precision": 0.8454810495626822,
"eval_overall_recall": 0.8579881656804734,
"eval_runtime": 0.796,
"eval_samples_per_second": 234.923,
"eval_steps_per_second": 3.769,
"step": 9116
},
{
"epoch": 87.0,
"grad_norm": 0.00031526130624115467,
"learning_rate": 6.5000000000000004e-06,
"loss": 0.0005,
"step": 9222
},
{
"epoch": 87.0,
"eval_LOCATION_f1": 0.888888888888889,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8533333333333334,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.6846846846846846,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7169811320754716,
"eval_ORGANIZATION_recall": 0.6551724137931034,
"eval_PERSON_f1": 0.8961038961038961,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8846153846153846,
"eval_PERSON_recall": 0.9078947368421053,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8196721311475409,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.35311439633369446,
"eval_overall_accuracy": 0.9626120358514725,
"eval_overall_f1": 0.8483965014577258,
"eval_overall_precision": 0.8362068965517241,
"eval_overall_recall": 0.8609467455621301,
"eval_runtime": 0.7988,
"eval_samples_per_second": 234.112,
"eval_steps_per_second": 3.756,
"step": 9222
},
{
"epoch": 88.0,
"grad_norm": 0.0015132308471947908,
"learning_rate": 6e-06,
"loss": 0.0002,
"step": 9328
},
{
"epoch": 88.0,
"eval_LOCATION_f1": 0.881118881118881,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8513513513513513,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6909090909090909,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7307692307692307,
"eval_ORGANIZATION_recall": 0.6551724137931034,
"eval_PERSON_f1": 0.9025974025974026,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8910256410256411,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8196721311475409,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.3533298671245575,
"eval_overall_accuracy": 0.9633802816901409,
"eval_overall_f1": 0.8508771929824561,
"eval_overall_precision": 0.8410404624277457,
"eval_overall_recall": 0.8609467455621301,
"eval_runtime": 0.8072,
"eval_samples_per_second": 231.657,
"eval_steps_per_second": 3.716,
"step": 9328
},
{
"epoch": 89.0,
"grad_norm": 0.00042143117752857506,
"learning_rate": 5.500000000000001e-06,
"loss": 0.0002,
"step": 9434
},
{
"epoch": 89.0,
"eval_LOCATION_f1": 0.881118881118881,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8513513513513513,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.719298245614035,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7321428571428571,
"eval_ORGANIZATION_recall": 0.7068965517241379,
"eval_PERSON_f1": 0.8961038961038961,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8846153846153846,
"eval_PERSON_recall": 0.9078947368421053,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8196721311475409,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.35247281193733215,
"eval_overall_accuracy": 0.9636363636363636,
"eval_overall_f1": 0.8517441860465117,
"eval_overall_precision": 0.8371428571428572,
"eval_overall_recall": 0.8668639053254438,
"eval_runtime": 0.8068,
"eval_samples_per_second": 231.777,
"eval_steps_per_second": 3.718,
"step": 9434
},
{
"epoch": 90.0,
"grad_norm": 0.0002251994446851313,
"learning_rate": 5e-06,
"loss": 0.0002,
"step": 9540
},
{
"epoch": 90.0,
"eval_LOCATION_f1": 0.888888888888889,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8533333333333334,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7241379310344829,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7241379310344828,
"eval_ORGANIZATION_recall": 0.7241379310344828,
"eval_PERSON_f1": 0.9025974025974026,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8910256410256411,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8196721311475409,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.35829171538352966,
"eval_overall_accuracy": 0.9633802816901409,
"eval_overall_f1": 0.8567293777134587,
"eval_overall_precision": 0.8385269121813032,
"eval_overall_recall": 0.8757396449704142,
"eval_runtime": 0.813,
"eval_samples_per_second": 230.023,
"eval_steps_per_second": 3.69,
"step": 9540
},
{
"epoch": 91.0,
"grad_norm": 0.0003033955581486225,
"learning_rate": 4.5e-06,
"loss": 0.0002,
"step": 9646
},
{
"epoch": 91.0,
"eval_LOCATION_f1": 0.8965517241379309,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8552631578947368,
"eval_LOCATION_recall": 0.9420289855072463,
"eval_ORGANIZATION_f1": 0.735042735042735,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7288135593220338,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.8961038961038961,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8846153846153846,
"eval_PERSON_recall": 0.9078947368421053,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8196721311475409,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.3626328408718109,
"eval_overall_accuracy": 0.963124199743918,
"eval_overall_f1": 0.8571428571428573,
"eval_overall_precision": 0.8366197183098592,
"eval_overall_recall": 0.878698224852071,
"eval_runtime": 0.791,
"eval_samples_per_second": 236.421,
"eval_steps_per_second": 3.793,
"step": 9646
},
{
"epoch": 92.0,
"grad_norm": 0.00020177336409687996,
"learning_rate": 4.000000000000001e-06,
"loss": 0.0005,
"step": 9752
},
{
"epoch": 92.0,
"eval_LOCATION_f1": 0.881118881118881,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8513513513513513,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7304347826086957,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7368421052631579,
"eval_ORGANIZATION_recall": 0.7241379310344828,
"eval_PERSON_f1": 0.8961038961038961,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8846153846153846,
"eval_PERSON_recall": 0.9078947368421053,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8196721311475409,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.3607942759990692,
"eval_overall_accuracy": 0.9633802816901409,
"eval_overall_f1": 0.8534107402031931,
"eval_overall_precision": 0.8376068376068376,
"eval_overall_recall": 0.8698224852071006,
"eval_runtime": 0.8031,
"eval_samples_per_second": 232.851,
"eval_steps_per_second": 3.736,
"step": 9752
},
{
"epoch": 93.0,
"grad_norm": 0.0001372557453578338,
"learning_rate": 3.5000000000000004e-06,
"loss": 0.0002,
"step": 9858
},
{
"epoch": 93.0,
"eval_LOCATION_f1": 0.888888888888889,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8533333333333334,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.728813559322034,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7166666666666667,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.9025974025974026,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8910256410256411,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8196721311475409,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.3570501208305359,
"eval_overall_accuracy": 0.9633802816901409,
"eval_overall_f1": 0.8571428571428573,
"eval_overall_precision": 0.8366197183098592,
"eval_overall_recall": 0.878698224852071,
"eval_runtime": 0.8126,
"eval_samples_per_second": 230.138,
"eval_steps_per_second": 3.692,
"step": 9858
},
{
"epoch": 94.0,
"grad_norm": 0.00034642827813513577,
"learning_rate": 3e-06,
"loss": 0.0002,
"step": 9964
},
{
"epoch": 94.0,
"eval_LOCATION_f1": 0.888888888888889,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8533333333333334,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.728813559322034,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7166666666666667,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.9025974025974026,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8910256410256411,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8196721311475409,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.3574298322200775,
"eval_overall_accuracy": 0.9633802816901409,
"eval_overall_f1": 0.8571428571428573,
"eval_overall_precision": 0.8366197183098592,
"eval_overall_recall": 0.878698224852071,
"eval_runtime": 0.8062,
"eval_samples_per_second": 231.955,
"eval_steps_per_second": 3.721,
"step": 9964
},
{
"epoch": 95.0,
"grad_norm": 0.0005071151535958052,
"learning_rate": 2.5e-06,
"loss": 0.0004,
"step": 10070
},
{
"epoch": 95.0,
"eval_LOCATION_f1": 0.8951048951048951,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8648648648648649,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7166666666666668,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6935483870967742,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.9025974025974026,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8910256410256411,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8196721311475409,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.35781243443489075,
"eval_overall_accuracy": 0.9641485275288092,
"eval_overall_f1": 0.8559077809798271,
"eval_overall_precision": 0.8342696629213483,
"eval_overall_recall": 0.878698224852071,
"eval_runtime": 0.8038,
"eval_samples_per_second": 232.657,
"eval_steps_per_second": 3.732,
"step": 10070
},
{
"epoch": 96.0,
"grad_norm": 0.000192229199456051,
"learning_rate": 2.0000000000000003e-06,
"loss": 0.0003,
"step": 10176
},
{
"epoch": 96.0,
"eval_LOCATION_f1": 0.8951048951048951,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8648648648648649,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7166666666666668,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6935483870967742,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.8961038961038961,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8846153846153846,
"eval_PERSON_recall": 0.9078947368421053,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8196721311475409,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.35879892110824585,
"eval_overall_accuracy": 0.9638924455825865,
"eval_overall_f1": 0.8530259365994237,
"eval_overall_precision": 0.8314606741573034,
"eval_overall_recall": 0.8757396449704142,
"eval_runtime": 0.8034,
"eval_samples_per_second": 232.77,
"eval_steps_per_second": 3.734,
"step": 10176
},
{
"epoch": 97.0,
"grad_norm": 0.00012044800678268075,
"learning_rate": 1.5e-06,
"loss": 0.0004,
"step": 10282
},
{
"epoch": 97.0,
"eval_LOCATION_f1": 0.888888888888889,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8533333333333334,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7166666666666668,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6935483870967742,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.9025974025974026,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8910256410256411,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8196721311475409,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.3565698266029358,
"eval_overall_accuracy": 0.9638924455825865,
"eval_overall_f1": 0.8546762589928059,
"eval_overall_precision": 0.8319327731092437,
"eval_overall_recall": 0.878698224852071,
"eval_runtime": 0.8012,
"eval_samples_per_second": 233.392,
"eval_steps_per_second": 3.744,
"step": 10282
},
{
"epoch": 98.0,
"grad_norm": 0.0002169125946238637,
"learning_rate": 1.0000000000000002e-06,
"loss": 0.0003,
"step": 10388
},
{
"epoch": 98.0,
"eval_LOCATION_f1": 0.888888888888889,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8533333333333334,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7107438016528926,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6825396825396826,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.9025974025974026,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8910256410256411,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8196721311475409,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.3576311767101288,
"eval_overall_accuracy": 0.9636363636363636,
"eval_overall_f1": 0.8534482758620691,
"eval_overall_precision": 0.8296089385474861,
"eval_overall_recall": 0.878698224852071,
"eval_runtime": 0.7986,
"eval_samples_per_second": 234.172,
"eval_steps_per_second": 3.757,
"step": 10388
},
{
"epoch": 99.0,
"grad_norm": 0.0006560708279721439,
"learning_rate": 5.000000000000001e-07,
"loss": 0.0004,
"step": 10494
},
{
"epoch": 99.0,
"eval_LOCATION_f1": 0.8965517241379309,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8552631578947368,
"eval_LOCATION_recall": 0.9420289855072463,
"eval_ORGANIZATION_f1": 0.7166666666666668,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6935483870967742,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.9025974025974026,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8910256410256411,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8196721311475409,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.3574199676513672,
"eval_overall_accuracy": 0.9638924455825865,
"eval_overall_f1": 0.8563218390804598,
"eval_overall_precision": 0.8324022346368715,
"eval_overall_recall": 0.8816568047337278,
"eval_runtime": 0.7986,
"eval_samples_per_second": 234.152,
"eval_steps_per_second": 3.756,
"step": 10494
},
{
"epoch": 100.0,
"grad_norm": 0.0002968113112729043,
"learning_rate": 0.0,
"loss": 0.0002,
"step": 10600
},
{
"epoch": 100.0,
"eval_LOCATION_f1": 0.8965517241379309,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8552631578947368,
"eval_LOCATION_recall": 0.9420289855072463,
"eval_ORGANIZATION_f1": 0.7166666666666668,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6935483870967742,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.9025974025974026,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8910256410256411,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8196721311475409,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.35746997594833374,
"eval_overall_accuracy": 0.9638924455825865,
"eval_overall_f1": 0.8563218390804598,
"eval_overall_precision": 0.8324022346368715,
"eval_overall_recall": 0.8816568047337278,
"eval_runtime": 0.8145,
"eval_samples_per_second": 229.593,
"eval_steps_per_second": 3.683,
"step": 10600
},
{
"epoch": 100.0,
"step": 10600,
"total_flos": 4488439619319522.0,
"train_loss": 0.00870023393810217,
"train_runtime": 2597.4084,
"train_samples_per_second": 64.949,
"train_steps_per_second": 4.081
}
],
"logging_steps": 500,
"max_steps": 10600,
"num_input_tokens_seen": 0,
"num_train_epochs": 100,
"save_steps": 500,
"total_flos": 4488439619319522.0,
"train_batch_size": 16,
"trial_name": null,
"trial_params": null
}