nerugm-base-2 / trainer_state.json
apwic's picture
End of training
a93afc0 verified
raw
history blame
144 kB
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 100.0,
"eval_steps": 500,
"global_step": 10600,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"grad_norm": 4.555638790130615,
"learning_rate": 4.9500000000000004e-05,
"loss": 0.3502,
"step": 106
},
{
"epoch": 1.0,
"eval_LOCATION_f1": 0.751592356687898,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.6941176470588235,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7305389221556886,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6630434782608695,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.8976897689768978,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.5423728813559322,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.4444444444444444,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.6779661016949152,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6060606060606061,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.16481448709964752,
"eval_overall_accuracy": 0.9522141606204654,
"eval_overall_f1": 0.7838926174496645,
"eval_overall_precision": 0.7192118226600985,
"eval_overall_recall": 0.8613569321533924,
"eval_runtime": 0.8792,
"eval_samples_per_second": 212.683,
"eval_steps_per_second": 3.412,
"step": 106
},
{
"epoch": 2.0,
"grad_norm": 3.0741477012634277,
"learning_rate": 4.9e-05,
"loss": 0.1178,
"step": 212
},
{
"epoch": 2.0,
"eval_LOCATION_f1": 0.8289473684210527,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7875,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.7100000000000001,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.568,
"eval_ORGANIZATION_recall": 0.9466666666666667,
"eval_PERSON_f1": 0.9047619047619047,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8807947019867549,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.5614035087719297,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.47058823529411764,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.14857080578804016,
"eval_overall_accuracy": 0.9537152864648486,
"eval_overall_f1": 0.8079470198675497,
"eval_overall_precision": 0.7331730769230769,
"eval_overall_recall": 0.8997050147492626,
"eval_runtime": 0.9505,
"eval_samples_per_second": 196.731,
"eval_steps_per_second": 3.156,
"step": 212
},
{
"epoch": 3.0,
"grad_norm": 2.83402419090271,
"learning_rate": 4.85e-05,
"loss": 0.0781,
"step": 318
},
{
"epoch": 3.0,
"eval_LOCATION_f1": 0.8299319727891157,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8133333333333334,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7777777777777778,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.9333333333333333,
"eval_PERSON_f1": 0.8933333333333333,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8535031847133758,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7083333333333334,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.68,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.15726295113563538,
"eval_overall_accuracy": 0.9552164123092319,
"eval_overall_f1": 0.8363136176066025,
"eval_overall_precision": 0.7835051546391752,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.8869,
"eval_samples_per_second": 210.857,
"eval_steps_per_second": 3.383,
"step": 318
},
{
"epoch": 4.0,
"grad_norm": 2.320517063140869,
"learning_rate": 4.8e-05,
"loss": 0.0572,
"step": 424
},
{
"epoch": 4.0,
"eval_LOCATION_f1": 0.816326530612245,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7651006711409396,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7702702702702703,
"eval_ORGANIZATION_recall": 0.76,
"eval_PERSON_f1": 0.9019607843137255,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8466257668711656,
"eval_PERSON_recall": 0.965034965034965,
"eval_QUANTITY_f1": 0.6415094339622641,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5666666666666667,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7368421052631579,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6774193548387096,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.17222364246845245,
"eval_overall_accuracy": 0.957968476357268,
"eval_overall_f1": 0.8230337078651685,
"eval_overall_precision": 0.7855227882037533,
"eval_overall_recall": 0.8643067846607669,
"eval_runtime": 0.9001,
"eval_samples_per_second": 207.754,
"eval_steps_per_second": 3.333,
"step": 424
},
{
"epoch": 5.0,
"grad_norm": 0.44582077860832214,
"learning_rate": 4.75e-05,
"loss": 0.0359,
"step": 530
},
{
"epoch": 5.0,
"eval_LOCATION_f1": 0.8258064516129032,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7710843373493976,
"eval_LOCATION_recall": 0.8888888888888888,
"eval_ORGANIZATION_f1": 0.7951807228915663,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7252747252747253,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.9152542372881356,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8881578947368421,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7450980392156864,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6785714285714286,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8799999999999999,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.9166666666666666,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.15475203096866608,
"eval_overall_accuracy": 0.9642231673755316,
"eval_overall_f1": 0.8535564853556487,
"eval_overall_precision": 0.8095238095238095,
"eval_overall_recall": 0.9026548672566371,
"eval_runtime": 0.9396,
"eval_samples_per_second": 199.021,
"eval_steps_per_second": 3.193,
"step": 530
},
{
"epoch": 6.0,
"grad_norm": 0.24779094755649567,
"learning_rate": 4.7e-05,
"loss": 0.0236,
"step": 636
},
{
"epoch": 6.0,
"eval_LOCATION_f1": 0.7808219178082192,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7702702702702703,
"eval_LOCATION_recall": 0.7916666666666666,
"eval_ORGANIZATION_f1": 0.7564102564102564,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7283950617283951,
"eval_ORGANIZATION_recall": 0.7866666666666666,
"eval_PERSON_f1": 0.888888888888889,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.9230769230769231,
"eval_QUANTITY_f1": 0.72,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8148148148148148,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7857142857142857,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.18202847242355347,
"eval_overall_accuracy": 0.9604703527645734,
"eval_overall_f1": 0.8193456614509247,
"eval_overall_precision": 0.7912087912087912,
"eval_overall_recall": 0.8495575221238938,
"eval_runtime": 0.9076,
"eval_samples_per_second": 206.029,
"eval_steps_per_second": 3.305,
"step": 636
},
{
"epoch": 7.0,
"grad_norm": 0.0966544821858406,
"learning_rate": 4.6500000000000005e-05,
"loss": 0.0164,
"step": 742
},
{
"epoch": 7.0,
"eval_LOCATION_f1": 0.8181818181818181,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7682926829268293,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.744186046511628,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6597938144329897,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.9072847682119206,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8616352201257862,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.7547169811320754,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8695652173913043,
"eval_TIME_f1": 0.7719298245614036,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7096774193548387,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.2388230413198471,
"eval_overall_accuracy": 0.9567175381536153,
"eval_overall_f1": 0.8292682926829268,
"eval_overall_precision": 0.7669172932330827,
"eval_overall_recall": 0.9026548672566371,
"eval_runtime": 0.9186,
"eval_samples_per_second": 203.564,
"eval_steps_per_second": 3.266,
"step": 742
},
{
"epoch": 8.0,
"grad_norm": 6.724938869476318,
"learning_rate": 4.600000000000001e-05,
"loss": 0.0131,
"step": 848
},
{
"epoch": 8.0,
"eval_LOCATION_f1": 0.8157894736842106,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.775,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7341772151898734,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6987951807228916,
"eval_ORGANIZATION_recall": 0.7733333333333333,
"eval_PERSON_f1": 0.8754208754208753,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8441558441558441,
"eval_PERSON_recall": 0.9090909090909091,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.6779661016949152,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6060606060606061,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.21797136962413788,
"eval_overall_accuracy": 0.9582186639979985,
"eval_overall_f1": 0.8022284122562674,
"eval_overall_precision": 0.7598944591029023,
"eval_overall_recall": 0.8495575221238938,
"eval_runtime": 0.906,
"eval_samples_per_second": 206.4,
"eval_steps_per_second": 3.311,
"step": 848
},
{
"epoch": 9.0,
"grad_norm": 1.854614019393921,
"learning_rate": 4.55e-05,
"loss": 0.0091,
"step": 954
},
{
"epoch": 9.0,
"eval_LOCATION_f1": 0.8435374149659863,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8266666666666667,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.788235294117647,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7052631578947368,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.8837209302325583,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8417721518987342,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7777777777777779,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.26150327920913696,
"eval_overall_accuracy": 0.9589692269201902,
"eval_overall_f1": 0.8314917127071824,
"eval_overall_precision": 0.7818181818181819,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.9105,
"eval_samples_per_second": 205.388,
"eval_steps_per_second": 3.295,
"step": 954
},
{
"epoch": 10.0,
"grad_norm": 1.278331995010376,
"learning_rate": 4.5e-05,
"loss": 0.0099,
"step": 1060
},
{
"epoch": 10.0,
"eval_LOCATION_f1": 0.816326530612245,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7500000000000001,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7058823529411765,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.9183673469387755,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8940397350993378,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8214285714285715,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7666666666666667,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.24217499792575836,
"eval_overall_accuracy": 0.9619714786089567,
"eval_overall_f1": 0.8349788434414668,
"eval_overall_precision": 0.8,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.9185,
"eval_samples_per_second": 203.602,
"eval_steps_per_second": 3.266,
"step": 1060
},
{
"epoch": 11.0,
"grad_norm": 0.09772255271673203,
"learning_rate": 4.4500000000000004e-05,
"loss": 0.0059,
"step": 1166
},
{
"epoch": 11.0,
"eval_LOCATION_f1": 0.7972972972972973,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7763157894736842,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7619047619047621,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6881720430107527,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.907849829351536,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8866666666666667,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8518518518518519,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8214285714285714,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.2546893060207367,
"eval_overall_accuracy": 0.9589692269201902,
"eval_overall_f1": 0.8307692307692307,
"eval_overall_precision": 0.7898936170212766,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.9121,
"eval_samples_per_second": 205.026,
"eval_steps_per_second": 3.289,
"step": 1166
},
{
"epoch": 12.0,
"grad_norm": 0.023314962163567543,
"learning_rate": 4.4000000000000006e-05,
"loss": 0.0062,
"step": 1272
},
{
"epoch": 12.0,
"eval_LOCATION_f1": 0.7945205479452055,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7837837837837838,
"eval_LOCATION_recall": 0.8055555555555556,
"eval_ORGANIZATION_f1": 0.8074534161490684,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7558139534883721,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8829431438127091,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8461538461538461,
"eval_PERSON_recall": 0.9230769230769231,
"eval_QUANTITY_f1": 0.6538461538461539,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5862068965517241,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.2780083119869232,
"eval_overall_accuracy": 0.9602201651238429,
"eval_overall_f1": 0.8274894810659187,
"eval_overall_precision": 0.7887700534759359,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.9675,
"eval_samples_per_second": 193.282,
"eval_steps_per_second": 3.101,
"step": 1272
},
{
"epoch": 13.0,
"grad_norm": 3.4945220947265625,
"learning_rate": 4.35e-05,
"loss": 0.0037,
"step": 1378
},
{
"epoch": 13.0,
"eval_LOCATION_f1": 0.782051282051282,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7417218543046358,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7368421052631579,
"eval_ORGANIZATION_recall": 0.7466666666666667,
"eval_PERSON_f1": 0.9163879598662208,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8782051282051282,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.72,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8727272727272727,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8275862068965517,
"eval_TIME_recall": 0.9230769230769231,
"eval_loss": 0.2757226526737213,
"eval_overall_accuracy": 0.9627220415311484,
"eval_overall_f1": 0.8326300984528833,
"eval_overall_precision": 0.7956989247311828,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.9689,
"eval_samples_per_second": 193.003,
"eval_steps_per_second": 3.096,
"step": 1378
},
{
"epoch": 14.0,
"grad_norm": 0.025552373379468918,
"learning_rate": 4.3e-05,
"loss": 0.005,
"step": 1484
},
{
"epoch": 14.0,
"eval_LOCATION_f1": 0.8243243243243243,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8026315789473685,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7341772151898734,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6987951807228916,
"eval_ORGANIZATION_recall": 0.7733333333333333,
"eval_PERSON_f1": 0.9023569023569024,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8701298701298701,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7169811320754716,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6333333333333333,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.280028760433197,
"eval_overall_accuracy": 0.9594696022016512,
"eval_overall_f1": 0.8305084745762712,
"eval_overall_precision": 0.7967479674796748,
"eval_overall_recall": 0.8672566371681416,
"eval_runtime": 0.9073,
"eval_samples_per_second": 206.107,
"eval_steps_per_second": 3.307,
"step": 1484
},
{
"epoch": 15.0,
"grad_norm": 0.192918598651886,
"learning_rate": 4.25e-05,
"loss": 0.0058,
"step": 1590
},
{
"epoch": 15.0,
"eval_LOCATION_f1": 0.8356164383561645,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8243243243243243,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7784431137724551,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7065217391304348,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8963210702341137,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8589743589743589,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6666666666666666,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.64,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.8070175438596492,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7419354838709677,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.2716998755931854,
"eval_overall_accuracy": 0.9629722291718789,
"eval_overall_f1": 0.8340306834030684,
"eval_overall_precision": 0.791005291005291,
"eval_overall_recall": 0.8820058997050148,
"eval_runtime": 0.91,
"eval_samples_per_second": 205.503,
"eval_steps_per_second": 3.297,
"step": 1590
},
{
"epoch": 16.0,
"grad_norm": 0.09364385157823563,
"learning_rate": 4.2e-05,
"loss": 0.0046,
"step": 1696
},
{
"epoch": 16.0,
"eval_LOCATION_f1": 0.816326530612245,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.735632183908046,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6464646464646465,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.8993288590604027,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.864516129032258,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6545454545454547,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7931034482758621,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.71875,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.30642953515052795,
"eval_overall_accuracy": 0.9539654741055792,
"eval_overall_f1": 0.8169398907103824,
"eval_overall_precision": 0.7608142493638677,
"eval_overall_recall": 0.8820058997050148,
"eval_runtime": 0.9036,
"eval_samples_per_second": 206.952,
"eval_steps_per_second": 3.32,
"step": 1696
},
{
"epoch": 17.0,
"grad_norm": 4.5664825439453125,
"learning_rate": 4.15e-05,
"loss": 0.0063,
"step": 1802
},
{
"epoch": 17.0,
"eval_LOCATION_f1": 0.7763157894736842,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7375,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7922077922077922,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7721518987341772,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.8940397350993377,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8490566037735849,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.28576722741127014,
"eval_overall_accuracy": 0.9617212909682261,
"eval_overall_f1": 0.8263305322128851,
"eval_overall_precision": 0.7866666666666666,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.9045,
"eval_samples_per_second": 206.753,
"eval_steps_per_second": 3.317,
"step": 1802
},
{
"epoch": 18.0,
"grad_norm": 0.04714202508330345,
"learning_rate": 4.1e-05,
"loss": 0.0033,
"step": 1908
},
{
"epoch": 18.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7692307692307693,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.779874213836478,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7380952380952381,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.9006622516556291,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8553459119496856,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.9230769230769231,
"eval_loss": 0.30405738949775696,
"eval_overall_accuracy": 0.9619714786089567,
"eval_overall_f1": 0.8333333333333335,
"eval_overall_precision": 0.7874015748031497,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.903,
"eval_samples_per_second": 207.088,
"eval_steps_per_second": 3.322,
"step": 1908
},
{
"epoch": 19.0,
"grad_norm": 0.008477783761918545,
"learning_rate": 4.05e-05,
"loss": 0.0033,
"step": 2014
},
{
"epoch": 19.0,
"eval_LOCATION_f1": 0.8413793103448277,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8356164383561644,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.8101265822784811,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7710843373493976,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.8979591836734694,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8741721854304636,
"eval_PERSON_recall": 0.9230769230769231,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8148148148148148,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7857142857142857,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3013346493244171,
"eval_overall_accuracy": 0.960720540405304,
"eval_overall_f1": 0.844950213371266,
"eval_overall_precision": 0.8159340659340659,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.9229,
"eval_samples_per_second": 202.623,
"eval_steps_per_second": 3.251,
"step": 2014
},
{
"epoch": 20.0,
"grad_norm": 0.0049218675121665,
"learning_rate": 4e-05,
"loss": 0.0036,
"step": 2120
},
{
"epoch": 20.0,
"eval_LOCATION_f1": 0.8219178082191781,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8108108108108109,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.8,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7333333333333333,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.9023569023569024,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8701298701298701,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6538461538461539,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5862068965517241,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.2967695891857147,
"eval_overall_accuracy": 0.9609707280460346,
"eval_overall_f1": 0.8387096774193548,
"eval_overall_precision": 0.7994652406417112,
"eval_overall_recall": 0.8820058997050148,
"eval_runtime": 0.9818,
"eval_samples_per_second": 190.457,
"eval_steps_per_second": 3.055,
"step": 2120
},
{
"epoch": 21.0,
"grad_norm": 0.03995713219046593,
"learning_rate": 3.9500000000000005e-05,
"loss": 0.0038,
"step": 2226
},
{
"epoch": 21.0,
"eval_LOCATION_f1": 0.7625899280575541,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7910447761194029,
"eval_LOCATION_recall": 0.7361111111111112,
"eval_ORGANIZATION_f1": 0.7374999999999999,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6941176470588235,
"eval_ORGANIZATION_recall": 0.7866666666666666,
"eval_PERSON_f1": 0.9047619047619047,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8807947019867549,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.2894110381603241,
"eval_overall_accuracy": 0.9577182887165374,
"eval_overall_f1": 0.8177905308464849,
"eval_overall_precision": 0.7960893854748603,
"eval_overall_recall": 0.8407079646017699,
"eval_runtime": 0.9338,
"eval_samples_per_second": 200.266,
"eval_steps_per_second": 3.213,
"step": 2226
},
{
"epoch": 22.0,
"grad_norm": 0.001287546823732555,
"learning_rate": 3.9000000000000006e-05,
"loss": 0.004,
"step": 2332
},
{
"epoch": 22.0,
"eval_LOCATION_f1": 0.8266666666666667,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7051282051282051,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6790123456790124,
"eval_ORGANIZATION_recall": 0.7333333333333333,
"eval_PERSON_f1": 0.8986486486486487,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.869281045751634,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.29990673065185547,
"eval_overall_accuracy": 0.9554665999499625,
"eval_overall_f1": 0.8203677510608203,
"eval_overall_precision": 0.7880434782608695,
"eval_overall_recall": 0.855457227138643,
"eval_runtime": 0.9065,
"eval_samples_per_second": 206.288,
"eval_steps_per_second": 3.309,
"step": 2332
},
{
"epoch": 23.0,
"grad_norm": 0.01974656991660595,
"learning_rate": 3.85e-05,
"loss": 0.003,
"step": 2438
},
{
"epoch": 23.0,
"eval_LOCATION_f1": 0.8211920529801324,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8074534161490684,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7558139534883721,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.9084745762711864,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.881578947368421,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3059156537055969,
"eval_overall_accuracy": 0.9622216662496873,
"eval_overall_f1": 0.8443197755960731,
"eval_overall_precision": 0.8048128342245989,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.9125,
"eval_samples_per_second": 204.922,
"eval_steps_per_second": 3.288,
"step": 2438
},
{
"epoch": 24.0,
"grad_norm": 2.60111141204834,
"learning_rate": 3.8e-05,
"loss": 0.0038,
"step": 2544
},
{
"epoch": 24.0,
"eval_LOCATION_f1": 0.8133333333333332,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.782051282051282,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7471264367816093,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6565656565656566,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.9152542372881356,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8881578947368421,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3071446716785431,
"eval_overall_accuracy": 0.9582186639979985,
"eval_overall_f1": 0.828060522696011,
"eval_overall_precision": 0.7757731958762887,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.9115,
"eval_samples_per_second": 205.145,
"eval_steps_per_second": 3.291,
"step": 2544
},
{
"epoch": 25.0,
"grad_norm": 5.347325801849365,
"learning_rate": 3.7500000000000003e-05,
"loss": 0.0039,
"step": 2650
},
{
"epoch": 25.0,
"eval_LOCATION_f1": 0.7792207792207793,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7317073170731707,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.729559748427673,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6904761904761905,
"eval_ORGANIZATION_recall": 0.7733333333333333,
"eval_PERSON_f1": 0.8993288590604027,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.864516129032258,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8148148148148148,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7857142857142857,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3066267967224121,
"eval_overall_accuracy": 0.9572179134350763,
"eval_overall_f1": 0.8133704735376045,
"eval_overall_precision": 0.7704485488126649,
"eval_overall_recall": 0.8613569321533924,
"eval_runtime": 0.909,
"eval_samples_per_second": 205.719,
"eval_steps_per_second": 3.3,
"step": 2650
},
{
"epoch": 26.0,
"grad_norm": 0.00547376973554492,
"learning_rate": 3.7e-05,
"loss": 0.0031,
"step": 2756
},
{
"epoch": 26.0,
"eval_LOCATION_f1": 0.8137931034482759,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8082191780821918,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7701863354037267,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7209302325581395,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8837209302325583,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8417721518987342,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8679245283018868,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8518518518518519,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.3245824873447418,
"eval_overall_accuracy": 0.9597197898423818,
"eval_overall_f1": 0.8286516853932584,
"eval_overall_precision": 0.7908847184986595,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.9241,
"eval_samples_per_second": 202.35,
"eval_steps_per_second": 3.246,
"step": 2756
},
{
"epoch": 27.0,
"grad_norm": 0.009228230454027653,
"learning_rate": 3.65e-05,
"loss": 0.0026,
"step": 2862
},
{
"epoch": 27.0,
"eval_LOCATION_f1": 0.8219178082191781,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8108108108108109,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7407407407407408,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6896551724137931,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.903654485049834,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8607594936708861,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.7169811320754716,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6333333333333333,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8518518518518519,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8214285714285714,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.32465118169784546,
"eval_overall_accuracy": 0.9584688516387291,
"eval_overall_f1": 0.8324022346368715,
"eval_overall_precision": 0.7904509283819628,
"eval_overall_recall": 0.8790560471976401,
"eval_runtime": 0.8984,
"eval_samples_per_second": 208.15,
"eval_steps_per_second": 3.339,
"step": 2862
},
{
"epoch": 28.0,
"grad_norm": 3.7562034130096436,
"learning_rate": 3.6e-05,
"loss": 0.0041,
"step": 2968
},
{
"epoch": 28.0,
"eval_LOCATION_f1": 0.8082191780821918,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7972972972972973,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7469879518072289,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6813186813186813,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.9084745762711864,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.881578947368421,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3042037785053253,
"eval_overall_accuracy": 0.9592194145609206,
"eval_overall_f1": 0.8286516853932584,
"eval_overall_precision": 0.7908847184986595,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.9162,
"eval_samples_per_second": 204.094,
"eval_steps_per_second": 3.274,
"step": 2968
},
{
"epoch": 29.0,
"grad_norm": 5.308003902435303,
"learning_rate": 3.55e-05,
"loss": 0.0034,
"step": 3074
},
{
"epoch": 29.0,
"eval_LOCATION_f1": 0.8413793103448277,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8356164383561644,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7975460122699386,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7386363636363636,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.9146757679180888,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8933333333333333,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3232886493206024,
"eval_overall_accuracy": 0.9609707280460346,
"eval_overall_f1": 0.851063829787234,
"eval_overall_precision": 0.819672131147541,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.9849,
"eval_samples_per_second": 189.867,
"eval_steps_per_second": 3.046,
"step": 3074
},
{
"epoch": 30.0,
"grad_norm": 0.0021002369467169046,
"learning_rate": 3.5e-05,
"loss": 0.0027,
"step": 3180
},
{
"epoch": 30.0,
"eval_LOCATION_f1": 0.8356164383561645,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8243243243243243,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.732919254658385,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.686046511627907,
"eval_ORGANIZATION_recall": 0.7866666666666666,
"eval_PERSON_f1": 0.9121621621621621,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8823529411764706,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7272727272727273,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.625,
"eval_QUANTITY_recall": 0.8695652173913043,
"eval_TIME_f1": 0.7586206896551724,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6875,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.34255892038345337,
"eval_overall_accuracy": 0.9577182887165374,
"eval_overall_f1": 0.8296089385474861,
"eval_overall_precision": 0.7877984084880637,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.9051,
"eval_samples_per_second": 206.618,
"eval_steps_per_second": 3.315,
"step": 3180
},
{
"epoch": 31.0,
"grad_norm": 0.00587083725258708,
"learning_rate": 3.45e-05,
"loss": 0.0049,
"step": 3286
},
{
"epoch": 31.0,
"eval_LOCATION_f1": 0.8219178082191781,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8108108108108109,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7305389221556886,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6630434782608695,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.9152542372881356,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8881578947368421,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.31757453083992004,
"eval_overall_accuracy": 0.9584688516387291,
"eval_overall_f1": 0.8314606741573034,
"eval_overall_precision": 0.7935656836461126,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.9036,
"eval_samples_per_second": 206.959,
"eval_steps_per_second": 3.32,
"step": 3286
},
{
"epoch": 32.0,
"grad_norm": 0.03227420523762703,
"learning_rate": 3.4000000000000007e-05,
"loss": 0.0027,
"step": 3392
},
{
"epoch": 32.0,
"eval_LOCATION_f1": 0.8243243243243243,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8026315789473685,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7625,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7176470588235294,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.9215017064846417,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.9,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7083333333333334,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.68,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8846153846153846,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8846153846153846,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.29548466205596924,
"eval_overall_accuracy": 0.9627220415311484,
"eval_overall_f1": 0.8473609129814551,
"eval_overall_precision": 0.8204419889502762,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.9155,
"eval_samples_per_second": 204.26,
"eval_steps_per_second": 3.277,
"step": 3392
},
{
"epoch": 33.0,
"grad_norm": 0.016770539805293083,
"learning_rate": 3.35e-05,
"loss": 0.0017,
"step": 3498
},
{
"epoch": 33.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7692307692307693,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7974683544303797,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7590361445783133,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.9054054054054055,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8758169934640523,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5806451612903226,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3393411338329315,
"eval_overall_accuracy": 0.9592194145609206,
"eval_overall_f1": 0.8354430379746836,
"eval_overall_precision": 0.7983870967741935,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.9082,
"eval_samples_per_second": 205.908,
"eval_steps_per_second": 3.303,
"step": 3498
},
{
"epoch": 34.0,
"grad_norm": 0.003996172454208136,
"learning_rate": 3.3e-05,
"loss": 0.0017,
"step": 3604
},
{
"epoch": 34.0,
"eval_LOCATION_f1": 0.8243243243243243,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8026315789473685,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.8227848101265823,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7831325301204819,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.910958904109589,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8926174496644296,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.7555555555555555,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.7727272727272727,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3279131352901459,
"eval_overall_accuracy": 0.9644733550162622,
"eval_overall_f1": 0.8575539568345324,
"eval_overall_precision": 0.8370786516853933,
"eval_overall_recall": 0.8790560471976401,
"eval_runtime": 0.9098,
"eval_samples_per_second": 205.55,
"eval_steps_per_second": 3.298,
"step": 3604
},
{
"epoch": 35.0,
"grad_norm": 0.0200356375426054,
"learning_rate": 3.2500000000000004e-05,
"loss": 0.002,
"step": 3710
},
{
"epoch": 35.0,
"eval_LOCATION_f1": 0.8108108108108109,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7894736842105263,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.8,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7333333333333333,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.9016949152542374,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.875,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.33025962114334106,
"eval_overall_accuracy": 0.9597197898423818,
"eval_overall_f1": 0.8398876404494382,
"eval_overall_precision": 0.8016085790884718,
"eval_overall_recall": 0.8820058997050148,
"eval_runtime": 0.9088,
"eval_samples_per_second": 205.758,
"eval_steps_per_second": 3.301,
"step": 3710
},
{
"epoch": 36.0,
"grad_norm": 0.04783305525779724,
"learning_rate": 3.2000000000000005e-05,
"loss": 0.0012,
"step": 3816
},
{
"epoch": 36.0,
"eval_LOCATION_f1": 0.8344370860927153,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7974683544303798,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.7875000000000001,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7411764705882353,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.9010238907849829,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.88,
"eval_PERSON_recall": 0.9230769230769231,
"eval_QUANTITY_f1": 0.72,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.33322834968566895,
"eval_overall_accuracy": 0.9637227920940705,
"eval_overall_f1": 0.8441926345609065,
"eval_overall_precision": 0.8119891008174387,
"eval_overall_recall": 0.8790560471976401,
"eval_runtime": 0.9959,
"eval_samples_per_second": 187.774,
"eval_steps_per_second": 3.012,
"step": 3816
},
{
"epoch": 37.0,
"grad_norm": 0.0011351928114891052,
"learning_rate": 3.15e-05,
"loss": 0.001,
"step": 3922
},
{
"epoch": 37.0,
"eval_LOCATION_f1": 0.816326530612245,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7710843373493976,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7032967032967034,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.910958904109589,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8926174496644296,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.72,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8235294117647058,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.84,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.33810704946517944,
"eval_overall_accuracy": 0.9604703527645734,
"eval_overall_f1": 0.8385269121813032,
"eval_overall_precision": 0.8065395095367848,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.9038,
"eval_samples_per_second": 206.905,
"eval_steps_per_second": 3.319,
"step": 3922
},
{
"epoch": 38.0,
"grad_norm": 12.923250198364258,
"learning_rate": 3.1e-05,
"loss": 0.0021,
"step": 4028
},
{
"epoch": 38.0,
"eval_LOCATION_f1": 0.816326530612245,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7721518987341773,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7349397590361446,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.9158249158249158,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8831168831168831,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3416782021522522,
"eval_overall_accuracy": 0.960720540405304,
"eval_overall_f1": 0.8425531914893618,
"eval_overall_precision": 0.8114754098360656,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.9052,
"eval_samples_per_second": 206.591,
"eval_steps_per_second": 3.314,
"step": 4028
},
{
"epoch": 39.0,
"grad_norm": 0.05247601494193077,
"learning_rate": 3.05e-05,
"loss": 0.0026,
"step": 4134
},
{
"epoch": 39.0,
"eval_LOCATION_f1": 0.7891156462585034,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7733333333333333,
"eval_LOCATION_recall": 0.8055555555555556,
"eval_ORGANIZATION_f1": 0.7974683544303797,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7590361445783133,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.8963210702341137,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8589743589743589,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7169811320754716,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6333333333333333,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.37723416090011597,
"eval_overall_accuracy": 0.9587190392794596,
"eval_overall_f1": 0.8338028169014085,
"eval_overall_precision": 0.7978436657681941,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.9093,
"eval_samples_per_second": 205.644,
"eval_steps_per_second": 3.299,
"step": 4134
},
{
"epoch": 40.0,
"grad_norm": 0.0038078853394836187,
"learning_rate": 3e-05,
"loss": 0.0021,
"step": 4240
},
{
"epoch": 40.0,
"eval_LOCATION_f1": 0.7891156462585034,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7733333333333333,
"eval_LOCATION_recall": 0.8055555555555556,
"eval_ORGANIZATION_f1": 0.7894736842105264,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7792207792207793,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.9146757679180888,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8933333333333333,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7272727272727272,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.7619047619047619,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.331974595785141,
"eval_overall_accuracy": 0.960720540405304,
"eval_overall_f1": 0.8393632416787264,
"eval_overall_precision": 0.8238636363636364,
"eval_overall_recall": 0.855457227138643,
"eval_runtime": 0.902,
"eval_samples_per_second": 207.323,
"eval_steps_per_second": 3.326,
"step": 4240
},
{
"epoch": 41.0,
"grad_norm": 0.0014568913029506803,
"learning_rate": 2.95e-05,
"loss": 0.0013,
"step": 4346
},
{
"epoch": 41.0,
"eval_LOCATION_f1": 0.8187919463087249,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7922077922077922,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7425149700598803,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6739130434782609,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.9090909090909092,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8766233766233766,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.76,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.7037037037037037,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8627450980392156,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.88,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3371780812740326,
"eval_overall_accuracy": 0.9619714786089567,
"eval_overall_f1": 0.8375350140056023,
"eval_overall_precision": 0.7973333333333333,
"eval_overall_recall": 0.8820058997050148,
"eval_runtime": 0.9175,
"eval_samples_per_second": 203.81,
"eval_steps_per_second": 3.27,
"step": 4346
},
{
"epoch": 42.0,
"grad_norm": 0.01008665468543768,
"learning_rate": 2.9e-05,
"loss": 0.0013,
"step": 4452
},
{
"epoch": 42.0,
"eval_LOCATION_f1": 0.7837837837837838,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7631578947368421,
"eval_LOCATION_recall": 0.8055555555555556,
"eval_ORGANIZATION_f1": 0.779874213836478,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7380952380952381,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.9023569023569024,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8701298701298701,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.72,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8518518518518519,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8214285714285714,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.3549456298351288,
"eval_overall_accuracy": 0.9602201651238429,
"eval_overall_f1": 0.8333333333333334,
"eval_overall_precision": 0.7994579945799458,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.9061,
"eval_samples_per_second": 206.389,
"eval_steps_per_second": 3.311,
"step": 4452
},
{
"epoch": 43.0,
"grad_norm": 0.0012029644567519426,
"learning_rate": 2.8499999999999998e-05,
"loss": 0.0003,
"step": 4558
},
{
"epoch": 43.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7682926829268292,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7078651685393258,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.9060402684563759,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8709677419354839,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8846153846153846,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8846153846153846,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.36216506361961365,
"eval_overall_accuracy": 0.9604703527645734,
"eval_overall_f1": 0.836111111111111,
"eval_overall_precision": 0.7900262467191601,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.9049,
"eval_samples_per_second": 206.658,
"eval_steps_per_second": 3.315,
"step": 4558
},
{
"epoch": 44.0,
"grad_norm": 0.04154082387685776,
"learning_rate": 2.8000000000000003e-05,
"loss": 0.0032,
"step": 4664
},
{
"epoch": 44.0,
"eval_LOCATION_f1": 0.8026315789473685,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7619047619047621,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6881720430107527,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.9060402684563759,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8709677419354839,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7307692307692308,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6551724137931034,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8148148148148148,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7857142857142857,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.35855501890182495,
"eval_overall_accuracy": 0.957968476357268,
"eval_overall_f1": 0.8314917127071824,
"eval_overall_precision": 0.7818181818181819,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.9082,
"eval_samples_per_second": 205.905,
"eval_steps_per_second": 3.303,
"step": 4664
},
{
"epoch": 45.0,
"grad_norm": 0.002047579735517502,
"learning_rate": 2.7500000000000004e-05,
"loss": 0.001,
"step": 4770
},
{
"epoch": 45.0,
"eval_LOCATION_f1": 0.8133333333333332,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.782051282051282,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7950310559006211,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7441860465116279,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.9158249158249158,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8831168831168831,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.7307692307692308,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6551724137931034,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.36997854709625244,
"eval_overall_accuracy": 0.9619714786089567,
"eval_overall_f1": 0.847124824684432,
"eval_overall_precision": 0.8074866310160428,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.9062,
"eval_samples_per_second": 206.36,
"eval_steps_per_second": 3.311,
"step": 4770
},
{
"epoch": 46.0,
"grad_norm": 0.0037038603331893682,
"learning_rate": 2.7000000000000002e-05,
"loss": 0.0034,
"step": 4876
},
{
"epoch": 46.0,
"eval_LOCATION_f1": 0.8333333333333334,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8333333333333334,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7924528301886793,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.75,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.9121621621621621,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8823529411764706,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7307692307692308,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6551724137931034,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.33895859122276306,
"eval_overall_accuracy": 0.9602201651238429,
"eval_overall_f1": 0.8494318181818181,
"eval_overall_precision": 0.8191780821917808,
"eval_overall_recall": 0.8820058997050148,
"eval_runtime": 0.9121,
"eval_samples_per_second": 205.028,
"eval_steps_per_second": 3.289,
"step": 4876
},
{
"epoch": 47.0,
"grad_norm": 0.0005634190747514367,
"learning_rate": 2.6500000000000004e-05,
"loss": 0.0018,
"step": 4982
},
{
"epoch": 47.0,
"eval_LOCATION_f1": 0.8211920529801324,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7564102564102564,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7283950617283951,
"eval_ORGANIZATION_recall": 0.7866666666666666,
"eval_PERSON_f1": 0.9060402684563759,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8709677419354839,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.72,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3375060260295868,
"eval_overall_accuracy": 0.9632224168126094,
"eval_overall_f1": 0.8373408769448375,
"eval_overall_precision": 0.8043478260869565,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.9199,
"eval_samples_per_second": 203.274,
"eval_steps_per_second": 3.261,
"step": 4982
},
{
"epoch": 48.0,
"grad_norm": 0.0028315193485468626,
"learning_rate": 2.6000000000000002e-05,
"loss": 0.0017,
"step": 5088
},
{
"epoch": 48.0,
"eval_LOCATION_f1": 0.802721088435374,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7866666666666666,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7974683544303797,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7590361445783133,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.9183673469387755,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8940397350993378,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.72,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.33102044463157654,
"eval_overall_accuracy": 0.9632224168126094,
"eval_overall_f1": 0.8473609129814551,
"eval_overall_precision": 0.8204419889502762,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.9017,
"eval_samples_per_second": 207.378,
"eval_steps_per_second": 3.327,
"step": 5088
},
{
"epoch": 49.0,
"grad_norm": 0.009939000010490417,
"learning_rate": 2.5500000000000003e-05,
"loss": 0.0014,
"step": 5194
},
{
"epoch": 49.0,
"eval_LOCATION_f1": 0.8299319727891157,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8133333333333334,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.8074534161490684,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7558139534883721,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.9121621621621621,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8823529411764706,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7450980392156864,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6785714285714286,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8627450980392156,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.88,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.32123759388923645,
"eval_overall_accuracy": 0.9624718538904178,
"eval_overall_f1": 0.8555240793201133,
"eval_overall_precision": 0.8228882833787466,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.9187,
"eval_samples_per_second": 203.539,
"eval_steps_per_second": 3.265,
"step": 5194
},
{
"epoch": 50.0,
"grad_norm": 0.7588798403739929,
"learning_rate": 2.5e-05,
"loss": 0.0011,
"step": 5300
},
{
"epoch": 50.0,
"eval_LOCATION_f1": 0.802721088435374,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7866666666666666,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7924528301886793,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.75,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.9152542372881356,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8881578947368421,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.72,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8518518518518519,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8214285714285714,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.3109734356403351,
"eval_overall_accuracy": 0.9622216662496873,
"eval_overall_f1": 0.8453900709219858,
"eval_overall_precision": 0.8142076502732241,
"eval_overall_recall": 0.8790560471976401,
"eval_runtime": 0.9093,
"eval_samples_per_second": 205.655,
"eval_steps_per_second": 3.299,
"step": 5300
},
{
"epoch": 51.0,
"grad_norm": 0.0009810138726606965,
"learning_rate": 2.45e-05,
"loss": 0.0005,
"step": 5406
},
{
"epoch": 51.0,
"eval_LOCATION_f1": 0.8299319727891157,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8133333333333334,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.825,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7764705882352941,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.9246575342465754,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.9060402684563759,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8518518518518519,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8214285714285714,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.30816784501075745,
"eval_overall_accuracy": 0.9659744808606455,
"eval_overall_f1": 0.8607954545454546,
"eval_overall_precision": 0.8301369863013699,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.914,
"eval_samples_per_second": 204.601,
"eval_steps_per_second": 3.282,
"step": 5406
},
{
"epoch": 52.0,
"grad_norm": 0.0026644645258784294,
"learning_rate": 2.4e-05,
"loss": 0.0003,
"step": 5512
},
{
"epoch": 52.0,
"eval_LOCATION_f1": 0.8157894736842106,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.775,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8024691358024691,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7471264367816092,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.9183673469387755,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8940397350993378,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.693877551020408,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6538461538461539,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8518518518518519,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8214285714285714,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.3176332414150238,
"eval_overall_accuracy": 0.9647235426569928,
"eval_overall_f1": 0.849507735583685,
"eval_overall_precision": 0.8118279569892473,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.9767,
"eval_samples_per_second": 191.467,
"eval_steps_per_second": 3.072,
"step": 5512
},
{
"epoch": 53.0,
"grad_norm": 0.0603233277797699,
"learning_rate": 2.35e-05,
"loss": 0.0004,
"step": 5618
},
{
"epoch": 53.0,
"eval_LOCATION_f1": 0.8356164383561645,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8243243243243243,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.8121212121212122,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7444444444444445,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9215017064846417,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.9,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.68,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6296296296296297,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8518518518518519,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8214285714285714,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.3314068019390106,
"eval_overall_accuracy": 0.9647235426569928,
"eval_overall_f1": 0.8559322033898304,
"eval_overall_precision": 0.8211382113821138,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.9085,
"eval_samples_per_second": 205.826,
"eval_steps_per_second": 3.302,
"step": 5618
},
{
"epoch": 54.0,
"grad_norm": 0.00044817946036346257,
"learning_rate": 2.3000000000000003e-05,
"loss": 0.0002,
"step": 5724
},
{
"epoch": 54.0,
"eval_LOCATION_f1": 0.8211920529801324,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8050314465408804,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7619047619047619,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.925170068027211,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.9006622516556292,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.693877551020408,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6538461538461539,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8518518518518519,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8214285714285714,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.3241828978061676,
"eval_overall_accuracy": 0.9657242932199149,
"eval_overall_f1": 0.8543140028288544,
"eval_overall_precision": 0.8206521739130435,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.9117,
"eval_samples_per_second": 205.114,
"eval_steps_per_second": 3.291,
"step": 5724
},
{
"epoch": 55.0,
"grad_norm": 0.0010649035684764385,
"learning_rate": 2.25e-05,
"loss": 0.0005,
"step": 5830
},
{
"epoch": 55.0,
"eval_LOCATION_f1": 0.8289473684210527,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7875,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.7875000000000001,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7411764705882353,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.9220338983050849,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8947368421052632,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.68,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6296296296296297,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8518518518518519,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8214285714285714,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.33954718708992004,
"eval_overall_accuracy": 0.9627220415311484,
"eval_overall_f1": 0.849507735583685,
"eval_overall_precision": 0.8118279569892473,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.9361,
"eval_samples_per_second": 199.766,
"eval_steps_per_second": 3.205,
"step": 5830
},
{
"epoch": 56.0,
"grad_norm": 0.0006854601670056581,
"learning_rate": 2.2000000000000003e-05,
"loss": 0.0001,
"step": 5936
},
{
"epoch": 56.0,
"eval_LOCATION_f1": 0.8289473684210527,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7875,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.7826086956521738,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7325581395348837,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.925170068027211,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.9006622516556292,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.7083333333333334,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.68,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8518518518518519,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8214285714285714,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.3326149582862854,
"eval_overall_accuracy": 0.9647235426569928,
"eval_overall_f1": 0.8519040902679831,
"eval_overall_precision": 0.8162162162162162,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.9055,
"eval_samples_per_second": 206.509,
"eval_steps_per_second": 3.313,
"step": 5936
},
{
"epoch": 57.0,
"grad_norm": 0.0004171407490503043,
"learning_rate": 2.15e-05,
"loss": 0.0008,
"step": 6042
},
{
"epoch": 57.0,
"eval_LOCATION_f1": 0.8211920529801324,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7950310559006211,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7441860465116279,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.9090909090909092,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8766233766233766,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.68,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6296296296296297,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8679245283018868,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8518518518518519,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.3388373553752899,
"eval_overall_accuracy": 0.9639729797348011,
"eval_overall_f1": 0.8455056179775281,
"eval_overall_precision": 0.806970509383378,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.9161,
"eval_samples_per_second": 204.134,
"eval_steps_per_second": 3.275,
"step": 6042
},
{
"epoch": 58.0,
"grad_norm": 0.000792400271166116,
"learning_rate": 2.1e-05,
"loss": 0.0005,
"step": 6148
},
{
"epoch": 58.0,
"eval_LOCATION_f1": 0.8344370860927153,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7974683544303798,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.8121212121212122,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7444444444444445,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.8993288590604027,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.864516129032258,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.693877551020408,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6538461538461539,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8518518518518519,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8214285714285714,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.3484926223754883,
"eval_overall_accuracy": 0.9622216662496873,
"eval_overall_f1": 0.8479776847977685,
"eval_overall_precision": 0.8042328042328042,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.9061,
"eval_samples_per_second": 206.382,
"eval_steps_per_second": 3.311,
"step": 6148
},
{
"epoch": 59.0,
"grad_norm": 0.0005213640397414565,
"learning_rate": 2.05e-05,
"loss": 0.0004,
"step": 6254
},
{
"epoch": 59.0,
"eval_LOCATION_f1": 0.8211920529801324,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7950310559006211,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7441860465116279,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.9215017064846417,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.9,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6666666666666666,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6071428571428571,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8627450980392156,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.88,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.34474921226501465,
"eval_overall_accuracy": 0.9627220415311484,
"eval_overall_f1": 0.8486562942008488,
"eval_overall_precision": 0.8152173913043478,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.9086,
"eval_samples_per_second": 205.807,
"eval_steps_per_second": 3.302,
"step": 6254
},
{
"epoch": 60.0,
"grad_norm": 0.0031596734188497066,
"learning_rate": 2e-05,
"loss": 0.0017,
"step": 6360
},
{
"epoch": 60.0,
"eval_LOCATION_f1": 0.8289473684210527,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7875,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.783625730994152,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6979166666666666,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.8993288590604027,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.864516129032258,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5806451612903226,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3943552076816559,
"eval_overall_accuracy": 0.9559669752314236,
"eval_overall_f1": 0.8363136176066025,
"eval_overall_precision": 0.7835051546391752,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.9068,
"eval_samples_per_second": 206.222,
"eval_steps_per_second": 3.308,
"step": 6360
},
{
"epoch": 61.0,
"grad_norm": 0.0038910319563001394,
"learning_rate": 1.9500000000000003e-05,
"loss": 0.0002,
"step": 6466
},
{
"epoch": 61.0,
"eval_LOCATION_f1": 0.8322147651006712,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8051948051948052,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7333333333333333,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.8963210702341137,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8589743589743589,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7346938775510203,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.38600656390190125,
"eval_overall_accuracy": 0.9599699774831123,
"eval_overall_f1": 0.8447552447552448,
"eval_overall_precision": 0.8031914893617021,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.9064,
"eval_samples_per_second": 206.303,
"eval_steps_per_second": 3.31,
"step": 6466
},
{
"epoch": 62.0,
"grad_norm": 0.008979488164186478,
"learning_rate": 1.9e-05,
"loss": 0.0001,
"step": 6572
},
{
"epoch": 62.0,
"eval_LOCATION_f1": 0.8187919463087249,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7922077922077922,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.8176100628930819,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7738095238095238,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.9047619047619047,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8807947019867549,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.7083333333333334,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.68,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3512948453426361,
"eval_overall_accuracy": 0.9629722291718789,
"eval_overall_f1": 0.8477951635846371,
"eval_overall_precision": 0.8186813186813187,
"eval_overall_recall": 0.8790560471976401,
"eval_runtime": 0.9032,
"eval_samples_per_second": 207.035,
"eval_steps_per_second": 3.321,
"step": 6572
},
{
"epoch": 63.0,
"grad_norm": 0.00276816263794899,
"learning_rate": 1.85e-05,
"loss": 0.0013,
"step": 6678
},
{
"epoch": 63.0,
"eval_LOCATION_f1": 0.8289473684210527,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7875,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.7904191616766466,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.717391304347826,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.9060402684563759,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8709677419354839,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7083333333333334,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.68,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3540952205657959,
"eval_overall_accuracy": 0.9629722291718789,
"eval_overall_f1": 0.8440111420612812,
"eval_overall_precision": 0.7994722955145118,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.9089,
"eval_samples_per_second": 205.74,
"eval_steps_per_second": 3.301,
"step": 6678
},
{
"epoch": 64.0,
"grad_norm": 0.010789873078465462,
"learning_rate": 1.8e-05,
"loss": 0.0007,
"step": 6784
},
{
"epoch": 64.0,
"eval_LOCATION_f1": 0.779874213836478,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7126436781609196,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7848101265822784,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7469879518072289,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.9090909090909092,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8766233766233766,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8518518518518519,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8214285714285714,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.34456735849380493,
"eval_overall_accuracy": 0.9619714786089567,
"eval_overall_f1": 0.8344923504867873,
"eval_overall_precision": 0.7894736842105263,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.9096,
"eval_samples_per_second": 205.587,
"eval_steps_per_second": 3.298,
"step": 6784
},
{
"epoch": 65.0,
"grad_norm": 0.0003090931277256459,
"learning_rate": 1.75e-05,
"loss": 0.0008,
"step": 6890
},
{
"epoch": 65.0,
"eval_LOCATION_f1": 0.8181818181818181,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7682926829268293,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.782051282051282,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7530864197530864,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.9084745762711864,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.881578947368421,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7346938775510203,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3443866968154907,
"eval_overall_accuracy": 0.9629722291718789,
"eval_overall_f1": 0.8429985855728431,
"eval_overall_precision": 0.8097826086956522,
"eval_overall_recall": 0.8790560471976401,
"eval_runtime": 0.906,
"eval_samples_per_second": 206.397,
"eval_steps_per_second": 3.311,
"step": 6890
},
{
"epoch": 66.0,
"grad_norm": 0.008000018075108528,
"learning_rate": 1.7000000000000003e-05,
"loss": 0.0007,
"step": 6996
},
{
"epoch": 66.0,
"eval_LOCATION_f1": 0.823529411764706,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7777777777777778,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.7564102564102564,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7283950617283951,
"eval_ORGANIZATION_recall": 0.7866666666666666,
"eval_PERSON_f1": 0.9121621621621621,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8823529411764706,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7083333333333334,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.68,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3399989902973175,
"eval_overall_accuracy": 0.9627220415311484,
"eval_overall_f1": 0.8385269121813032,
"eval_overall_precision": 0.8065395095367848,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.9215,
"eval_samples_per_second": 202.925,
"eval_steps_per_second": 3.255,
"step": 6996
},
{
"epoch": 67.0,
"grad_norm": 0.00037926252116449177,
"learning_rate": 1.65e-05,
"loss": 0.0004,
"step": 7102
},
{
"epoch": 67.0,
"eval_LOCATION_f1": 0.8289473684210527,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7875,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.8148148148148148,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7586206896551724,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.9090909090909092,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8766233766233766,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7499999999999999,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.72,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3691372275352478,
"eval_overall_accuracy": 0.96347260445334,
"eval_overall_f1": 0.853932584269663,
"eval_overall_precision": 0.8150134048257373,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.9131,
"eval_samples_per_second": 204.802,
"eval_steps_per_second": 3.286,
"step": 7102
},
{
"epoch": 68.0,
"grad_norm": 0.0003724870621226728,
"learning_rate": 1.6000000000000003e-05,
"loss": 0.0012,
"step": 7208
},
{
"epoch": 68.0,
"eval_LOCATION_f1": 0.8322147651006712,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8051948051948052,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8280254777070064,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7926829268292683,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.9121621621621621,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8823529411764706,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7083333333333334,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.68,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8627450980392156,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.88,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.33306267857551575,
"eval_overall_accuracy": 0.9654741055791843,
"eval_overall_f1": 0.8587731811697574,
"eval_overall_precision": 0.8314917127071824,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.9838,
"eval_samples_per_second": 190.074,
"eval_steps_per_second": 3.049,
"step": 7208
},
{
"epoch": 69.0,
"grad_norm": 0.0002074290969176218,
"learning_rate": 1.55e-05,
"loss": 0.0003,
"step": 7314
},
{
"epoch": 69.0,
"eval_LOCATION_f1": 0.8344370860927153,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7974683544303798,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.8170731707317072,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7528089887640449,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9054054054054055,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8758169934640523,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7499999999999999,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.72,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.373975545167923,
"eval_overall_accuracy": 0.96347260445334,
"eval_overall_f1": 0.8551336146272857,
"eval_overall_precision": 0.8172043010752689,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.9156,
"eval_samples_per_second": 204.238,
"eval_steps_per_second": 3.277,
"step": 7314
},
{
"epoch": 70.0,
"grad_norm": 0.00042664690408855677,
"learning_rate": 1.5e-05,
"loss": 0.0001,
"step": 7420
},
{
"epoch": 70.0,
"eval_LOCATION_f1": 0.8211920529801324,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8025477707006369,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7682926829268293,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.9054054054054055,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8758169934640523,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7499999999999999,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.72,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.37100422382354736,
"eval_overall_accuracy": 0.96347260445334,
"eval_overall_f1": 0.8494318181818181,
"eval_overall_precision": 0.8191780821917808,
"eval_overall_recall": 0.8820058997050148,
"eval_runtime": 0.9101,
"eval_samples_per_second": 205.482,
"eval_steps_per_second": 3.297,
"step": 7420
},
{
"epoch": 71.0,
"grad_norm": 0.0007093641324900091,
"learning_rate": 1.45e-05,
"loss": 0.0002,
"step": 7526
},
{
"epoch": 71.0,
"eval_LOCATION_f1": 0.8266666666666667,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8101265822784811,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7710843373493976,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.91156462585034,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8874172185430463,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7083333333333334,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.68,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3477381467819214,
"eval_overall_accuracy": 0.9647235426569928,
"eval_overall_f1": 0.8518518518518517,
"eval_overall_precision": 0.8236914600550964,
"eval_overall_recall": 0.8820058997050148,
"eval_runtime": 0.9072,
"eval_samples_per_second": 206.129,
"eval_steps_per_second": 3.307,
"step": 7526
},
{
"epoch": 72.0,
"grad_norm": 0.00021990617096889764,
"learning_rate": 1.4000000000000001e-05,
"loss": 0.0002,
"step": 7632
},
{
"epoch": 72.0,
"eval_LOCATION_f1": 0.823529411764706,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7777777777777778,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.7950310559006211,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7441860465116279,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.9084745762711864,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.881578947368421,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7499999999999999,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.72,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.36287015676498413,
"eval_overall_accuracy": 0.9642231673755316,
"eval_overall_f1": 0.8478873239436621,
"eval_overall_precision": 0.8113207547169812,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.9141,
"eval_samples_per_second": 204.572,
"eval_steps_per_second": 3.282,
"step": 7632
},
{
"epoch": 73.0,
"grad_norm": 0.00021961626771371812,
"learning_rate": 1.3500000000000001e-05,
"loss": 0.0002,
"step": 7738
},
{
"epoch": 73.0,
"eval_LOCATION_f1": 0.8181818181818181,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7682926829268293,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.7643312101910827,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7317073170731707,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.91156462585034,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8874172185430463,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7499999999999999,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.72,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3637426495552063,
"eval_overall_accuracy": 0.9639729797348011,
"eval_overall_f1": 0.8413597733711049,
"eval_overall_precision": 0.8092643051771117,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.909,
"eval_samples_per_second": 205.714,
"eval_steps_per_second": 3.3,
"step": 7738
},
{
"epoch": 74.0,
"grad_norm": 0.00018741752137430012,
"learning_rate": 1.3000000000000001e-05,
"loss": 0.0001,
"step": 7844
},
{
"epoch": 74.0,
"eval_LOCATION_f1": 0.8181818181818181,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7682926829268293,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.751592356687898,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7195121951219512,
"eval_ORGANIZATION_recall": 0.7866666666666666,
"eval_PERSON_f1": 0.9047619047619047,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8807947019867549,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.7499999999999999,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.72,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3637796938419342,
"eval_overall_accuracy": 0.9632224168126094,
"eval_overall_f1": 0.8356940509915013,
"eval_overall_precision": 0.8038147138964578,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.9145,
"eval_samples_per_second": 204.477,
"eval_steps_per_second": 3.28,
"step": 7844
},
{
"epoch": 75.0,
"grad_norm": 0.0007877243915572762,
"learning_rate": 1.25e-05,
"loss": 0.0001,
"step": 7950
},
{
"epoch": 75.0,
"eval_LOCATION_f1": 0.8289473684210527,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7875,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.7919463087248321,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7972972972972973,
"eval_ORGANIZATION_recall": 0.7866666666666666,
"eval_PERSON_f1": 0.9084745762711864,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.881578947368421,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7499999999999999,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.72,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3778810501098633,
"eval_overall_accuracy": 0.9649737302977233,
"eval_overall_f1": 0.8493543758967002,
"eval_overall_precision": 0.8268156424581006,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.9077,
"eval_samples_per_second": 206.004,
"eval_steps_per_second": 3.305,
"step": 7950
},
{
"epoch": 76.0,
"grad_norm": 0.005742947105318308,
"learning_rate": 1.2e-05,
"loss": 0.0001,
"step": 8056
},
{
"epoch": 76.0,
"eval_LOCATION_f1": 0.8289473684210527,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7875,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.7894736842105264,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7792207792207793,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.9054054054054055,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8758169934640523,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7346938775510203,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3797122836112976,
"eval_overall_accuracy": 0.9644733550162622,
"eval_overall_f1": 0.8461538461538463,
"eval_overall_precision": 0.8181818181818182,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.9011,
"eval_samples_per_second": 207.522,
"eval_steps_per_second": 3.329,
"step": 8056
},
{
"epoch": 77.0,
"grad_norm": 0.00030839102691970766,
"learning_rate": 1.1500000000000002e-05,
"loss": 0.0004,
"step": 8162
},
{
"epoch": 77.0,
"eval_LOCATION_f1": 0.8344370860927153,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7974683544303798,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.8024691358024691,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7471264367816092,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8963210702341137,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8589743589743589,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.76,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.7037037037037037,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.40759775042533875,
"eval_overall_accuracy": 0.9614711033274956,
"eval_overall_f1": 0.8475524475524475,
"eval_overall_precision": 0.8058510638297872,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.9103,
"eval_samples_per_second": 205.428,
"eval_steps_per_second": 3.296,
"step": 8162
},
{
"epoch": 78.0,
"grad_norm": 0.00025188998552039266,
"learning_rate": 1.1000000000000001e-05,
"loss": 0.0005,
"step": 8268
},
{
"epoch": 78.0,
"eval_LOCATION_f1": 0.8400000000000001,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8076923076923077,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.7950310559006211,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7441860465116279,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.8993288590604027,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.864516129032258,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7346938775510203,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8679245283018868,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8518518518518519,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.39274299144744873,
"eval_overall_accuracy": 0.9624718538904178,
"eval_overall_f1": 0.849507735583685,
"eval_overall_precision": 0.8118279569892473,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.9103,
"eval_samples_per_second": 205.436,
"eval_steps_per_second": 3.296,
"step": 8268
},
{
"epoch": 79.0,
"grad_norm": 0.00023670213704463094,
"learning_rate": 1.05e-05,
"loss": 0.0003,
"step": 8374
},
{
"epoch": 79.0,
"eval_LOCATION_f1": 0.823529411764706,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7777777777777778,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.7468354430379747,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7108433734939759,
"eval_ORGANIZATION_recall": 0.7866666666666666,
"eval_PERSON_f1": 0.9023569023569024,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8701298701298701,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7450980392156864,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6785714285714286,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8148148148148148,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7857142857142857,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.4000164866447449,
"eval_overall_accuracy": 0.960720540405304,
"eval_overall_f1": 0.8330995792426367,
"eval_overall_precision": 0.7941176470588235,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.9149,
"eval_samples_per_second": 204.395,
"eval_steps_per_second": 3.279,
"step": 8374
},
{
"epoch": 80.0,
"grad_norm": 0.000326380948536098,
"learning_rate": 1e-05,
"loss": 0.0001,
"step": 8480
},
{
"epoch": 80.0,
"eval_LOCATION_f1": 0.8266666666666667,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7483870967741936,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.725,
"eval_ORGANIZATION_recall": 0.7733333333333333,
"eval_PERSON_f1": 0.9084745762711864,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.881578947368421,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7499999999999999,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.72,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8679245283018868,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8518518518518519,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.3888261020183563,
"eval_overall_accuracy": 0.9629722291718789,
"eval_overall_f1": 0.8416547788873039,
"eval_overall_precision": 0.8149171270718232,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.9033,
"eval_samples_per_second": 207.02,
"eval_steps_per_second": 3.321,
"step": 8480
},
{
"epoch": 81.0,
"grad_norm": 0.0005148330819793046,
"learning_rate": 9.5e-06,
"loss": 0.0001,
"step": 8586
},
{
"epoch": 81.0,
"eval_LOCATION_f1": 0.8211920529801324,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7643312101910827,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7317073170731707,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8993288590604027,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.864516129032258,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.72,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8518518518518519,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8214285714285714,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.3981935977935791,
"eval_overall_accuracy": 0.9614711033274956,
"eval_overall_f1": 0.836619718309859,
"eval_overall_precision": 0.8005390835579514,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.9078,
"eval_samples_per_second": 205.981,
"eval_steps_per_second": 3.305,
"step": 8586
},
{
"epoch": 82.0,
"grad_norm": 0.0001784728665370494,
"learning_rate": 9e-06,
"loss": 0.0003,
"step": 8692
},
{
"epoch": 82.0,
"eval_LOCATION_f1": 0.8378378378378377,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8157894736842105,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7870967741935484,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7625,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.91156462585034,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8874172185430463,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7499999999999999,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.72,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8679245283018868,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8518518518518519,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.3737158179283142,
"eval_overall_accuracy": 0.9647235426569928,
"eval_overall_f1": 0.8538681948424068,
"eval_overall_precision": 0.83008356545961,
"eval_overall_recall": 0.8790560471976401,
"eval_runtime": 0.9108,
"eval_samples_per_second": 205.324,
"eval_steps_per_second": 3.294,
"step": 8692
},
{
"epoch": 83.0,
"grad_norm": 0.00012157092714915052,
"learning_rate": 8.500000000000002e-06,
"loss": 0.0002,
"step": 8798
},
{
"epoch": 83.0,
"eval_LOCATION_f1": 0.8322147651006712,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8051948051948052,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7975460122699386,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7386363636363636,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.9047619047619047,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8807947019867549,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.7499999999999999,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.72,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8518518518518519,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8214285714285714,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.3761243224143982,
"eval_overall_accuracy": 0.9632224168126094,
"eval_overall_f1": 0.8502824858757062,
"eval_overall_precision": 0.8157181571815718,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.9121,
"eval_samples_per_second": 205.019,
"eval_steps_per_second": 3.289,
"step": 8798
},
{
"epoch": 84.0,
"grad_norm": 0.01326628215610981,
"learning_rate": 8.000000000000001e-06,
"loss": 0.0001,
"step": 8904
},
{
"epoch": 84.0,
"eval_LOCATION_f1": 0.8322147651006712,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8051948051948052,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8025477707006369,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7682926829268293,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.9047619047619047,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8807947019867549,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.7499999999999999,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.72,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8679245283018868,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8518518518518519,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.37578248977661133,
"eval_overall_accuracy": 0.9639729797348011,
"eval_overall_f1": 0.8530670470756063,
"eval_overall_precision": 0.8259668508287292,
"eval_overall_recall": 0.8820058997050148,
"eval_runtime": 0.9306,
"eval_samples_per_second": 200.941,
"eval_steps_per_second": 3.224,
"step": 8904
},
{
"epoch": 85.0,
"grad_norm": 0.006039230152964592,
"learning_rate": 7.5e-06,
"loss": 0.0004,
"step": 9010
},
{
"epoch": 85.0,
"eval_LOCATION_f1": 0.8322147651006712,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8051948051948052,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7975460122699386,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7386363636363636,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.9016949152542374,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.875,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.7346938775510203,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8518518518518519,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8214285714285714,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.3836413621902466,
"eval_overall_accuracy": 0.9629722291718789,
"eval_overall_f1": 0.8478873239436621,
"eval_overall_precision": 0.8113207547169812,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.9049,
"eval_samples_per_second": 206.647,
"eval_steps_per_second": 3.315,
"step": 9010
},
{
"epoch": 86.0,
"grad_norm": 0.00042766937986016273,
"learning_rate": 7.000000000000001e-06,
"loss": 0.0005,
"step": 9116
},
{
"epoch": 86.0,
"eval_LOCATION_f1": 0.8322147651006712,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8051948051948052,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8076923076923077,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7777777777777778,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.9016949152542374,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.875,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.7346938775510203,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8518518518518519,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8214285714285714,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.3791405260562897,
"eval_overall_accuracy": 0.9642231673755316,
"eval_overall_f1": 0.8506401137980086,
"eval_overall_precision": 0.8214285714285714,
"eval_overall_recall": 0.8820058997050148,
"eval_runtime": 0.904,
"eval_samples_per_second": 206.855,
"eval_steps_per_second": 3.319,
"step": 9116
},
{
"epoch": 87.0,
"grad_norm": 0.0006120882462710142,
"learning_rate": 6.5000000000000004e-06,
"loss": 0.0004,
"step": 9222
},
{
"epoch": 87.0,
"eval_LOCATION_f1": 0.8266666666666667,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8025477707006369,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7682926829268293,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.9023569023569024,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8701298701298701,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7346938775510203,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8571428571428571,
"eval_TIME_recall": 0.9230769230769231,
"eval_loss": 0.38632336258888245,
"eval_overall_accuracy": 0.9639729797348011,
"eval_overall_f1": 0.8514851485148515,
"eval_overall_precision": 0.8179347826086957,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.9113,
"eval_samples_per_second": 205.193,
"eval_steps_per_second": 3.292,
"step": 9222
},
{
"epoch": 88.0,
"grad_norm": 0.0006923701730556786,
"learning_rate": 6e-06,
"loss": 0.0004,
"step": 9328
},
{
"epoch": 88.0,
"eval_LOCATION_f1": 0.8211920529801324,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7875000000000001,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7411764705882353,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.907849829351536,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8866666666666667,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.7499999999999999,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.72,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.9056603773584906,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8888888888888888,
"eval_TIME_recall": 0.9230769230769231,
"eval_loss": 0.3742952346801758,
"eval_overall_accuracy": 0.9647235426569928,
"eval_overall_f1": 0.851063829787234,
"eval_overall_precision": 0.819672131147541,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.9099,
"eval_samples_per_second": 205.512,
"eval_steps_per_second": 3.297,
"step": 9328
},
{
"epoch": 89.0,
"grad_norm": 0.0163017176091671,
"learning_rate": 5.500000000000001e-06,
"loss": 0.0006,
"step": 9434
},
{
"epoch": 89.0,
"eval_LOCATION_f1": 0.816326530612245,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7894736842105264,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7792207792207793,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.907849829351536,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8866666666666667,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.7499999999999999,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.72,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.9056603773584906,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8888888888888888,
"eval_TIME_recall": 0.9230769230769231,
"eval_loss": 0.3696248233318329,
"eval_overall_accuracy": 0.966224668501376,
"eval_overall_f1": 0.8513708513708513,
"eval_overall_precision": 0.8333333333333334,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.9099,
"eval_samples_per_second": 205.507,
"eval_steps_per_second": 3.297,
"step": 9434
},
{
"epoch": 90.0,
"grad_norm": 15.17189884185791,
"learning_rate": 5e-06,
"loss": 0.0002,
"step": 9540
},
{
"epoch": 90.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7692307692307693,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7894736842105264,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7792207792207793,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.907849829351536,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8866666666666667,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.7499999999999999,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.72,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.9056603773584906,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8888888888888888,
"eval_TIME_recall": 0.9230769230769231,
"eval_loss": 0.3719424605369568,
"eval_overall_accuracy": 0.966224668501376,
"eval_overall_f1": 0.8477011494252874,
"eval_overall_precision": 0.8263305322128851,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.9059,
"eval_samples_per_second": 206.432,
"eval_steps_per_second": 3.312,
"step": 9540
},
{
"epoch": 91.0,
"grad_norm": 0.00020513041818048805,
"learning_rate": 4.5e-06,
"loss": 0.0002,
"step": 9646
},
{
"epoch": 91.0,
"eval_LOCATION_f1": 0.8187919463087249,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7922077922077922,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.8205128205128205,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7901234567901234,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.9084745762711864,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.881578947368421,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7499999999999999,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.72,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.9056603773584906,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8888888888888888,
"eval_TIME_recall": 0.9230769230769231,
"eval_loss": 0.3863327205181122,
"eval_overall_accuracy": 0.9642231673755316,
"eval_overall_f1": 0.8587731811697574,
"eval_overall_precision": 0.8314917127071824,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.9044,
"eval_samples_per_second": 206.761,
"eval_steps_per_second": 3.317,
"step": 9646
},
{
"epoch": 92.0,
"grad_norm": 0.0004068514099344611,
"learning_rate": 4.000000000000001e-06,
"loss": 0.0004,
"step": 9752
},
{
"epoch": 92.0,
"eval_LOCATION_f1": 0.8187919463087249,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7922077922077922,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.8129032258064516,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7875,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.91156462585034,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8874172185430463,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7499999999999999,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.72,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.9056603773584906,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8888888888888888,
"eval_TIME_recall": 0.9230769230769231,
"eval_loss": 0.38287997245788574,
"eval_overall_accuracy": 0.9644733550162622,
"eval_overall_f1": 0.8583690987124464,
"eval_overall_precision": 0.8333333333333334,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.9043,
"eval_samples_per_second": 206.779,
"eval_steps_per_second": 3.317,
"step": 9752
},
{
"epoch": 93.0,
"grad_norm": 0.00010082097287522629,
"learning_rate": 3.5000000000000004e-06,
"loss": 0.0002,
"step": 9858
},
{
"epoch": 93.0,
"eval_LOCATION_f1": 0.8187919463087249,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7922077922077922,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.8104575163398693,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7948717948717948,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.9084745762711864,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.881578947368421,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7499999999999999,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.72,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.9056603773584906,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8888888888888888,
"eval_TIME_recall": 0.9230769230769231,
"eval_loss": 0.37826383113861084,
"eval_overall_accuracy": 0.9652239179384539,
"eval_overall_f1": 0.8567335243553009,
"eval_overall_precision": 0.8328690807799443,
"eval_overall_recall": 0.8820058997050148,
"eval_runtime": 0.918,
"eval_samples_per_second": 203.7,
"eval_steps_per_second": 3.268,
"step": 9858
},
{
"epoch": 94.0,
"grad_norm": 0.000542107445653528,
"learning_rate": 3e-06,
"loss": 0.0001,
"step": 9964
},
{
"epoch": 94.0,
"eval_LOCATION_f1": 0.8266666666666667,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8076923076923077,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7777777777777778,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.9084745762711864,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.881578947368421,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7499999999999999,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.72,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.9056603773584906,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8888888888888888,
"eval_TIME_recall": 0.9230769230769231,
"eval_loss": 0.38576415181159973,
"eval_overall_accuracy": 0.9642231673755316,
"eval_overall_f1": 0.8575498575498576,
"eval_overall_precision": 0.8292011019283747,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.9111,
"eval_samples_per_second": 205.24,
"eval_steps_per_second": 3.293,
"step": 9964
},
{
"epoch": 95.0,
"grad_norm": 0.044874146580696106,
"learning_rate": 2.5e-06,
"loss": 0.0001,
"step": 10070
},
{
"epoch": 95.0,
"eval_LOCATION_f1": 0.8266666666666667,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8076923076923077,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7777777777777778,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.9084745762711864,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.881578947368421,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7499999999999999,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.72,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8571428571428571,
"eval_TIME_recall": 0.9230769230769231,
"eval_loss": 0.38630810379981995,
"eval_overall_accuracy": 0.9639729797348011,
"eval_overall_f1": 0.856330014224751,
"eval_overall_precision": 0.8269230769230769,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.8986,
"eval_samples_per_second": 208.113,
"eval_steps_per_second": 3.339,
"step": 10070
},
{
"epoch": 96.0,
"grad_norm": 0.0001308424398303032,
"learning_rate": 2.0000000000000003e-06,
"loss": 0.0001,
"step": 10176
},
{
"epoch": 96.0,
"eval_LOCATION_f1": 0.8266666666666667,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8076923076923077,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7777777777777778,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.9084745762711864,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.881578947368421,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.76,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.7037037037037037,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8518518518518519,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8214285714285714,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.3916187286376953,
"eval_overall_accuracy": 0.9637227920940705,
"eval_overall_f1": 0.8539007092198581,
"eval_overall_precision": 0.8224043715846995,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.9154,
"eval_samples_per_second": 204.278,
"eval_steps_per_second": 3.277,
"step": 10176
},
{
"epoch": 97.0,
"grad_norm": 0.00018677054322324693,
"learning_rate": 1.5e-06,
"loss": 0.0001,
"step": 10282
},
{
"epoch": 97.0,
"eval_LOCATION_f1": 0.8266666666666667,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8101265822784811,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7710843373493976,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.9084745762711864,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.881578947368421,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.76,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.7037037037037037,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8518518518518519,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8214285714285714,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.3897801339626312,
"eval_overall_accuracy": 0.9642231673755316,
"eval_overall_f1": 0.8543140028288544,
"eval_overall_precision": 0.8206521739130435,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.9174,
"eval_samples_per_second": 203.839,
"eval_steps_per_second": 3.27,
"step": 10282
},
{
"epoch": 98.0,
"grad_norm": 0.004196417052298784,
"learning_rate": 1.0000000000000002e-06,
"loss": 0.0001,
"step": 10388
},
{
"epoch": 98.0,
"eval_LOCATION_f1": 0.8266666666666667,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8101265822784811,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7710843373493976,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.9084745762711864,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.881578947368421,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.76,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.7037037037037037,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8518518518518519,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8214285714285714,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.38807475566864014,
"eval_overall_accuracy": 0.9644733550162622,
"eval_overall_f1": 0.8543140028288544,
"eval_overall_precision": 0.8206521739130435,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.9056,
"eval_samples_per_second": 206.492,
"eval_steps_per_second": 3.313,
"step": 10388
},
{
"epoch": 99.0,
"grad_norm": 0.0001258315023733303,
"learning_rate": 5.000000000000001e-07,
"loss": 0.0001,
"step": 10494
},
{
"epoch": 99.0,
"eval_LOCATION_f1": 0.8266666666666667,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8101265822784811,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7710843373493976,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.9084745762711864,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.881578947368421,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.72,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8518518518518519,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8214285714285714,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.3856855630874634,
"eval_overall_accuracy": 0.9642231673755316,
"eval_overall_f1": 0.8514851485148515,
"eval_overall_precision": 0.8179347826086957,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.9072,
"eval_samples_per_second": 206.127,
"eval_steps_per_second": 3.307,
"step": 10494
},
{
"epoch": 100.0,
"grad_norm": 0.00010668273171177134,
"learning_rate": 0.0,
"loss": 0.0001,
"step": 10600
},
{
"epoch": 100.0,
"eval_LOCATION_f1": 0.8266666666666667,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8101265822784811,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7710843373493976,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.9084745762711864,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.881578947368421,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.72,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8518518518518519,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8214285714285714,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.3857269287109375,
"eval_overall_accuracy": 0.9642231673755316,
"eval_overall_f1": 0.8514851485148515,
"eval_overall_precision": 0.8179347826086957,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.9906,
"eval_samples_per_second": 188.783,
"eval_steps_per_second": 3.029,
"step": 10600
},
{
"epoch": 100.0,
"step": 10600,
"total_flos": 4502314993613766.0,
"train_loss": 0.008494841067761815,
"train_runtime": 2623.6324,
"train_samples_per_second": 64.3,
"train_steps_per_second": 4.04
}
],
"logging_steps": 500,
"max_steps": 10600,
"num_input_tokens_seen": 0,
"num_train_epochs": 100,
"save_steps": 500,
"total_flos": 4502314993613766.0,
"train_batch_size": 16,
"trial_name": null,
"trial_params": null
}