nerugm-base-3 / trainer_state.json
apwic's picture
End of training
8734e62 verified
raw
history blame
145 kB
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 100.0,
"eval_steps": 500,
"global_step": 10600,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"grad_norm": 3.6827080249786377,
"learning_rate": 4.9500000000000004e-05,
"loss": 0.3501,
"step": 106
},
{
"epoch": 1.0,
"eval_LOCATION_f1": 0.7483870967741935,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6904761904761905,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.6709677419354838,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5777777777777777,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8679245283018867,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8214285714285714,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7123287671232875,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.65,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.896551724137931,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.13337989151477814,
"eval_overall_accuracy": 0.953443258971872,
"eval_overall_f1": 0.7905138339920948,
"eval_overall_precision": 0.7281553398058253,
"eval_overall_recall": 0.8645533141210374,
"eval_runtime": 0.9448,
"eval_samples_per_second": 197.919,
"eval_steps_per_second": 3.175,
"step": 106
},
{
"epoch": 2.0,
"grad_norm": 2.115112781524658,
"learning_rate": 4.9e-05,
"loss": 0.1148,
"step": 212
},
{
"epoch": 2.0,
"eval_LOCATION_f1": 0.7612903225806451,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7023809523809523,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.697986577181208,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6190476190476191,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8996763754045306,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8742138364779874,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.6329113924050633,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5434782608695652,
"eval_QUANTITY_recall": 0.7575757575757576,
"eval_TIME_f1": 0.7692307692307693,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.6756756756756757,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1362091302871704,
"eval_overall_accuracy": 0.9558680892337537,
"eval_overall_f1": 0.7926023778071334,
"eval_overall_precision": 0.7317073170731707,
"eval_overall_recall": 0.8645533141210374,
"eval_runtime": 0.9986,
"eval_samples_per_second": 187.27,
"eval_steps_per_second": 3.004,
"step": 212
},
{
"epoch": 3.0,
"grad_norm": 2.7631375789642334,
"learning_rate": 4.85e-05,
"loss": 0.0732,
"step": 318
},
{
"epoch": 3.0,
"eval_LOCATION_f1": 0.7662337662337662,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7108433734939759,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7702702702702702,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6867469879518072,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8766233766233766,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8544303797468354,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.8285714285714285,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7837837837837838,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.806451612903226,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7352941176470589,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.14412528276443481,
"eval_overall_accuracy": 0.9573229873908826,
"eval_overall_f1": 0.8221024258760108,
"eval_overall_precision": 0.7721518987341772,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.9223,
"eval_samples_per_second": 202.756,
"eval_steps_per_second": 3.253,
"step": 318
},
{
"epoch": 4.0,
"grad_norm": 1.3901716470718384,
"learning_rate": 4.8e-05,
"loss": 0.0453,
"step": 424
},
{
"epoch": 4.0,
"eval_LOCATION_f1": 0.8079470198675496,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7123287671232877,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6419753086419753,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8996763754045306,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8742138364779874,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8214285714285714,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8214285714285714,
"eval_TIME_recall": 0.8214285714285714,
"eval_loss": 0.1702796369791031,
"eval_overall_accuracy": 0.9570805043646945,
"eval_overall_f1": 0.8260869565217391,
"eval_overall_precision": 0.781491002570694,
"eval_overall_recall": 0.8760806916426513,
"eval_runtime": 0.94,
"eval_samples_per_second": 198.941,
"eval_steps_per_second": 3.192,
"step": 424
},
{
"epoch": 5.0,
"grad_norm": 0.532292902469635,
"learning_rate": 4.75e-05,
"loss": 0.0312,
"step": 530
},
{
"epoch": 5.0,
"eval_LOCATION_f1": 0.8051948051948051,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7832167832167831,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.717948717948718,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8810289389067525,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.17514730989933014,
"eval_overall_accuracy": 0.9612027158098934,
"eval_overall_f1": 0.8324324324324324,
"eval_overall_precision": 0.7837150127226463,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.9647,
"eval_samples_per_second": 193.847,
"eval_steps_per_second": 3.11,
"step": 530
},
{
"epoch": 6.0,
"grad_norm": 5.477240085601807,
"learning_rate": 4.7e-05,
"loss": 0.0236,
"step": 636
},
{
"epoch": 6.0,
"eval_LOCATION_f1": 0.7712418300653594,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7195121951219512,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7482993197278912,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6707317073170732,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.90032154340836,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8695652173913043,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.75,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.6666666666666666,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.20889906585216522,
"eval_overall_accuracy": 0.9570805043646945,
"eval_overall_f1": 0.8197596795727637,
"eval_overall_precision": 0.763681592039801,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.9433,
"eval_samples_per_second": 198.231,
"eval_steps_per_second": 3.18,
"step": 636
},
{
"epoch": 7.0,
"grad_norm": 2.7495665550231934,
"learning_rate": 4.6500000000000005e-05,
"loss": 0.017,
"step": 742
},
{
"epoch": 7.0,
"eval_LOCATION_f1": 0.8275862068965518,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.8108108108108109,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.763888888888889,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6962025316455697,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8925081433224756,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8726114649681529,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.8108108108108109,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7317073170731707,
"eval_QUANTITY_recall": 0.9090909090909091,
"eval_TIME_f1": 0.8275862068965518,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.21119879186153412,
"eval_overall_accuracy": 0.957807953443259,
"eval_overall_f1": 0.8406593406593407,
"eval_overall_precision": 0.8031496062992126,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.9486,
"eval_samples_per_second": 197.142,
"eval_steps_per_second": 3.163,
"step": 742
},
{
"epoch": 8.0,
"grad_norm": 0.43028321862220764,
"learning_rate": 4.600000000000001e-05,
"loss": 0.0133,
"step": 848
},
{
"epoch": 8.0,
"eval_LOCATION_f1": 0.8211920529801324,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.775,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7862068965517242,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7125,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8996763754045306,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8742138364779874,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.8108108108108109,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7317073170731707,
"eval_QUANTITY_recall": 0.9090909090909091,
"eval_TIME_f1": 0.8275862068965518,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.21715472638607025,
"eval_overall_accuracy": 0.9602327837051406,
"eval_overall_f1": 0.8466757123473542,
"eval_overall_precision": 0.8,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.9553,
"eval_samples_per_second": 195.744,
"eval_steps_per_second": 3.14,
"step": 848
},
{
"epoch": 9.0,
"grad_norm": 0.03873327746987343,
"learning_rate": 4.55e-05,
"loss": 0.0096,
"step": 954
},
{
"epoch": 9.0,
"eval_LOCATION_f1": 0.8079470198675496,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7482993197278912,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6707317073170732,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.9019607843137256,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8846153846153846,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7887323943661972,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7368421052631579,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.23949624598026276,
"eval_overall_accuracy": 0.9585354025218235,
"eval_overall_f1": 0.8365122615803814,
"eval_overall_precision": 0.7932816537467701,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 1.0163,
"eval_samples_per_second": 183.996,
"eval_steps_per_second": 2.952,
"step": 954
},
{
"epoch": 10.0,
"grad_norm": 1.984230875968933,
"learning_rate": 4.5e-05,
"loss": 0.0077,
"step": 1060
},
{
"epoch": 10.0,
"eval_LOCATION_f1": 0.7922077922077921,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7297297297297298,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6506024096385542,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8996763754045306,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8742138364779874,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.8055555555555556,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7435897435897436,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.806451612903226,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7352941176470589,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.26252666115760803,
"eval_overall_accuracy": 0.9568380213385063,
"eval_overall_f1": 0.8268456375838926,
"eval_overall_precision": 0.7738693467336684,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.952,
"eval_samples_per_second": 196.421,
"eval_steps_per_second": 3.151,
"step": 1060
},
{
"epoch": 11.0,
"grad_norm": 0.09802401065826416,
"learning_rate": 4.4500000000000004e-05,
"loss": 0.0059,
"step": 1166
},
{
"epoch": 11.0,
"eval_LOCATION_f1": 0.8400000000000001,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7974683544303798,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7659574468085107,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7105263157894737,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8823529411764707,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8653846153846154,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.8169014084507042,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7631578947368421,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.235382542014122,
"eval_overall_accuracy": 0.9648399612027158,
"eval_overall_f1": 0.8418156808803301,
"eval_overall_precision": 0.8052631578947368,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.9545,
"eval_samples_per_second": 195.917,
"eval_steps_per_second": 3.143,
"step": 1166
},
{
"epoch": 12.0,
"grad_norm": 0.4382927417755127,
"learning_rate": 4.4000000000000006e-05,
"loss": 0.0078,
"step": 1272
},
{
"epoch": 12.0,
"eval_LOCATION_f1": 0.8251748251748252,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.8194444444444444,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.8201438848920863,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7702702702702703,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.896103896103896,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8734177215189873,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.8115942028985507,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7777777777777778,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8771929824561403,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8620689655172413,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.21610549092292786,
"eval_overall_accuracy": 0.9675072744907857,
"eval_overall_f1": 0.8575418994413407,
"eval_overall_precision": 0.8319783197831978,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.9504,
"eval_samples_per_second": 196.751,
"eval_steps_per_second": 3.156,
"step": 1272
},
{
"epoch": 13.0,
"grad_norm": 2.4125523567199707,
"learning_rate": 4.35e-05,
"loss": 0.0044,
"step": 1378
},
{
"epoch": 13.0,
"eval_LOCATION_f1": 0.8181818181818181,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7590361445783133,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7552447552447553,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6923076923076923,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.9042904290429042,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8954248366013072,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.821917808219178,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.75,
"eval_QUANTITY_recall": 0.9090909090909091,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.26299452781677246,
"eval_overall_accuracy": 0.962172647914646,
"eval_overall_f1": 0.8469945355191256,
"eval_overall_precision": 0.8051948051948052,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.9454,
"eval_samples_per_second": 197.792,
"eval_steps_per_second": 3.173,
"step": 1378
},
{
"epoch": 14.0,
"grad_norm": 0.6766614317893982,
"learning_rate": 4.3e-05,
"loss": 0.0047,
"step": 1484
},
{
"epoch": 14.0,
"eval_LOCATION_f1": 0.8493150684931506,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.8266666666666667,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7862068965517242,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7125,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8802588996763754,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8553459119496856,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.8055555555555556,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7435897435897436,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.9090909090909091,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.9259259259259259,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.25089046359062195,
"eval_overall_accuracy": 0.9638700290979632,
"eval_overall_f1": 0.8500687757909215,
"eval_overall_precision": 0.8131578947368421,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.9494,
"eval_samples_per_second": 196.976,
"eval_steps_per_second": 3.16,
"step": 1484
},
{
"epoch": 15.0,
"grad_norm": 2.052441358566284,
"learning_rate": 4.25e-05,
"loss": 0.0041,
"step": 1590
},
{
"epoch": 15.0,
"eval_LOCATION_f1": 0.8104575163398693,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7755102040816327,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6951219512195121,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8831168831168831,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8607594936708861,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.821917808219178,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.75,
"eval_QUANTITY_recall": 0.9090909090909091,
"eval_TIME_f1": 0.7619047619047619,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.6857142857142857,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.2882152795791626,
"eval_overall_accuracy": 0.9580504364694471,
"eval_overall_f1": 0.8306451612903226,
"eval_overall_precision": 0.7783375314861462,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.9611,
"eval_samples_per_second": 194.573,
"eval_steps_per_second": 3.121,
"step": 1590
},
{
"epoch": 16.0,
"grad_norm": 0.014275839552283287,
"learning_rate": 4.2e-05,
"loss": 0.0044,
"step": 1696
},
{
"epoch": 16.0,
"eval_LOCATION_f1": 0.8053691275167785,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7692307692307693,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7945205479452054,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7160493827160493,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8910891089108911,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8823529411764706,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.8169014084507042,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7631578947368421,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.7741935483870968,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7058823529411765,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.26748523116111755,
"eval_overall_accuracy": 0.9604752667313288,
"eval_overall_f1": 0.8372093023255814,
"eval_overall_precision": 0.796875,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.9645,
"eval_samples_per_second": 193.888,
"eval_steps_per_second": 3.111,
"step": 1696
},
{
"epoch": 17.0,
"grad_norm": 0.5238301157951355,
"learning_rate": 4.15e-05,
"loss": 0.0032,
"step": 1802
},
{
"epoch": 17.0,
"eval_LOCATION_f1": 0.8299319727891157,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.8026315789473685,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7746478873239436,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7142857142857143,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8896103896103896,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8670886075949367,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.8000000000000002,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7567567567567568,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.7619047619047619,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.6857142857142857,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.28771573305130005,
"eval_overall_accuracy": 0.9612027158098934,
"eval_overall_f1": 0.8356164383561643,
"eval_overall_precision": 0.7963446475195822,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.9538,
"eval_samples_per_second": 196.063,
"eval_steps_per_second": 3.145,
"step": 1802
},
{
"epoch": 18.0,
"grad_norm": 0.005304540041834116,
"learning_rate": 4.1e-05,
"loss": 0.0034,
"step": 1908
},
{
"epoch": 18.0,
"eval_LOCATION_f1": 0.8133333333333335,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7552447552447553,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6923076923076923,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.894736842105263,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8831168831168831,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.821917808219178,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.75,
"eval_QUANTITY_recall": 0.9090909090909091,
"eval_TIME_f1": 0.8928571428571429,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8928571428571429,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.28492802381515503,
"eval_overall_accuracy": 0.9614451988360815,
"eval_overall_f1": 0.8429752066115703,
"eval_overall_precision": 0.8073878627968337,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.9617,
"eval_samples_per_second": 194.443,
"eval_steps_per_second": 3.119,
"step": 1908
},
{
"epoch": 19.0,
"grad_norm": 0.05048967897891998,
"learning_rate": 4.05e-05,
"loss": 0.0051,
"step": 2014
},
{
"epoch": 19.0,
"eval_LOCATION_f1": 0.8026315789473684,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7832167832167831,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.717948717948718,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8990228013029316,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8789808917197452,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.8571428571428571,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.8108108108108109,
"eval_QUANTITY_recall": 0.9090909090909091,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.2656005918979645,
"eval_overall_accuracy": 0.9643549951503395,
"eval_overall_f1": 0.8493150684931507,
"eval_overall_precision": 0.8093994778067886,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.9518,
"eval_samples_per_second": 196.476,
"eval_steps_per_second": 3.152,
"step": 2014
},
{
"epoch": 20.0,
"grad_norm": 0.005232055671513081,
"learning_rate": 4e-05,
"loss": 0.0029,
"step": 2120
},
{
"epoch": 20.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7294117647058823,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7482014388489208,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7027027027027027,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.9032258064516129,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.875,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.823529411764706,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.8,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.819672131147541,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7575757575757576,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.2749578654766083,
"eval_overall_accuracy": 0.9638700290979632,
"eval_overall_f1": 0.8365122615803814,
"eval_overall_precision": 0.7932816537467701,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.9399,
"eval_samples_per_second": 198.964,
"eval_steps_per_second": 3.192,
"step": 2120
},
{
"epoch": 21.0,
"grad_norm": 20.893596649169922,
"learning_rate": 3.9500000000000005e-05,
"loss": 0.0051,
"step": 2226
},
{
"epoch": 21.0,
"eval_LOCATION_f1": 0.8026315789473684,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7464788732394366,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6883116883116883,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.9084967320261438,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8910256410256411,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.8115942028985507,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7777777777777778,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8771929824561403,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8620689655172413,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.2634299099445343,
"eval_overall_accuracy": 0.9643549951503395,
"eval_overall_f1": 0.8429752066115703,
"eval_overall_precision": 0.8073878627968337,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.9692,
"eval_samples_per_second": 192.946,
"eval_steps_per_second": 3.095,
"step": 2226
},
{
"epoch": 22.0,
"grad_norm": 0.013275664299726486,
"learning_rate": 3.9000000000000006e-05,
"loss": 0.003,
"step": 2332
},
{
"epoch": 22.0,
"eval_LOCATION_f1": 0.8243243243243243,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7922077922077922,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7417218543046358,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6511627906976745,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.9061488673139159,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8805031446540881,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.8333333333333333,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7692307692307693,
"eval_QUANTITY_recall": 0.9090909090909091,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.2914196252822876,
"eval_overall_accuracy": 0.9614451988360815,
"eval_overall_f1": 0.8455284552845529,
"eval_overall_precision": 0.7979539641943734,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.9669,
"eval_samples_per_second": 193.405,
"eval_steps_per_second": 3.103,
"step": 2332
},
{
"epoch": 23.0,
"grad_norm": 0.05714813619852066,
"learning_rate": 3.85e-05,
"loss": 0.0035,
"step": 2438
},
{
"epoch": 23.0,
"eval_LOCATION_f1": 0.8435374149659864,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.8157894736842105,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.76056338028169,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7012987012987013,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.9084967320261438,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8910256410256411,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.8115942028985507,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7777777777777778,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8771929824561403,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8620689655172413,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.2690264582633972,
"eval_overall_accuracy": 0.9645974781765276,
"eval_overall_f1": 0.8543689320388349,
"eval_overall_precision": 0.8235294117647058,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.943,
"eval_samples_per_second": 198.31,
"eval_steps_per_second": 3.181,
"step": 2438
},
{
"epoch": 24.0,
"grad_norm": 8.982757568359375,
"learning_rate": 3.8e-05,
"loss": 0.0024,
"step": 2544
},
{
"epoch": 24.0,
"eval_LOCATION_f1": 0.7924528301886792,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7159090909090909,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7549668874172185,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6627906976744186,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.9108910891089109,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9019607843137255,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.8333333333333333,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7692307692307693,
"eval_QUANTITY_recall": 0.9090909090909091,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.301530122756958,
"eval_overall_accuracy": 0.9602327837051406,
"eval_overall_f1": 0.8425302826379543,
"eval_overall_precision": 0.7904040404040404,
"eval_overall_recall": 0.9020172910662824,
"eval_runtime": 0.9593,
"eval_samples_per_second": 194.925,
"eval_steps_per_second": 3.127,
"step": 2544
},
{
"epoch": 25.0,
"grad_norm": 0.10265465825796127,
"learning_rate": 3.7500000000000003e-05,
"loss": 0.0032,
"step": 2650
},
{
"epoch": 25.0,
"eval_LOCATION_f1": 0.8157894736842104,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7971014492753623,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7534246575342466,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.9,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.8055555555555556,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7435897435897436,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8771929824561403,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8620689655172413,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.2815525233745575,
"eval_overall_accuracy": 0.9636275460717749,
"eval_overall_f1": 0.851182197496523,
"eval_overall_precision": 0.8225806451612904,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.9507,
"eval_samples_per_second": 196.688,
"eval_steps_per_second": 3.155,
"step": 2650
},
{
"epoch": 26.0,
"grad_norm": 0.0032238499261438847,
"learning_rate": 3.7e-05,
"loss": 0.003,
"step": 2756
},
{
"epoch": 26.0,
"eval_LOCATION_f1": 0.8344370860927152,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7875,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7659574468085107,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7105263157894737,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.9042904290429042,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8954248366013072,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.8333333333333333,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7692307692307693,
"eval_QUANTITY_recall": 0.9090909090909091,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8275862068965517,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.28177666664123535,
"eval_overall_accuracy": 0.9636275460717749,
"eval_overall_f1": 0.8508287292817679,
"eval_overall_precision": 0.8169761273209549,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.9649,
"eval_samples_per_second": 193.801,
"eval_steps_per_second": 3.109,
"step": 2756
},
{
"epoch": 27.0,
"grad_norm": 0.03518635779619217,
"learning_rate": 3.65e-05,
"loss": 0.0016,
"step": 2862
},
{
"epoch": 27.0,
"eval_LOCATION_f1": 0.8133333333333335,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7777777777777778,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7088607594936709,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.9144736842105262,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9025974025974026,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.8055555555555556,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7435897435897436,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8771929824561403,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8620689655172413,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.2842986285686493,
"eval_overall_accuracy": 0.9648399612027158,
"eval_overall_f1": 0.8528198074277854,
"eval_overall_precision": 0.8157894736842105,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 1.03,
"eval_samples_per_second": 181.562,
"eval_steps_per_second": 2.913,
"step": 2862
},
{
"epoch": 28.0,
"grad_norm": 0.01968814805150032,
"learning_rate": 3.6e-05,
"loss": 0.0025,
"step": 2968
},
{
"epoch": 28.0,
"eval_LOCATION_f1": 0.8366013071895425,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7804878048780488,
"eval_LOCATION_recall": 0.9014084507042254,
"eval_ORGANIZATION_f1": 0.8028169014084509,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7402597402597403,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.9042904290429042,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8954248366013072,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7714285714285715,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7297297297297297,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8275862068965518,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.3238835334777832,
"eval_overall_accuracy": 0.960717749757517,
"eval_overall_f1": 0.8512396694214875,
"eval_overall_precision": 0.8153034300791556,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.9375,
"eval_samples_per_second": 199.463,
"eval_steps_per_second": 3.2,
"step": 2968
},
{
"epoch": 29.0,
"grad_norm": 0.005619656760245562,
"learning_rate": 3.55e-05,
"loss": 0.0026,
"step": 3074
},
{
"epoch": 29.0,
"eval_LOCATION_f1": 0.8421052631578947,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7901234567901234,
"eval_LOCATION_recall": 0.9014084507042254,
"eval_ORGANIZATION_f1": 0.8111888111888114,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7435897435897436,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.9042904290429042,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8954248366013072,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.3090417683124542,
"eval_overall_accuracy": 0.965082444228904,
"eval_overall_f1": 0.8575342465753425,
"eval_overall_precision": 0.8172323759791122,
"eval_overall_recall": 0.9020172910662824,
"eval_runtime": 0.9535,
"eval_samples_per_second": 196.122,
"eval_steps_per_second": 3.146,
"step": 3074
},
{
"epoch": 30.0,
"grad_norm": 0.0475270040333271,
"learning_rate": 3.5e-05,
"loss": 0.0041,
"step": 3180
},
{
"epoch": 30.0,
"eval_LOCATION_f1": 0.8211920529801324,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.775,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7703703703703704,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7428571428571429,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.9114754098360656,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.896774193548387,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.30209869146347046,
"eval_overall_accuracy": 0.9626576139670223,
"eval_overall_f1": 0.8464730290456433,
"eval_overall_precision": 0.8138297872340425,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.9526,
"eval_samples_per_second": 196.299,
"eval_steps_per_second": 3.149,
"step": 3180
},
{
"epoch": 31.0,
"grad_norm": 0.6186401844024658,
"learning_rate": 3.45e-05,
"loss": 0.0054,
"step": 3286
},
{
"epoch": 31.0,
"eval_LOCATION_f1": 0.8181818181818181,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7590361445783133,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.759124087591241,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7222222222222222,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.9025974025974027,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.879746835443038,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.8055555555555556,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7435897435897436,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.75,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.6666666666666666,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.3126040995121002,
"eval_overall_accuracy": 0.9595053346265762,
"eval_overall_f1": 0.8353741496598639,
"eval_overall_precision": 0.7912371134020618,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.9488,
"eval_samples_per_second": 197.092,
"eval_steps_per_second": 3.162,
"step": 3286
},
{
"epoch": 32.0,
"grad_norm": 0.001890498329885304,
"learning_rate": 3.4000000000000007e-05,
"loss": 0.002,
"step": 3392
},
{
"epoch": 32.0,
"eval_LOCATION_f1": 0.8243243243243243,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7922077922077922,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7737226277372263,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7361111111111112,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.9078947368421053,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8961038961038961,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.31118687987327576,
"eval_overall_accuracy": 0.9629000969932104,
"eval_overall_f1": 0.8448753462603877,
"eval_overall_precision": 0.8133333333333334,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.9533,
"eval_samples_per_second": 196.155,
"eval_steps_per_second": 3.147,
"step": 3392
},
{
"epoch": 33.0,
"grad_norm": 0.4719323217868805,
"learning_rate": 3.35e-05,
"loss": 0.0023,
"step": 3498
},
{
"epoch": 33.0,
"eval_LOCATION_f1": 0.8476821192052981,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.9014084507042254,
"eval_ORGANIZATION_f1": 0.7703703703703704,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7428571428571429,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.9078947368421053,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8961038961038961,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.3178064227104187,
"eval_overall_accuracy": 0.9638700290979632,
"eval_overall_f1": 0.853185595567867,
"eval_overall_precision": 0.8213333333333334,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.9706,
"eval_samples_per_second": 192.671,
"eval_steps_per_second": 3.091,
"step": 3498
},
{
"epoch": 34.0,
"grad_norm": 0.008191280998289585,
"learning_rate": 3.3e-05,
"loss": 0.0045,
"step": 3604
},
{
"epoch": 34.0,
"eval_LOCATION_f1": 0.8456375838926176,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.8076923076923077,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7777777777777778,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7088607594936709,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8859934853420196,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8662420382165605,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.8450704225352113,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7894736842105263,
"eval_QUANTITY_recall": 0.9090909090909091,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.2925824224948883,
"eval_overall_accuracy": 0.9638700290979632,
"eval_overall_f1": 0.8454172366621068,
"eval_overall_precision": 0.8046875,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.9524,
"eval_samples_per_second": 196.348,
"eval_steps_per_second": 3.15,
"step": 3604
},
{
"epoch": 35.0,
"grad_norm": 0.005140832159668207,
"learning_rate": 3.2500000000000004e-05,
"loss": 0.0026,
"step": 3710
},
{
"epoch": 35.0,
"eval_LOCATION_f1": 0.8387096774193548,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7738095238095238,
"eval_LOCATION_recall": 0.9154929577464789,
"eval_ORGANIZATION_f1": 0.7375,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6210526315789474,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.9114754098360656,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.896774193548387,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.78125,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.6944444444444444,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.3151751160621643,
"eval_overall_accuracy": 0.9580504364694471,
"eval_overall_f1": 0.8375165125495376,
"eval_overall_precision": 0.7731707317073171,
"eval_overall_recall": 0.9135446685878963,
"eval_runtime": 0.9517,
"eval_samples_per_second": 196.484,
"eval_steps_per_second": 3.152,
"step": 3710
},
{
"epoch": 36.0,
"grad_norm": 0.002234996994957328,
"learning_rate": 3.2000000000000005e-05,
"loss": 0.0017,
"step": 3816
},
{
"epoch": 36.0,
"eval_LOCATION_f1": 0.8356164383561644,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.8133333333333334,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.8059701492537313,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.782608695652174,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.9114754098360656,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.896774193548387,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.8285714285714285,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7837837837837838,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8571428571428571,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.27503567934036255,
"eval_overall_accuracy": 0.9670223084384093,
"eval_overall_f1": 0.8635724331926864,
"eval_overall_precision": 0.8434065934065934,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 1.0319,
"eval_samples_per_second": 181.221,
"eval_steps_per_second": 2.907,
"step": 3816
},
{
"epoch": 37.0,
"grad_norm": 2.4394583702087402,
"learning_rate": 3.15e-05,
"loss": 0.0016,
"step": 3922
},
{
"epoch": 37.0,
"eval_LOCATION_f1": 0.8456375838926176,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.8076923076923077,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7755102040816327,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6951219512195121,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8867313915857605,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8616352201257862,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.8055555555555556,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7435897435897436,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.3136846423149109,
"eval_overall_accuracy": 0.9595053346265762,
"eval_overall_f1": 0.8439620081411126,
"eval_overall_precision": 0.7974358974358975,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.9561,
"eval_samples_per_second": 195.586,
"eval_steps_per_second": 3.138,
"step": 3922
},
{
"epoch": 38.0,
"grad_norm": 0.02068762294948101,
"learning_rate": 3.1e-05,
"loss": 0.002,
"step": 4028
},
{
"epoch": 38.0,
"eval_LOCATION_f1": 0.8163265306122449,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7894736842105263,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7619047619047619,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6829268292682927,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.9114754098360656,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.896774193548387,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.31167086958885193,
"eval_overall_accuracy": 0.9609602327837051,
"eval_overall_f1": 0.8431105047748976,
"eval_overall_precision": 0.8005181347150259,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.9533,
"eval_samples_per_second": 196.17,
"eval_steps_per_second": 3.147,
"step": 4028
},
{
"epoch": 39.0,
"grad_norm": 0.004659323953092098,
"learning_rate": 3.05e-05,
"loss": 0.0031,
"step": 4134
},
{
"epoch": 39.0,
"eval_LOCATION_f1": 0.8421052631578947,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7901234567901234,
"eval_LOCATION_recall": 0.9014084507042254,
"eval_ORGANIZATION_f1": 0.7682119205298013,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6744186046511628,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.9114754098360656,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.896774193548387,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.823529411764706,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.8,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.819672131147541,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7575757575757576,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.3022630512714386,
"eval_overall_accuracy": 0.9609602327837051,
"eval_overall_f1": 0.8521031207598372,
"eval_overall_precision": 0.8051282051282052,
"eval_overall_recall": 0.9048991354466859,
"eval_runtime": 0.9507,
"eval_samples_per_second": 196.705,
"eval_steps_per_second": 3.156,
"step": 4134
},
{
"epoch": 40.0,
"grad_norm": 0.5910449624061584,
"learning_rate": 3e-05,
"loss": 0.0018,
"step": 4240
},
{
"epoch": 40.0,
"eval_LOCATION_f1": 0.8079470198675496,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7763157894736842,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6781609195402298,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.9055374592833875,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8853503184713376,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.8000000000000002,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7567567567567568,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.31180375814437866,
"eval_overall_accuracy": 0.9619301648884578,
"eval_overall_f1": 0.8416779431664412,
"eval_overall_precision": 0.7933673469387755,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.9409,
"eval_samples_per_second": 198.747,
"eval_steps_per_second": 3.188,
"step": 4240
},
{
"epoch": 41.0,
"grad_norm": 0.0014322897186502814,
"learning_rate": 2.95e-05,
"loss": 0.0022,
"step": 4346
},
{
"epoch": 41.0,
"eval_LOCATION_f1": 0.8187919463087248,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.782051282051282,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7832167832167831,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.717948717948718,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.9036544850498339,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9006622516556292,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.8285714285714285,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7837837837837838,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.2662249207496643,
"eval_overall_accuracy": 0.9636275460717749,
"eval_overall_f1": 0.8515950069348127,
"eval_overall_precision": 0.820855614973262,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.9578,
"eval_samples_per_second": 195.232,
"eval_steps_per_second": 3.132,
"step": 4346
},
{
"epoch": 42.0,
"grad_norm": 0.0011240842286497355,
"learning_rate": 2.9e-05,
"loss": 0.0006,
"step": 4452
},
{
"epoch": 42.0,
"eval_LOCATION_f1": 0.7866666666666666,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7468354430379747,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7712418300653594,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6704545454545454,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.9019607843137256,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8846153846153846,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.8055555555555556,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7435897435897436,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8275862068965517,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.3214167058467865,
"eval_overall_accuracy": 0.9597478176527643,
"eval_overall_f1": 0.8373983739837398,
"eval_overall_precision": 0.7902813299232737,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.9589,
"eval_samples_per_second": 195.011,
"eval_steps_per_second": 3.129,
"step": 4452
},
{
"epoch": 43.0,
"grad_norm": 0.0019562048837542534,
"learning_rate": 2.8499999999999998e-05,
"loss": 0.0011,
"step": 4558
},
{
"epoch": 43.0,
"eval_LOCATION_f1": 0.7712418300653594,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7195121951219512,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7785234899328859,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6904761904761905,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.9144736842105262,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9025974025974026,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.8169014084507042,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7631578947368421,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8275862068965518,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.3223561942577362,
"eval_overall_accuracy": 0.9616876818622696,
"eval_overall_f1": 0.8408163265306122,
"eval_overall_precision": 0.7963917525773195,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.9419,
"eval_samples_per_second": 198.529,
"eval_steps_per_second": 3.185,
"step": 4558
},
{
"epoch": 44.0,
"grad_norm": 0.004401817452162504,
"learning_rate": 2.8000000000000003e-05,
"loss": 0.0015,
"step": 4664
},
{
"epoch": 44.0,
"eval_LOCATION_f1": 0.8344370860927152,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7875,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7402597402597403,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6404494382022472,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.9013157894736842,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8896103896103896,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.8571428571428571,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.8108108108108109,
"eval_QUANTITY_recall": 0.9090909090909091,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.30491575598716736,
"eval_overall_accuracy": 0.9619301648884578,
"eval_overall_f1": 0.8428184281842819,
"eval_overall_precision": 0.7953964194373402,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.9628,
"eval_samples_per_second": 194.222,
"eval_steps_per_second": 3.116,
"step": 4664
},
{
"epoch": 45.0,
"grad_norm": 0.032622966915369034,
"learning_rate": 2.7500000000000004e-05,
"loss": 0.0023,
"step": 4770
},
{
"epoch": 45.0,
"eval_LOCATION_f1": 0.8187919463087248,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.782051282051282,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.763888888888889,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6962025316455697,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8933333333333333,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8933333333333333,
"eval_PERSON_recall": 0.8933333333333333,
"eval_QUANTITY_f1": 0.8529411764705883,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.8285714285714286,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8275862068965517,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.26732492446899414,
"eval_overall_accuracy": 0.9648399612027158,
"eval_overall_f1": 0.8440111420612814,
"eval_overall_precision": 0.816711590296496,
"eval_overall_recall": 0.8731988472622478,
"eval_runtime": 1.0306,
"eval_samples_per_second": 181.45,
"eval_steps_per_second": 2.911,
"step": 4770
},
{
"epoch": 46.0,
"grad_norm": 0.009263483807444572,
"learning_rate": 2.7000000000000002e-05,
"loss": 0.0015,
"step": 4876
},
{
"epoch": 46.0,
"eval_LOCATION_f1": 0.8435374149659864,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.8157894736842105,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7769784172661871,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7297297297297297,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.913907284768212,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9078947368421053,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.8285714285714285,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7837837837837838,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8275862068965517,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.2788328230381012,
"eval_overall_accuracy": 0.9662948593598448,
"eval_overall_f1": 0.8587412587412588,
"eval_overall_precision": 0.8342391304347826,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.9441,
"eval_samples_per_second": 198.082,
"eval_steps_per_second": 3.178,
"step": 4876
},
{
"epoch": 47.0,
"grad_norm": 0.016023587435483932,
"learning_rate": 2.6500000000000004e-05,
"loss": 0.0019,
"step": 4982
},
{
"epoch": 47.0,
"eval_LOCATION_f1": 0.8513513513513514,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.8181818181818182,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.8235294117647058,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7887323943661971,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.9169435215946843,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9139072847682119,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.8055555555555556,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7435897435897436,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8275862068965518,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.2903594672679901,
"eval_overall_accuracy": 0.9670223084384093,
"eval_overall_f1": 0.8671328671328672,
"eval_overall_precision": 0.842391304347826,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.9543,
"eval_samples_per_second": 195.955,
"eval_steps_per_second": 3.144,
"step": 4982
},
{
"epoch": 48.0,
"grad_norm": 0.0013861858751624823,
"learning_rate": 2.6000000000000002e-05,
"loss": 0.0016,
"step": 5088
},
{
"epoch": 48.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.759493670886076,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7755102040816327,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6951219512195121,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.9174917491749175,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9084967320261438,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.8055555555555556,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7435897435897436,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.30562856793403625,
"eval_overall_accuracy": 0.962172647914646,
"eval_overall_f1": 0.8454172366621068,
"eval_overall_precision": 0.8046875,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.953,
"eval_samples_per_second": 196.222,
"eval_steps_per_second": 3.148,
"step": 5088
},
{
"epoch": 49.0,
"grad_norm": 0.004494914319366217,
"learning_rate": 2.5500000000000003e-05,
"loss": 0.0021,
"step": 5194
},
{
"epoch": 49.0,
"eval_LOCATION_f1": 0.8266666666666665,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7913669064748202,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7432432432432432,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.913907284768212,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9078947368421053,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.8285714285714285,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7837837837837838,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.30186086893081665,
"eval_overall_accuracy": 0.9643549951503395,
"eval_overall_f1": 0.8583333333333334,
"eval_overall_precision": 0.8284182305630027,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.9632,
"eval_samples_per_second": 194.143,
"eval_steps_per_second": 3.115,
"step": 5194
},
{
"epoch": 50.0,
"grad_norm": 0.07165616750717163,
"learning_rate": 2.5e-05,
"loss": 0.0013,
"step": 5300
},
{
"epoch": 50.0,
"eval_LOCATION_f1": 0.794701986754967,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.76056338028169,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7012987012987013,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.9084967320261438,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8910256410256411,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.8285714285714285,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7837837837837838,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.3192538917064667,
"eval_overall_accuracy": 0.9604752667313288,
"eval_overall_f1": 0.8395061728395062,
"eval_overall_precision": 0.8010471204188482,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.9477,
"eval_samples_per_second": 197.324,
"eval_steps_per_second": 3.166,
"step": 5300
},
{
"epoch": 51.0,
"grad_norm": 0.0017693530535325408,
"learning_rate": 2.45e-05,
"loss": 0.0013,
"step": 5406
},
{
"epoch": 51.0,
"eval_LOCATION_f1": 0.8187919463087248,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.782051282051282,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7808219178082192,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7037037037037037,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.9055374592833875,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8853503184713376,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.8285714285714285,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7837837837837838,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8275862068965517,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.3206080496311188,
"eval_overall_accuracy": 0.9616876818622696,
"eval_overall_f1": 0.850480109739369,
"eval_overall_precision": 0.8115183246073299,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.9406,
"eval_samples_per_second": 198.804,
"eval_steps_per_second": 3.189,
"step": 5406
},
{
"epoch": 52.0,
"grad_norm": 0.077069491147995,
"learning_rate": 2.4e-05,
"loss": 0.0014,
"step": 5512
},
{
"epoch": 52.0,
"eval_LOCATION_f1": 0.8299319727891157,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.8026315789473685,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7801418439716312,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7236842105263158,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.9144736842105262,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9025974025974026,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.8285714285714285,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7837837837837838,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8275862068965517,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.29891258478164673,
"eval_overall_accuracy": 0.9653249272550921,
"eval_overall_f1": 0.8567454798331016,
"eval_overall_precision": 0.8279569892473119,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.9575,
"eval_samples_per_second": 195.296,
"eval_steps_per_second": 3.133,
"step": 5512
},
{
"epoch": 53.0,
"grad_norm": 0.002096625277772546,
"learning_rate": 2.35e-05,
"loss": 0.0007,
"step": 5618
},
{
"epoch": 53.0,
"eval_LOCATION_f1": 0.8194444444444445,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.8082191780821918,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7913669064748202,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7432432432432432,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.9042904290429042,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8954248366013072,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.8405797101449276,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.8055555555555556,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8928571428571429,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8928571428571429,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.30264776945114136,
"eval_overall_accuracy": 0.9672647914645974,
"eval_overall_f1": 0.8579465541490857,
"eval_overall_precision": 0.8379120879120879,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.951,
"eval_samples_per_second": 196.632,
"eval_steps_per_second": 3.155,
"step": 5618
},
{
"epoch": 54.0,
"grad_norm": 0.001791234826669097,
"learning_rate": 2.3000000000000003e-05,
"loss": 0.0014,
"step": 5724
},
{
"epoch": 54.0,
"eval_LOCATION_f1": 0.8243243243243243,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7922077922077922,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.8055555555555556,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7341772151898734,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8983606557377048,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8838709677419355,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.8529411764705883,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.8285714285714286,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8771929824561403,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8620689655172413,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.305812805891037,
"eval_overall_accuracy": 0.9670223084384093,
"eval_overall_f1": 0.8587257617728532,
"eval_overall_precision": 0.8266666666666667,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.9512,
"eval_samples_per_second": 196.589,
"eval_steps_per_second": 3.154,
"step": 5724
},
{
"epoch": 55.0,
"grad_norm": 0.0006963410996831954,
"learning_rate": 2.25e-05,
"loss": 0.0013,
"step": 5830
},
{
"epoch": 55.0,
"eval_LOCATION_f1": 0.8133333333333335,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7826086956521738,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7397260273972602,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.9084967320261438,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8910256410256411,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7714285714285715,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7297297297297297,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8275862068965518,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.31985101103782654,
"eval_overall_accuracy": 0.9619301648884578,
"eval_overall_f1": 0.8448753462603877,
"eval_overall_precision": 0.8133333333333334,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.9536,
"eval_samples_per_second": 196.106,
"eval_steps_per_second": 3.146,
"step": 5830
},
{
"epoch": 56.0,
"grad_norm": 0.004016083665192127,
"learning_rate": 2.2000000000000003e-05,
"loss": 0.002,
"step": 5936
},
{
"epoch": 56.0,
"eval_LOCATION_f1": 0.8266666666666665,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7971014492753623,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7534246575342466,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.9084967320261438,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8910256410256411,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.8055555555555556,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7435897435897436,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.33322784304618835,
"eval_overall_accuracy": 0.962172647914646,
"eval_overall_f1": 0.8524137931034482,
"eval_overall_precision": 0.8174603174603174,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.9475,
"eval_samples_per_second": 197.363,
"eval_steps_per_second": 3.166,
"step": 5936
},
{
"epoch": 57.0,
"grad_norm": 0.002730452921241522,
"learning_rate": 2.15e-05,
"loss": 0.0006,
"step": 6042
},
{
"epoch": 57.0,
"eval_LOCATION_f1": 0.8211920529801324,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.775,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7862068965517242,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7125,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.9084967320261438,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8910256410256411,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.8169014084507042,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7631578947368421,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.3458655774593353,
"eval_overall_accuracy": 0.9612027158098934,
"eval_overall_f1": 0.8497267759562841,
"eval_overall_precision": 0.8077922077922078,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.9455,
"eval_samples_per_second": 197.779,
"eval_steps_per_second": 3.173,
"step": 6042
},
{
"epoch": 58.0,
"grad_norm": 0.0037386000622063875,
"learning_rate": 2.1e-05,
"loss": 0.0014,
"step": 6148
},
{
"epoch": 58.0,
"eval_LOCATION_f1": 0.8079470198675496,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.802721088435374,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7195121951219512,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.9049180327868852,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8903225806451613,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.8169014084507042,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7631578947368421,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.32678091526031494,
"eval_overall_accuracy": 0.9614451988360815,
"eval_overall_f1": 0.8485675306957708,
"eval_overall_precision": 0.805699481865285,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.9604,
"eval_samples_per_second": 194.708,
"eval_steps_per_second": 3.124,
"step": 6148
},
{
"epoch": 59.0,
"grad_norm": 0.0023347027599811554,
"learning_rate": 2.05e-05,
"loss": 0.0012,
"step": 6254
},
{
"epoch": 59.0,
"eval_LOCATION_f1": 0.8181818181818181,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7590361445783133,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7631578947368421,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.9042904290429042,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8954248366013072,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.8450704225352113,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7894736842105263,
"eval_QUANTITY_recall": 0.9090909090909091,
"eval_TIME_f1": 0.8275862068965518,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.3488438129425049,
"eval_overall_accuracy": 0.9604752667313288,
"eval_overall_f1": 0.8455284552845529,
"eval_overall_precision": 0.7979539641943734,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.9526,
"eval_samples_per_second": 196.312,
"eval_steps_per_second": 3.149,
"step": 6254
},
{
"epoch": 60.0,
"grad_norm": 0.0007857033051550388,
"learning_rate": 2e-05,
"loss": 0.0015,
"step": 6360
},
{
"epoch": 60.0,
"eval_LOCATION_f1": 0.8133333333333335,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7724137931034483,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.9108910891089109,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9019607843137255,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.8285714285714285,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7837837837837838,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.3345150947570801,
"eval_overall_accuracy": 0.962172647914646,
"eval_overall_f1": 0.8528198074277854,
"eval_overall_precision": 0.8157894736842105,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.9473,
"eval_samples_per_second": 197.404,
"eval_steps_per_second": 3.167,
"step": 6360
},
{
"epoch": 61.0,
"grad_norm": 0.0016401028260588646,
"learning_rate": 1.9500000000000003e-05,
"loss": 0.0005,
"step": 6466
},
{
"epoch": 61.0,
"eval_LOCATION_f1": 0.8157894736842104,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.8,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7466666666666667,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.9078947368421053,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8961038961038961,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.8450704225352113,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7894736842105263,
"eval_QUANTITY_recall": 0.9090909090909091,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.3476317226886749,
"eval_overall_accuracy": 0.9624151309408342,
"eval_overall_f1": 0.8539944903581268,
"eval_overall_precision": 0.8179419525065963,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.9315,
"eval_samples_per_second": 200.75,
"eval_steps_per_second": 3.221,
"step": 6466
},
{
"epoch": 62.0,
"grad_norm": 0.02758892811834812,
"learning_rate": 1.9e-05,
"loss": 0.001,
"step": 6572
},
{
"epoch": 62.0,
"eval_LOCATION_f1": 0.8211920529801324,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.775,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.8028169014084509,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7402597402597403,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.9078947368421053,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8961038961038961,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.8285714285714285,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7837837837837838,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.3546055257320404,
"eval_overall_accuracy": 0.9633850630455868,
"eval_overall_f1": 0.8539944903581268,
"eval_overall_precision": 0.8179419525065963,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.9503,
"eval_samples_per_second": 196.775,
"eval_steps_per_second": 3.157,
"step": 6572
},
{
"epoch": 63.0,
"grad_norm": 0.32324543595314026,
"learning_rate": 1.85e-05,
"loss": 0.0008,
"step": 6678
},
{
"epoch": 63.0,
"eval_LOCATION_f1": 0.8026315789473684,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7862068965517242,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7125,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.9049180327868852,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8903225806451613,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.8571428571428571,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.8108108108108109,
"eval_QUANTITY_recall": 0.9090909090909091,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.3560656011104584,
"eval_overall_accuracy": 0.9616876818622696,
"eval_overall_f1": 0.8481532147742818,
"eval_overall_precision": 0.8072916666666666,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.9525,
"eval_samples_per_second": 196.325,
"eval_steps_per_second": 3.15,
"step": 6678
},
{
"epoch": 64.0,
"grad_norm": 0.0021076402626931667,
"learning_rate": 1.8e-05,
"loss": 0.0012,
"step": 6784
},
{
"epoch": 64.0,
"eval_LOCATION_f1": 0.8344370860927152,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7875,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7887323943661972,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7272727272727273,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.9144736842105262,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9025974025974026,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.8285714285714285,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7837837837837838,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.33117640018463135,
"eval_overall_accuracy": 0.9624151309408342,
"eval_overall_f1": 0.8567493112947657,
"eval_overall_precision": 0.820580474934037,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.9576,
"eval_samples_per_second": 195.279,
"eval_steps_per_second": 3.133,
"step": 6784
},
{
"epoch": 65.0,
"grad_norm": 0.27350062131881714,
"learning_rate": 1.75e-05,
"loss": 0.0017,
"step": 6890
},
{
"epoch": 65.0,
"eval_LOCATION_f1": 0.7894736842105262,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7407407407407407,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7913669064748202,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7432432432432432,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.9055374592833875,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8853503184713376,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.8450704225352113,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7894736842105263,
"eval_QUANTITY_recall": 0.9090909090909091,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.3442927598953247,
"eval_overall_accuracy": 0.9602327837051406,
"eval_overall_f1": 0.8461538461538461,
"eval_overall_precision": 0.8083989501312336,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.953,
"eval_samples_per_second": 196.22,
"eval_steps_per_second": 3.148,
"step": 6890
},
{
"epoch": 66.0,
"grad_norm": 0.7737051248550415,
"learning_rate": 1.7000000000000003e-05,
"loss": 0.0005,
"step": 6996
},
{
"epoch": 66.0,
"eval_LOCATION_f1": 0.7763157894736843,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7913669064748202,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7432432432432432,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.9055374592833875,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8853503184713376,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.8169014084507042,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7631578947368421,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.7868852459016394,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7272727272727273,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.3465050756931305,
"eval_overall_accuracy": 0.9602327837051406,
"eval_overall_f1": 0.8383561643835616,
"eval_overall_precision": 0.7989556135770235,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.9746,
"eval_samples_per_second": 191.87,
"eval_steps_per_second": 3.078,
"step": 6996
},
{
"epoch": 67.0,
"grad_norm": 0.0003085023781750351,
"learning_rate": 1.65e-05,
"loss": 0.0004,
"step": 7102
},
{
"epoch": 67.0,
"eval_LOCATION_f1": 0.8266666666666665,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.8115942028985507,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7671232876712328,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.9114754098360656,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.896774193548387,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.8450704225352113,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7894736842105263,
"eval_QUANTITY_recall": 0.9090909090909091,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.3288689851760864,
"eval_overall_accuracy": 0.9638700290979632,
"eval_overall_f1": 0.8591160220994475,
"eval_overall_precision": 0.8249336870026526,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.9508,
"eval_samples_per_second": 196.673,
"eval_steps_per_second": 3.155,
"step": 7102
},
{
"epoch": 68.0,
"grad_norm": 0.0015671561704948545,
"learning_rate": 1.6000000000000003e-05,
"loss": 0.0002,
"step": 7208
},
{
"epoch": 68.0,
"eval_LOCATION_f1": 0.832214765100671,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.8,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7466666666666667,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.9144736842105262,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9025974025974026,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.8450704225352113,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7894736842105263,
"eval_QUANTITY_recall": 0.9090909090909091,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.33385857939720154,
"eval_overall_accuracy": 0.9641125121241513,
"eval_overall_f1": 0.8591160220994475,
"eval_overall_precision": 0.8249336870026526,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.9543,
"eval_samples_per_second": 195.947,
"eval_steps_per_second": 3.144,
"step": 7208
},
{
"epoch": 69.0,
"grad_norm": 0.0012689490104094148,
"learning_rate": 1.55e-05,
"loss": 0.0006,
"step": 7314
},
{
"epoch": 69.0,
"eval_LOCATION_f1": 0.8400000000000001,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7974683544303798,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7215189873417722,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6129032258064516,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.9078947368421053,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8961038961038961,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.8285714285714285,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7837837837837838,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.35171428322792053,
"eval_overall_accuracy": 0.9580504364694471,
"eval_overall_f1": 0.8382749326145552,
"eval_overall_precision": 0.7873417721518987,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.953,
"eval_samples_per_second": 196.232,
"eval_steps_per_second": 3.148,
"step": 7314
},
{
"epoch": 70.0,
"grad_norm": 0.00089789874618873,
"learning_rate": 1.5e-05,
"loss": 0.001,
"step": 7420
},
{
"epoch": 70.0,
"eval_LOCATION_f1": 0.8378378378378378,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.8051948051948052,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7913669064748202,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7432432432432432,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.9049180327868852,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8903225806451613,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.8285714285714285,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7837837837837838,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.32278671860694885,
"eval_overall_accuracy": 0.9648399612027158,
"eval_overall_f1": 0.853185595567867,
"eval_overall_precision": 0.8213333333333334,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 1.0201,
"eval_samples_per_second": 183.317,
"eval_steps_per_second": 2.941,
"step": 7420
},
{
"epoch": 71.0,
"grad_norm": 0.001998705556616187,
"learning_rate": 1.45e-05,
"loss": 0.0002,
"step": 7526
},
{
"epoch": 71.0,
"eval_LOCATION_f1": 0.8400000000000001,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7974683544303798,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.8111888111888114,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7435897435897436,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.9049180327868852,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8903225806451613,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.8285714285714285,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7837837837837838,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.3305073380470276,
"eval_overall_accuracy": 0.9633850630455868,
"eval_overall_f1": 0.8571428571428571,
"eval_overall_precision": 0.8188976377952756,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.9607,
"eval_samples_per_second": 194.654,
"eval_steps_per_second": 3.123,
"step": 7526
},
{
"epoch": 72.0,
"grad_norm": 0.0005069375038146973,
"learning_rate": 1.4000000000000001e-05,
"loss": 0.0006,
"step": 7632
},
{
"epoch": 72.0,
"eval_LOCATION_f1": 0.8356164383561644,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.8133333333333334,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7826086956521738,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7397260273972602,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.9271523178807947,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9210526315789473,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.8000000000000002,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7567567567567568,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.30825239419937134,
"eval_overall_accuracy": 0.9675072744907857,
"eval_overall_f1": 0.8575418994413407,
"eval_overall_precision": 0.8319783197831978,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.9597,
"eval_samples_per_second": 194.861,
"eval_steps_per_second": 3.126,
"step": 7632
},
{
"epoch": 73.0,
"grad_norm": 0.0007079507340677083,
"learning_rate": 1.3500000000000001e-05,
"loss": 0.0003,
"step": 7738
},
{
"epoch": 73.0,
"eval_LOCATION_f1": 0.8266666666666665,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7857142857142856,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7333333333333333,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.9205298013245033,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9144736842105263,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.8000000000000002,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7567567567567568,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.3165390193462372,
"eval_overall_accuracy": 0.9667798254122212,
"eval_overall_f1": 0.853185595567867,
"eval_overall_precision": 0.8213333333333334,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.9558,
"eval_samples_per_second": 195.657,
"eval_steps_per_second": 3.139,
"step": 7738
},
{
"epoch": 74.0,
"grad_norm": 0.00018394706421531737,
"learning_rate": 1.3000000000000001e-05,
"loss": 0.0002,
"step": 7844
},
{
"epoch": 74.0,
"eval_LOCATION_f1": 0.8053691275167785,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7692307692307693,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.8085106382978723,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.75,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.9235880398671096,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9205298013245033,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.8000000000000002,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7567567567567568,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.31818944215774536,
"eval_overall_accuracy": 0.967992240543162,
"eval_overall_f1": 0.8555555555555555,
"eval_overall_precision": 0.8257372654155496,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.9609,
"eval_samples_per_second": 194.606,
"eval_steps_per_second": 3.122,
"step": 7844
},
{
"epoch": 75.0,
"grad_norm": 0.00024878690601326525,
"learning_rate": 1.25e-05,
"loss": 0.0012,
"step": 7950
},
{
"epoch": 75.0,
"eval_LOCATION_f1": 0.8026315789473684,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.8082191780821918,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7283950617283951,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.9180327868852459,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9032258064516129,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.8169014084507042,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7631578947368421,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.34358134865760803,
"eval_overall_accuracy": 0.9641125121241513,
"eval_overall_f1": 0.8528610354223433,
"eval_overall_precision": 0.8087855297157622,
"eval_overall_recall": 0.9020172910662824,
"eval_runtime": 0.9518,
"eval_samples_per_second": 196.477,
"eval_steps_per_second": 3.152,
"step": 7950
},
{
"epoch": 76.0,
"grad_norm": 0.0002495927328709513,
"learning_rate": 1.2e-05,
"loss": 0.0002,
"step": 8056
},
{
"epoch": 76.0,
"eval_LOCATION_f1": 0.8026315789473684,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.802721088435374,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7195121951219512,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.9210526315789475,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9090909090909091,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.8285714285714285,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7837837837837838,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.34999027848243713,
"eval_overall_accuracy": 0.9636275460717749,
"eval_overall_f1": 0.854024556616644,
"eval_overall_precision": 0.810880829015544,
"eval_overall_recall": 0.9020172910662824,
"eval_runtime": 0.9639,
"eval_samples_per_second": 194.004,
"eval_steps_per_second": 3.112,
"step": 8056
},
{
"epoch": 77.0,
"grad_norm": 0.000243131464230828,
"learning_rate": 1.1500000000000002e-05,
"loss": 0.0007,
"step": 8162
},
{
"epoch": 77.0,
"eval_LOCATION_f1": 0.8079470198675496,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.8137931034482759,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7375,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.9210526315789475,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9090909090909091,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.8285714285714285,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7837837837837838,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.3344757556915283,
"eval_overall_accuracy": 0.9645974781765276,
"eval_overall_f1": 0.8575342465753425,
"eval_overall_precision": 0.8172323759791122,
"eval_overall_recall": 0.9020172910662824,
"eval_runtime": 0.9601,
"eval_samples_per_second": 194.77,
"eval_steps_per_second": 3.125,
"step": 8162
},
{
"epoch": 78.0,
"grad_norm": 0.00021198501053731889,
"learning_rate": 1.1000000000000001e-05,
"loss": 0.0006,
"step": 8268
},
{
"epoch": 78.0,
"eval_LOCATION_f1": 0.8079470198675496,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.802919708029197,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7638888888888888,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.9210526315789475,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9090909090909091,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.8285714285714285,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7837837837837838,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.3224840760231018,
"eval_overall_accuracy": 0.9655674102812803,
"eval_overall_f1": 0.8559556786703602,
"eval_overall_precision": 0.824,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.9532,
"eval_samples_per_second": 196.177,
"eval_steps_per_second": 3.147,
"step": 8268
},
{
"epoch": 79.0,
"grad_norm": 0.0016178454970940948,
"learning_rate": 1.05e-05,
"loss": 0.0002,
"step": 8374
},
{
"epoch": 79.0,
"eval_LOCATION_f1": 0.8079470198675496,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7913669064748202,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7432432432432432,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.9180327868852459,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9032258064516129,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.8285714285714285,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7837837837837838,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8275862068965518,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.3340538740158081,
"eval_overall_accuracy": 0.965082444228904,
"eval_overall_f1": 0.8547717842323651,
"eval_overall_precision": 0.8218085106382979,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 1.013,
"eval_samples_per_second": 184.602,
"eval_steps_per_second": 2.962,
"step": 8374
},
{
"epoch": 80.0,
"grad_norm": 0.0010399464517831802,
"learning_rate": 1e-05,
"loss": 0.0005,
"step": 8480
},
{
"epoch": 80.0,
"eval_LOCATION_f1": 0.8133333333333335,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7913669064748202,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7432432432432432,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.9144736842105262,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9025974025974026,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.8285714285714285,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7837837837837838,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8275862068965518,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.3451690971851349,
"eval_overall_accuracy": 0.965082444228904,
"eval_overall_f1": 0.8543689320388349,
"eval_overall_precision": 0.8235294117647058,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.9594,
"eval_samples_per_second": 194.923,
"eval_steps_per_second": 3.127,
"step": 8480
},
{
"epoch": 81.0,
"grad_norm": 0.0004898614133708179,
"learning_rate": 9.5e-06,
"loss": 0.0002,
"step": 8586
},
{
"epoch": 81.0,
"eval_LOCATION_f1": 0.8133333333333335,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7857142857142856,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7333333333333333,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.9144736842105262,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9025974025974026,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.8285714285714285,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7837837837837838,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8275862068965518,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.3453369140625,
"eval_overall_accuracy": 0.965082444228904,
"eval_overall_f1": 0.853185595567867,
"eval_overall_precision": 0.8213333333333334,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.9528,
"eval_samples_per_second": 196.26,
"eval_steps_per_second": 3.149,
"step": 8586
},
{
"epoch": 82.0,
"grad_norm": 0.0012529068626463413,
"learning_rate": 9e-06,
"loss": 0.0002,
"step": 8692
},
{
"epoch": 82.0,
"eval_LOCATION_f1": 0.8076923076923077,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7411764705882353,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7943262411347517,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7368421052631579,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.9049180327868852,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8903225806451613,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.8285714285714285,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7837837837837838,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.3554005026817322,
"eval_overall_accuracy": 0.9641125121241513,
"eval_overall_f1": 0.8481532147742818,
"eval_overall_precision": 0.8072916666666666,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.9565,
"eval_samples_per_second": 195.504,
"eval_steps_per_second": 3.136,
"step": 8692
},
{
"epoch": 83.0,
"grad_norm": 0.0037664775736629963,
"learning_rate": 8.500000000000002e-06,
"loss": 0.0005,
"step": 8798
},
{
"epoch": 83.0,
"eval_LOCATION_f1": 0.8079470198675496,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7681159420289856,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.726027397260274,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.9102990033222591,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9072847682119205,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.8285714285714285,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7837837837837838,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8571428571428571,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.33550789952278137,
"eval_overall_accuracy": 0.965082444228904,
"eval_overall_f1": 0.8491620111731844,
"eval_overall_precision": 0.8238482384823849,
"eval_overall_recall": 0.8760806916426513,
"eval_runtime": 0.9544,
"eval_samples_per_second": 195.933,
"eval_steps_per_second": 3.143,
"step": 8798
},
{
"epoch": 84.0,
"grad_norm": 0.00019280197739135474,
"learning_rate": 8.000000000000001e-06,
"loss": 0.0002,
"step": 8904
},
{
"epoch": 84.0,
"eval_LOCATION_f1": 0.7922077922077921,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7659574468085107,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7105263157894737,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.9049180327868852,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8903225806451613,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.8571428571428571,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.8108108108108109,
"eval_QUANTITY_recall": 0.9090909090909091,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.3492893576622009,
"eval_overall_accuracy": 0.9633850630455868,
"eval_overall_f1": 0.8422496570644719,
"eval_overall_precision": 0.8036649214659686,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.9553,
"eval_samples_per_second": 195.753,
"eval_steps_per_second": 3.14,
"step": 8904
},
{
"epoch": 85.0,
"grad_norm": 0.0007057705661281943,
"learning_rate": 7.5e-06,
"loss": 0.0003,
"step": 9010
},
{
"epoch": 85.0,
"eval_LOCATION_f1": 0.7973856209150327,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7714285714285715,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.72,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.9049180327868852,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8903225806451613,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.8285714285714285,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7837837837837838,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.3493691086769104,
"eval_overall_accuracy": 0.9636275460717749,
"eval_overall_f1": 0.8418156808803301,
"eval_overall_precision": 0.8052631578947368,
"eval_overall_recall": 0.8818443804034583,
"eval_runtime": 0.9473,
"eval_samples_per_second": 197.399,
"eval_steps_per_second": 3.167,
"step": 9010
},
{
"epoch": 86.0,
"grad_norm": 0.00023777979367878288,
"learning_rate": 7.000000000000001e-06,
"loss": 0.0002,
"step": 9116
},
{
"epoch": 86.0,
"eval_LOCATION_f1": 0.7973856209150327,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7801418439716312,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7236842105263158,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.9049180327868852,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8903225806451613,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.8285714285714285,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7837837837837838,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.35241079330444336,
"eval_overall_accuracy": 0.9641125121241513,
"eval_overall_f1": 0.8434065934065933,
"eval_overall_precision": 0.8057742782152231,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.9506,
"eval_samples_per_second": 196.717,
"eval_steps_per_second": 3.156,
"step": 9116
},
{
"epoch": 87.0,
"grad_norm": 0.0003070076636504382,
"learning_rate": 6.5000000000000004e-06,
"loss": 0.0002,
"step": 9222
},
{
"epoch": 87.0,
"eval_LOCATION_f1": 0.8104575163398693,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7785234899328859,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6904761904761905,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.9084967320261438,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8910256410256411,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.8285714285714285,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7837837837837838,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.3664219081401825,
"eval_overall_accuracy": 0.9629000969932104,
"eval_overall_f1": 0.8466757123473542,
"eval_overall_precision": 0.8,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.9567,
"eval_samples_per_second": 195.468,
"eval_steps_per_second": 3.136,
"step": 9222
},
{
"epoch": 88.0,
"grad_norm": 0.0003128907410427928,
"learning_rate": 6e-06,
"loss": 0.0002,
"step": 9328
},
{
"epoch": 88.0,
"eval_LOCATION_f1": 0.8053691275167785,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7692307692307693,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7792207792207791,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6741573033707865,
"eval_ORGANIZATION_recall": 0.9230769230769231,
"eval_PERSON_f1": 0.9180327868852459,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9032258064516129,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.8450704225352113,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7894736842105263,
"eval_QUANTITY_recall": 0.9090909090909091,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.3721804618835449,
"eval_overall_accuracy": 0.9626576139670223,
"eval_overall_f1": 0.8509485094850948,
"eval_overall_precision": 0.80306905370844,
"eval_overall_recall": 0.9048991354466859,
"eval_runtime": 0.9518,
"eval_samples_per_second": 196.461,
"eval_steps_per_second": 3.152,
"step": 9328
},
{
"epoch": 89.0,
"grad_norm": 0.0002441601827740669,
"learning_rate": 5.500000000000001e-06,
"loss": 0.0002,
"step": 9434
},
{
"epoch": 89.0,
"eval_LOCATION_f1": 0.7894736842105262,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7407407407407407,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7837837837837838,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6987951807228916,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.9180327868852459,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9032258064516129,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.8571428571428571,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.8108108108108109,
"eval_QUANTITY_recall": 0.9090909090909091,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.3669990599155426,
"eval_overall_accuracy": 0.9629000969932104,
"eval_overall_f1": 0.8501362397820164,
"eval_overall_precision": 0.8062015503875969,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.968,
"eval_samples_per_second": 193.188,
"eval_steps_per_second": 3.099,
"step": 9434
},
{
"epoch": 90.0,
"grad_norm": 0.001270479173399508,
"learning_rate": 5e-06,
"loss": 0.0002,
"step": 9540
},
{
"epoch": 90.0,
"eval_LOCATION_f1": 0.7894736842105262,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7407407407407407,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7837837837837838,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6987951807228916,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.9180327868852459,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9032258064516129,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.8571428571428571,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.8108108108108109,
"eval_QUANTITY_recall": 0.9090909090909091,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.36801740527153015,
"eval_overall_accuracy": 0.9629000969932104,
"eval_overall_f1": 0.8501362397820164,
"eval_overall_precision": 0.8062015503875969,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.9464,
"eval_samples_per_second": 197.59,
"eval_steps_per_second": 3.17,
"step": 9540
},
{
"epoch": 91.0,
"grad_norm": 0.00022247471497394145,
"learning_rate": 4.5e-06,
"loss": 0.0002,
"step": 9646
},
{
"epoch": 91.0,
"eval_LOCATION_f1": 0.7894736842105262,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7407407407407407,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7837837837837838,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6987951807228916,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.9084967320261438,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8910256410256411,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.8571428571428571,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.8108108108108109,
"eval_QUANTITY_recall": 0.9090909090909091,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.3627462089061737,
"eval_overall_accuracy": 0.9629000969932104,
"eval_overall_f1": 0.8462585034013606,
"eval_overall_precision": 0.8015463917525774,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.9545,
"eval_samples_per_second": 195.918,
"eval_steps_per_second": 3.143,
"step": 9646
},
{
"epoch": 92.0,
"grad_norm": 0.00013813188706990331,
"learning_rate": 4.000000000000001e-06,
"loss": 0.0002,
"step": 9752
},
{
"epoch": 92.0,
"eval_LOCATION_f1": 0.7973856209150327,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7785234899328859,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6904761904761905,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.9180327868852459,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9032258064516129,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.8571428571428571,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.8108108108108109,
"eval_QUANTITY_recall": 0.9090909090909091,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.3727177083492279,
"eval_overall_accuracy": 0.9629000969932104,
"eval_overall_f1": 0.8493894165535958,
"eval_overall_precision": 0.8025641025641026,
"eval_overall_recall": 0.9020172910662824,
"eval_runtime": 0.954,
"eval_samples_per_second": 196.013,
"eval_steps_per_second": 3.145,
"step": 9752
},
{
"epoch": 93.0,
"grad_norm": 0.000215419742744416,
"learning_rate": 3.5000000000000004e-06,
"loss": 0.0002,
"step": 9858
},
{
"epoch": 93.0,
"eval_LOCATION_f1": 0.7894736842105262,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7407407407407407,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7837837837837838,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6987951807228916,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.9084967320261438,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8910256410256411,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.8571428571428571,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.8108108108108109,
"eval_QUANTITY_recall": 0.9090909090909091,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.37157806754112244,
"eval_overall_accuracy": 0.962172647914646,
"eval_overall_f1": 0.8451086956521738,
"eval_overall_precision": 0.7994858611825193,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.9451,
"eval_samples_per_second": 197.862,
"eval_steps_per_second": 3.174,
"step": 9858
},
{
"epoch": 94.0,
"grad_norm": 0.0003316714719403535,
"learning_rate": 3e-06,
"loss": 0.0002,
"step": 9964
},
{
"epoch": 94.0,
"eval_LOCATION_f1": 0.7894736842105262,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7407407407407407,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.8082191780821918,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7283950617283951,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.9205298013245033,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9144736842105263,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.8571428571428571,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.8108108108108109,
"eval_QUANTITY_recall": 0.9090909090909091,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.35780400037765503,
"eval_overall_accuracy": 0.9643549951503395,
"eval_overall_f1": 0.8559670781893004,
"eval_overall_precision": 0.8167539267015707,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.9435,
"eval_samples_per_second": 198.203,
"eval_steps_per_second": 3.18,
"step": 9964
},
{
"epoch": 95.0,
"grad_norm": 0.005569119472056627,
"learning_rate": 2.5e-06,
"loss": 0.0002,
"step": 10070
},
{
"epoch": 95.0,
"eval_LOCATION_f1": 0.7894736842105262,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7407407407407407,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.8082191780821918,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7283950617283951,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.9205298013245033,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9144736842105263,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.8571428571428571,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.8108108108108109,
"eval_QUANTITY_recall": 0.9090909090909091,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.3565683662891388,
"eval_overall_accuracy": 0.9645974781765276,
"eval_overall_f1": 0.8559670781893004,
"eval_overall_precision": 0.8167539267015707,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.9611,
"eval_samples_per_second": 194.577,
"eval_steps_per_second": 3.122,
"step": 10070
},
{
"epoch": 96.0,
"grad_norm": 0.00045707172830589116,
"learning_rate": 2.0000000000000003e-06,
"loss": 0.0006,
"step": 10176
},
{
"epoch": 96.0,
"eval_LOCATION_f1": 0.7894736842105262,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7407407407407407,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7945205479452054,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7160493827160493,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.9180327868852459,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9032258064516129,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.8571428571428571,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.8108108108108109,
"eval_QUANTITY_recall": 0.9090909090909091,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.3609143793582916,
"eval_overall_accuracy": 0.9641125121241513,
"eval_overall_f1": 0.8524590163934427,
"eval_overall_precision": 0.8103896103896104,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.9457,
"eval_samples_per_second": 197.739,
"eval_steps_per_second": 3.172,
"step": 10176
},
{
"epoch": 97.0,
"grad_norm": 0.0002619586593937129,
"learning_rate": 1.5e-06,
"loss": 0.0003,
"step": 10282
},
{
"epoch": 97.0,
"eval_LOCATION_f1": 0.7894736842105262,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7407407407407407,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7945205479452054,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7160493827160493,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.9180327868852459,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9032258064516129,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.8571428571428571,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.8108108108108109,
"eval_QUANTITY_recall": 0.9090909090909091,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.3629205524921417,
"eval_overall_accuracy": 0.9641125121241513,
"eval_overall_f1": 0.8524590163934427,
"eval_overall_precision": 0.8103896103896104,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.9477,
"eval_samples_per_second": 197.31,
"eval_steps_per_second": 3.165,
"step": 10282
},
{
"epoch": 98.0,
"grad_norm": 0.0001948641292983666,
"learning_rate": 1.0000000000000002e-06,
"loss": 0.0002,
"step": 10388
},
{
"epoch": 98.0,
"eval_LOCATION_f1": 0.7894736842105262,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7407407407407407,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7945205479452054,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7160493827160493,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.9180327868852459,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9032258064516129,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.8571428571428571,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.8108108108108109,
"eval_QUANTITY_recall": 0.9090909090909091,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.35546010732650757,
"eval_overall_accuracy": 0.9645974781765276,
"eval_overall_f1": 0.8524590163934427,
"eval_overall_precision": 0.8103896103896104,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.9637,
"eval_samples_per_second": 194.037,
"eval_steps_per_second": 3.113,
"step": 10388
},
{
"epoch": 99.0,
"grad_norm": 0.023726776242256165,
"learning_rate": 5.000000000000001e-07,
"loss": 0.0002,
"step": 10494
},
{
"epoch": 99.0,
"eval_LOCATION_f1": 0.7894736842105262,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7407407407407407,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7945205479452054,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7160493827160493,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.9180327868852459,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9032258064516129,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.8571428571428571,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.8108108108108109,
"eval_QUANTITY_recall": 0.9090909090909091,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.35447004437446594,
"eval_overall_accuracy": 0.9648399612027158,
"eval_overall_f1": 0.8524590163934427,
"eval_overall_precision": 0.8103896103896104,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.951,
"eval_samples_per_second": 196.644,
"eval_steps_per_second": 3.155,
"step": 10494
},
{
"epoch": 100.0,
"grad_norm": 0.0003471510426606983,
"learning_rate": 0.0,
"loss": 0.0004,
"step": 10600
},
{
"epoch": 100.0,
"eval_LOCATION_f1": 0.7894736842105262,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7407407407407407,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7945205479452054,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7160493827160493,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.9180327868852459,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.9032258064516129,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.8571428571428571,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.8108108108108109,
"eval_QUANTITY_recall": 0.9090909090909091,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.3544124364852905,
"eval_overall_accuracy": 0.9645974781765276,
"eval_overall_f1": 0.8524590163934427,
"eval_overall_precision": 0.8103896103896104,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.9623,
"eval_samples_per_second": 194.318,
"eval_steps_per_second": 3.117,
"step": 10600
},
{
"epoch": 100.0,
"step": 10600,
"total_flos": 4591573981087056.0,
"train_loss": 0.008363780669411118,
"train_runtime": 2646.2436,
"train_samples_per_second": 63.789,
"train_steps_per_second": 4.006
}
],
"logging_steps": 500,
"max_steps": 10600,
"num_input_tokens_seen": 0,
"num_train_epochs": 100,
"save_steps": 500,
"total_flos": 4591573981087056.0,
"train_batch_size": 16,
"trial_name": null,
"trial_params": null
}