nerui-base-0 / trainer_state.json
apwic's picture
End of training
32af349 verified
raw
history blame
111 kB
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 100.0,
"eval_steps": 500,
"global_step": 9600,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"grad_norm": 4.475216865539551,
"learning_rate": 4.9500000000000004e-05,
"loss": 0.2611,
"step": 96
},
{
"epoch": 1.0,
"eval_LOCATION_f1": 0.9109947643979057,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.8969072164948454,
"eval_LOCATION_recall": 0.925531914893617,
"eval_ORGANIZATION_f1": 0.8967551622418879,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.8837209302325582,
"eval_ORGANIZATION_recall": 0.9101796407185628,
"eval_PERSON_f1": 0.9854014598540146,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9854014598540146,
"eval_PERSON_recall": 0.9854014598540146,
"eval_loss": 0.046344444155693054,
"eval_overall_accuracy": 0.9864640883977901,
"eval_overall_f1": 0.9303482587064676,
"eval_overall_precision": 0.9211822660098522,
"eval_overall_recall": 0.9396984924623115,
"eval_runtime": 0.5089,
"eval_samples_per_second": 334.076,
"eval_steps_per_second": 5.895,
"step": 96
},
{
"epoch": 2.0,
"grad_norm": 5.619458198547363,
"learning_rate": 4.9e-05,
"loss": 0.0645,
"step": 192
},
{
"epoch": 2.0,
"eval_LOCATION_f1": 0.8490566037735849,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.7627118644067796,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.8597560975609756,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.8757763975155279,
"eval_ORGANIZATION_recall": 0.844311377245509,
"eval_PERSON_f1": 0.981549815498155,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9925373134328358,
"eval_PERSON_recall": 0.9708029197080292,
"eval_loss": 0.0677841454744339,
"eval_overall_accuracy": 0.9779005524861878,
"eval_overall_f1": 0.8976572133168926,
"eval_overall_precision": 0.8813559322033898,
"eval_overall_recall": 0.914572864321608,
"eval_runtime": 0.5311,
"eval_samples_per_second": 320.081,
"eval_steps_per_second": 5.648,
"step": 192
},
{
"epoch": 3.0,
"grad_norm": 0.5541238784790039,
"learning_rate": 4.85e-05,
"loss": 0.0354,
"step": 288
},
{
"epoch": 3.0,
"eval_LOCATION_f1": 0.9278350515463918,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.8988095238095238,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.893491124260355,
"eval_ORGANIZATION_recall": 0.9041916167664671,
"eval_PERSON_f1": 0.9818181818181817,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9782608695652174,
"eval_PERSON_recall": 0.9854014598540146,
"eval_loss": 0.04672340676188469,
"eval_overall_accuracy": 0.9861878453038674,
"eval_overall_f1": 0.9341614906832298,
"eval_overall_precision": 0.9238329238329238,
"eval_overall_recall": 0.9447236180904522,
"eval_runtime": 0.5296,
"eval_samples_per_second": 321.026,
"eval_steps_per_second": 5.665,
"step": 288
},
{
"epoch": 4.0,
"grad_norm": 2.0090787410736084,
"learning_rate": 4.8e-05,
"loss": 0.0232,
"step": 384
},
{
"epoch": 4.0,
"eval_LOCATION_f1": 0.9230769230769231,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.8910891089108911,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.9164086687306501,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9487179487179487,
"eval_ORGANIZATION_recall": 0.8862275449101796,
"eval_PERSON_f1": 0.9552238805970148,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9770992366412213,
"eval_PERSON_recall": 0.9343065693430657,
"eval_loss": 0.06353317946195602,
"eval_overall_accuracy": 0.9845303867403314,
"eval_overall_f1": 0.9312977099236641,
"eval_overall_precision": 0.9432989690721649,
"eval_overall_recall": 0.9195979899497487,
"eval_runtime": 0.5408,
"eval_samples_per_second": 314.335,
"eval_steps_per_second": 5.547,
"step": 384
},
{
"epoch": 5.0,
"grad_norm": 0.37130075693130493,
"learning_rate": 4.75e-05,
"loss": 0.0158,
"step": 480
},
{
"epoch": 5.0,
"eval_LOCATION_f1": 0.91,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.8584905660377359,
"eval_LOCATION_recall": 0.9680851063829787,
"eval_ORGANIZATION_f1": 0.9022082018927444,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9533333333333334,
"eval_ORGANIZATION_recall": 0.8562874251497006,
"eval_PERSON_f1": 0.9854014598540146,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9854014598540146,
"eval_PERSON_recall": 0.9854014598540146,
"eval_loss": 0.05297553166747093,
"eval_overall_accuracy": 0.9861878453038674,
"eval_overall_f1": 0.9329962073324906,
"eval_overall_precision": 0.9389312977099237,
"eval_overall_recall": 0.9271356783919598,
"eval_runtime": 0.5568,
"eval_samples_per_second": 305.315,
"eval_steps_per_second": 5.388,
"step": 480
},
{
"epoch": 6.0,
"grad_norm": 1.5923467874526978,
"learning_rate": 4.7e-05,
"loss": 0.011,
"step": 576
},
{
"epoch": 6.0,
"eval_LOCATION_f1": 0.9319371727748691,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9175257731958762,
"eval_LOCATION_recall": 0.9468085106382979,
"eval_ORGANIZATION_f1": 0.9129129129129129,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9156626506024096,
"eval_ORGANIZATION_recall": 0.9101796407185628,
"eval_PERSON_f1": 0.9816849816849818,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9852941176470589,
"eval_PERSON_recall": 0.9781021897810219,
"eval_loss": 0.05083903297781944,
"eval_overall_accuracy": 0.9878453038674033,
"eval_overall_f1": 0.9410288582183186,
"eval_overall_precision": 0.9398496240601504,
"eval_overall_recall": 0.9422110552763819,
"eval_runtime": 0.5598,
"eval_samples_per_second": 303.698,
"eval_steps_per_second": 5.359,
"step": 576
},
{
"epoch": 7.0,
"grad_norm": 2.4925856590270996,
"learning_rate": 4.6500000000000005e-05,
"loss": 0.0086,
"step": 672
},
{
"epoch": 7.0,
"eval_LOCATION_f1": 0.925531914893617,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.925531914893617,
"eval_LOCATION_recall": 0.925531914893617,
"eval_ORGANIZATION_f1": 0.9176470588235294,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9017341040462428,
"eval_ORGANIZATION_recall": 0.9341317365269461,
"eval_PERSON_f1": 0.9816849816849818,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9852941176470589,
"eval_PERSON_recall": 0.9781021897810219,
"eval_loss": 0.0657382383942604,
"eval_overall_accuracy": 0.9864640883977901,
"eval_overall_f1": 0.9413233458177278,
"eval_overall_precision": 0.9354838709677419,
"eval_overall_recall": 0.9472361809045227,
"eval_runtime": 0.5677,
"eval_samples_per_second": 299.462,
"eval_steps_per_second": 5.285,
"step": 672
},
{
"epoch": 8.0,
"grad_norm": 0.08103451132774353,
"learning_rate": 4.600000000000001e-05,
"loss": 0.007,
"step": 768
},
{
"epoch": 8.0,
"eval_LOCATION_f1": 0.900523560209424,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.8865979381443299,
"eval_LOCATION_recall": 0.9148936170212766,
"eval_ORGANIZATION_f1": 0.8988095238095238,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.893491124260355,
"eval_ORGANIZATION_recall": 0.9041916167664671,
"eval_PERSON_f1": 0.9779411764705882,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9851851851851852,
"eval_PERSON_recall": 0.9708029197080292,
"eval_loss": 0.0754326730966568,
"eval_overall_accuracy": 0.9864640883977901,
"eval_overall_f1": 0.9261576971214018,
"eval_overall_precision": 0.9226932668329177,
"eval_overall_recall": 0.9296482412060302,
"eval_runtime": 0.5838,
"eval_samples_per_second": 291.187,
"eval_steps_per_second": 5.139,
"step": 768
},
{
"epoch": 9.0,
"grad_norm": 0.2643495202064514,
"learning_rate": 4.55e-05,
"loss": 0.0061,
"step": 864
},
{
"epoch": 9.0,
"eval_LOCATION_f1": 0.908108108108108,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9230769230769231,
"eval_LOCATION_recall": 0.8936170212765957,
"eval_ORGANIZATION_f1": 0.9080459770114944,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.8729281767955801,
"eval_ORGANIZATION_recall": 0.9461077844311377,
"eval_PERSON_f1": 0.988929889298893,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 1.0,
"eval_PERSON_recall": 0.9781021897810219,
"eval_loss": 0.07025933265686035,
"eval_overall_accuracy": 0.9878453038674033,
"eval_overall_f1": 0.9353233830845771,
"eval_overall_precision": 0.9261083743842364,
"eval_overall_recall": 0.9447236180904522,
"eval_runtime": 0.5996,
"eval_samples_per_second": 283.509,
"eval_steps_per_second": 5.003,
"step": 864
},
{
"epoch": 10.0,
"grad_norm": 0.8626702427864075,
"learning_rate": 4.5e-05,
"loss": 0.0058,
"step": 960
},
{
"epoch": 10.0,
"eval_LOCATION_f1": 0.9032258064516129,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9130434782608695,
"eval_LOCATION_recall": 0.8936170212765957,
"eval_ORGANIZATION_f1": 0.9011627906976745,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.8757062146892656,
"eval_ORGANIZATION_recall": 0.9281437125748503,
"eval_PERSON_f1": 0.9708029197080292,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9708029197080292,
"eval_PERSON_recall": 0.9708029197080292,
"eval_loss": 0.06500135362148285,
"eval_overall_accuracy": 0.9867403314917127,
"eval_overall_f1": 0.9253731343283583,
"eval_overall_precision": 0.916256157635468,
"eval_overall_recall": 0.9346733668341709,
"eval_runtime": 0.6116,
"eval_samples_per_second": 277.94,
"eval_steps_per_second": 4.905,
"step": 960
},
{
"epoch": 11.0,
"grad_norm": 0.020984740927815437,
"learning_rate": 4.4500000000000004e-05,
"loss": 0.0048,
"step": 1056
},
{
"epoch": 11.0,
"eval_LOCATION_f1": 0.9128205128205128,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.8811881188118812,
"eval_LOCATION_recall": 0.9468085106382979,
"eval_ORGANIZATION_f1": 0.9112426035502958,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9005847953216374,
"eval_ORGANIZATION_recall": 0.9221556886227545,
"eval_PERSON_f1": 0.9741697416974171,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9850746268656716,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.08488745987415314,
"eval_overall_accuracy": 0.9859116022099448,
"eval_overall_f1": 0.9328358208955224,
"eval_overall_precision": 0.9236453201970444,
"eval_overall_recall": 0.9422110552763819,
"eval_runtime": 0.6184,
"eval_samples_per_second": 274.893,
"eval_steps_per_second": 4.851,
"step": 1056
},
{
"epoch": 12.0,
"grad_norm": 0.3056125044822693,
"learning_rate": 4.4000000000000006e-05,
"loss": 0.0057,
"step": 1152
},
{
"epoch": 12.0,
"eval_LOCATION_f1": 0.9109947643979057,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.8969072164948454,
"eval_LOCATION_recall": 0.925531914893617,
"eval_ORGANIZATION_f1": 0.903225806451613,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.8850574712643678,
"eval_ORGANIZATION_recall": 0.9221556886227545,
"eval_PERSON_f1": 0.988929889298893,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 1.0,
"eval_PERSON_recall": 0.9781021897810219,
"eval_loss": 0.072464220225811,
"eval_overall_accuracy": 0.9870165745856354,
"eval_overall_f1": 0.9339975093399752,
"eval_overall_precision": 0.9259259259259259,
"eval_overall_recall": 0.9422110552763819,
"eval_runtime": 0.622,
"eval_samples_per_second": 273.318,
"eval_steps_per_second": 4.823,
"step": 1152
},
{
"epoch": 13.0,
"grad_norm": 0.08819713443517685,
"learning_rate": 4.35e-05,
"loss": 0.0052,
"step": 1248
},
{
"epoch": 13.0,
"eval_LOCATION_f1": 0.9130434782608695,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9333333333333333,
"eval_LOCATION_recall": 0.8936170212765957,
"eval_ORGANIZATION_f1": 0.8895522388059701,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.8869047619047619,
"eval_ORGANIZATION_recall": 0.8922155688622755,
"eval_PERSON_f1": 0.9816849816849818,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9852941176470589,
"eval_PERSON_recall": 0.9781021897810219,
"eval_loss": 0.08716335147619247,
"eval_overall_accuracy": 0.9845303867403314,
"eval_overall_f1": 0.9267676767676767,
"eval_overall_precision": 0.9314720812182741,
"eval_overall_recall": 0.9221105527638191,
"eval_runtime": 0.6038,
"eval_samples_per_second": 281.559,
"eval_steps_per_second": 4.969,
"step": 1248
},
{
"epoch": 14.0,
"grad_norm": 0.0017481500981375575,
"learning_rate": 4.3e-05,
"loss": 0.002,
"step": 1344
},
{
"epoch": 14.0,
"eval_LOCATION_f1": 0.8972972972972972,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9120879120879121,
"eval_LOCATION_recall": 0.8829787234042553,
"eval_ORGANIZATION_f1": 0.9285714285714287,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9230769230769231,
"eval_ORGANIZATION_recall": 0.9341317365269461,
"eval_PERSON_f1": 0.9816849816849818,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9852941176470589,
"eval_PERSON_recall": 0.9781021897810219,
"eval_loss": 0.07973892986774445,
"eval_overall_accuracy": 0.9881215469613259,
"eval_overall_f1": 0.9395465994962218,
"eval_overall_precision": 0.9419191919191919,
"eval_overall_recall": 0.9371859296482412,
"eval_runtime": 0.6104,
"eval_samples_per_second": 278.491,
"eval_steps_per_second": 4.915,
"step": 1344
},
{
"epoch": 15.0,
"grad_norm": 5.35858154296875,
"learning_rate": 4.25e-05,
"loss": 0.0036,
"step": 1440
},
{
"epoch": 15.0,
"eval_LOCATION_f1": 0.9297297297297297,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.945054945054945,
"eval_LOCATION_recall": 0.9148936170212766,
"eval_ORGANIZATION_f1": 0.9235294117647059,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9075144508670521,
"eval_ORGANIZATION_recall": 0.9401197604790419,
"eval_PERSON_f1": 0.988929889298893,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 1.0,
"eval_PERSON_recall": 0.9781021897810219,
"eval_loss": 0.08796700835227966,
"eval_overall_accuracy": 0.987292817679558,
"eval_overall_f1": 0.9472361809045227,
"eval_overall_precision": 0.9472361809045227,
"eval_overall_recall": 0.9472361809045227,
"eval_runtime": 0.6289,
"eval_samples_per_second": 270.333,
"eval_steps_per_second": 4.771,
"step": 1440
},
{
"epoch": 16.0,
"grad_norm": 0.012317053973674774,
"learning_rate": 4.2e-05,
"loss": 0.0026,
"step": 1536
},
{
"epoch": 16.0,
"eval_LOCATION_f1": 0.8888888888888888,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.8842105263157894,
"eval_LOCATION_recall": 0.8936170212765957,
"eval_ORGANIZATION_f1": 0.9305135951661632,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9390243902439024,
"eval_ORGANIZATION_recall": 0.9221556886227545,
"eval_PERSON_f1": 0.9779411764705882,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9851851851851852,
"eval_PERSON_recall": 0.9708029197080292,
"eval_loss": 0.08714718371629715,
"eval_overall_accuracy": 0.9870165745856354,
"eval_overall_f1": 0.9368686868686869,
"eval_overall_precision": 0.9416243654822335,
"eval_overall_recall": 0.9321608040201005,
"eval_runtime": 0.6145,
"eval_samples_per_second": 276.648,
"eval_steps_per_second": 4.882,
"step": 1536
},
{
"epoch": 17.0,
"grad_norm": 0.00884944200515747,
"learning_rate": 4.15e-05,
"loss": 0.0028,
"step": 1632
},
{
"epoch": 17.0,
"eval_LOCATION_f1": 0.9175257731958764,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.89,
"eval_LOCATION_recall": 0.9468085106382979,
"eval_ORGANIZATION_f1": 0.924924924924925,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.927710843373494,
"eval_ORGANIZATION_recall": 0.9221556886227545,
"eval_PERSON_f1": 0.9851851851851852,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 1.0,
"eval_PERSON_recall": 0.9708029197080292,
"eval_loss": 0.08211695402860641,
"eval_overall_accuracy": 0.9883977900552486,
"eval_overall_f1": 0.9435382685069008,
"eval_overall_precision": 0.9423558897243107,
"eval_overall_recall": 0.9447236180904522,
"eval_runtime": 0.6144,
"eval_samples_per_second": 276.708,
"eval_steps_per_second": 4.883,
"step": 1632
},
{
"epoch": 18.0,
"grad_norm": 0.005733116064220667,
"learning_rate": 4.1e-05,
"loss": 0.0024,
"step": 1728
},
{
"epoch": 18.0,
"eval_LOCATION_f1": 0.9166666666666666,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.8979591836734694,
"eval_LOCATION_recall": 0.9361702127659575,
"eval_ORGANIZATION_f1": 0.9337349397590362,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9393939393939394,
"eval_ORGANIZATION_recall": 0.9281437125748503,
"eval_PERSON_f1": 0.9777777777777779,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9924812030075187,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.07464080303907394,
"eval_overall_accuracy": 0.988950276243094,
"eval_overall_f1": 0.9445843828715367,
"eval_overall_precision": 0.946969696969697,
"eval_overall_recall": 0.9422110552763819,
"eval_runtime": 0.6238,
"eval_samples_per_second": 272.509,
"eval_steps_per_second": 4.809,
"step": 1728
},
{
"epoch": 19.0,
"grad_norm": 5.751409530639648,
"learning_rate": 4.05e-05,
"loss": 0.003,
"step": 1824
},
{
"epoch": 19.0,
"eval_LOCATION_f1": 0.9072164948453608,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.88,
"eval_LOCATION_recall": 0.9361702127659575,
"eval_ORGANIZATION_f1": 0.9123867069486405,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9207317073170732,
"eval_ORGANIZATION_recall": 0.9041916167664671,
"eval_PERSON_f1": 0.967032967032967,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9705882352941176,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.0849042758345604,
"eval_overall_accuracy": 0.9859116022099448,
"eval_overall_f1": 0.9298245614035087,
"eval_overall_precision": 0.9275,
"eval_overall_recall": 0.9321608040201005,
"eval_runtime": 0.626,
"eval_samples_per_second": 271.56,
"eval_steps_per_second": 4.792,
"step": 1824
},
{
"epoch": 20.0,
"grad_norm": 0.3233324885368347,
"learning_rate": 4e-05,
"loss": 0.0035,
"step": 1920
},
{
"epoch": 20.0,
"eval_LOCATION_f1": 0.8969072164948454,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.87,
"eval_LOCATION_recall": 0.925531914893617,
"eval_ORGANIZATION_f1": 0.9300911854103343,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9444444444444444,
"eval_ORGANIZATION_recall": 0.9161676646706587,
"eval_PERSON_f1": 0.981549815498155,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9925373134328358,
"eval_PERSON_recall": 0.9708029197080292,
"eval_loss": 0.08302651345729828,
"eval_overall_accuracy": 0.9875690607734806,
"eval_overall_f1": 0.9395465994962218,
"eval_overall_precision": 0.9419191919191919,
"eval_overall_recall": 0.9371859296482412,
"eval_runtime": 0.612,
"eval_samples_per_second": 277.763,
"eval_steps_per_second": 4.902,
"step": 1920
},
{
"epoch": 21.0,
"grad_norm": 0.0027803461998701096,
"learning_rate": 3.9500000000000005e-05,
"loss": 0.0015,
"step": 2016
},
{
"epoch": 21.0,
"eval_LOCATION_f1": 0.8994708994708994,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.8947368421052632,
"eval_LOCATION_recall": 0.9042553191489362,
"eval_ORGANIZATION_f1": 0.9226190476190477,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9171597633136095,
"eval_ORGANIZATION_recall": 0.9281437125748503,
"eval_PERSON_f1": 0.9741697416974171,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9850746268656716,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.09646125137805939,
"eval_overall_accuracy": 0.9864640883977901,
"eval_overall_f1": 0.9346733668341709,
"eval_overall_precision": 0.9346733668341709,
"eval_overall_recall": 0.9346733668341709,
"eval_runtime": 0.6227,
"eval_samples_per_second": 273.012,
"eval_steps_per_second": 4.818,
"step": 2016
},
{
"epoch": 22.0,
"grad_norm": 0.012560858391225338,
"learning_rate": 3.9000000000000006e-05,
"loss": 0.0029,
"step": 2112
},
{
"epoch": 22.0,
"eval_LOCATION_f1": 0.8994708994708994,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.8947368421052632,
"eval_LOCATION_recall": 0.9042553191489362,
"eval_ORGANIZATION_f1": 0.9112426035502958,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9005847953216374,
"eval_ORGANIZATION_recall": 0.9221556886227545,
"eval_PERSON_f1": 0.9565217391304348,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9496402877697842,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.1119152307510376,
"eval_overall_accuracy": 0.9831491712707182,
"eval_overall_f1": 0.9240348692403487,
"eval_overall_precision": 0.9160493827160494,
"eval_overall_recall": 0.9321608040201005,
"eval_runtime": 0.622,
"eval_samples_per_second": 273.291,
"eval_steps_per_second": 4.823,
"step": 2112
},
{
"epoch": 23.0,
"grad_norm": 0.015381195582449436,
"learning_rate": 3.85e-05,
"loss": 0.0031,
"step": 2208
},
{
"epoch": 23.0,
"eval_LOCATION_f1": 0.934010152284264,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.8932038834951457,
"eval_LOCATION_recall": 0.9787234042553191,
"eval_ORGANIZATION_f1": 0.8952380952380953,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9527027027027027,
"eval_ORGANIZATION_recall": 0.844311377245509,
"eval_PERSON_f1": 0.9672727272727273,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9637681159420289,
"eval_PERSON_recall": 0.9708029197080292,
"eval_loss": 0.10207368433475494,
"eval_overall_accuracy": 0.9842541436464088,
"eval_overall_f1": 0.9301143583227447,
"eval_overall_precision": 0.9408740359897172,
"eval_overall_recall": 0.9195979899497487,
"eval_runtime": 0.6155,
"eval_samples_per_second": 276.214,
"eval_steps_per_second": 4.874,
"step": 2208
},
{
"epoch": 24.0,
"grad_norm": 0.029895633459091187,
"learning_rate": 3.8e-05,
"loss": 0.0023,
"step": 2304
},
{
"epoch": 24.0,
"eval_LOCATION_f1": 0.9081632653061226,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.8725490196078431,
"eval_LOCATION_recall": 0.9468085106382979,
"eval_ORGANIZATION_f1": 0.9123867069486405,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9207317073170732,
"eval_ORGANIZATION_recall": 0.9041916167664671,
"eval_PERSON_f1": 0.9743589743589743,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9779411764705882,
"eval_PERSON_recall": 0.9708029197080292,
"eval_loss": 0.08727628737688065,
"eval_overall_accuracy": 0.9864640883977901,
"eval_overall_f1": 0.9325,
"eval_overall_precision": 0.927860696517413,
"eval_overall_recall": 0.9371859296482412,
"eval_runtime": 0.6257,
"eval_samples_per_second": 271.688,
"eval_steps_per_second": 4.795,
"step": 2304
},
{
"epoch": 25.0,
"grad_norm": 1.8711739778518677,
"learning_rate": 3.7500000000000003e-05,
"loss": 0.0029,
"step": 2400
},
{
"epoch": 25.0,
"eval_LOCATION_f1": 0.9045226130653266,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.8571428571428571,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.8975903614457832,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9030303030303031,
"eval_ORGANIZATION_recall": 0.8922155688622755,
"eval_PERSON_f1": 0.9781021897810219,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9781021897810219,
"eval_PERSON_recall": 0.9781021897810219,
"eval_loss": 0.10519938915967941,
"eval_overall_accuracy": 0.9856353591160221,
"eval_overall_f1": 0.9267080745341615,
"eval_overall_precision": 0.9164619164619164,
"eval_overall_recall": 0.9371859296482412,
"eval_runtime": 0.6271,
"eval_samples_per_second": 271.08,
"eval_steps_per_second": 4.784,
"step": 2400
},
{
"epoch": 26.0,
"grad_norm": 0.8989447951316833,
"learning_rate": 3.7e-05,
"loss": 0.0033,
"step": 2496
},
{
"epoch": 26.0,
"eval_LOCATION_f1": 0.8640776699029127,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.7946428571428571,
"eval_LOCATION_recall": 0.9468085106382979,
"eval_ORGANIZATION_f1": 0.9068322981366459,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9419354838709677,
"eval_ORGANIZATION_recall": 0.874251497005988,
"eval_PERSON_f1": 0.9708029197080292,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9708029197080292,
"eval_PERSON_recall": 0.9708029197080292,
"eval_loss": 0.12218903750181198,
"eval_overall_accuracy": 0.9828729281767956,
"eval_overall_f1": 0.917705735660848,
"eval_overall_precision": 0.9108910891089109,
"eval_overall_recall": 0.9246231155778895,
"eval_runtime": 0.6123,
"eval_samples_per_second": 277.664,
"eval_steps_per_second": 4.9,
"step": 2496
},
{
"epoch": 27.0,
"grad_norm": 0.014491462148725986,
"learning_rate": 3.65e-05,
"loss": 0.0021,
"step": 2592
},
{
"epoch": 27.0,
"eval_LOCATION_f1": 0.9035532994923857,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.8640776699029126,
"eval_LOCATION_recall": 0.9468085106382979,
"eval_ORGANIZATION_f1": 0.9090909090909091,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9202453987730062,
"eval_ORGANIZATION_recall": 0.8982035928143712,
"eval_PERSON_f1": 0.9708029197080292,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9708029197080292,
"eval_PERSON_recall": 0.9708029197080292,
"eval_loss": 0.11366433650255203,
"eval_overall_accuracy": 0.9853591160220995,
"eval_overall_f1": 0.9288389513108615,
"eval_overall_precision": 0.9230769230769231,
"eval_overall_recall": 0.9346733668341709,
"eval_runtime": 0.6239,
"eval_samples_per_second": 272.493,
"eval_steps_per_second": 4.809,
"step": 2592
},
{
"epoch": 28.0,
"grad_norm": 0.00040458361036144197,
"learning_rate": 3.6e-05,
"loss": 0.0014,
"step": 2688
},
{
"epoch": 28.0,
"eval_LOCATION_f1": 0.8947368421052632,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.8854166666666666,
"eval_LOCATION_recall": 0.9042553191489362,
"eval_ORGANIZATION_f1": 0.9085545722713864,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.8953488372093024,
"eval_ORGANIZATION_recall": 0.9221556886227545,
"eval_PERSON_f1": 0.9703703703703703,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9849624060150376,
"eval_PERSON_recall": 0.9562043795620438,
"eval_loss": 0.0998811274766922,
"eval_overall_accuracy": 0.9861878453038674,
"eval_overall_f1": 0.9261576971214018,
"eval_overall_precision": 0.9226932668329177,
"eval_overall_recall": 0.9296482412060302,
"eval_runtime": 0.6221,
"eval_samples_per_second": 273.284,
"eval_steps_per_second": 4.823,
"step": 2688
},
{
"epoch": 29.0,
"grad_norm": 0.003671834012493491,
"learning_rate": 3.55e-05,
"loss": 0.0017,
"step": 2784
},
{
"epoch": 29.0,
"eval_LOCATION_f1": 0.8947368421052632,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.8854166666666666,
"eval_LOCATION_recall": 0.9042553191489362,
"eval_ORGANIZATION_f1": 0.8988095238095238,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.893491124260355,
"eval_ORGANIZATION_recall": 0.9041916167664671,
"eval_PERSON_f1": 0.9675090252707581,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9571428571428572,
"eval_PERSON_recall": 0.9781021897810219,
"eval_loss": 0.09638147801160812,
"eval_overall_accuracy": 0.9842541436464088,
"eval_overall_f1": 0.9215442092154421,
"eval_overall_precision": 0.9135802469135802,
"eval_overall_recall": 0.9296482412060302,
"eval_runtime": 0.6201,
"eval_samples_per_second": 274.15,
"eval_steps_per_second": 4.838,
"step": 2784
},
{
"epoch": 30.0,
"grad_norm": 2.668123245239258,
"learning_rate": 3.5e-05,
"loss": 0.0064,
"step": 2880
},
{
"epoch": 30.0,
"eval_LOCATION_f1": 0.8947368421052632,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.8854166666666666,
"eval_LOCATION_recall": 0.9042553191489362,
"eval_ORGANIZATION_f1": 0.9317507418397626,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9235294117647059,
"eval_ORGANIZATION_recall": 0.9401197604790419,
"eval_PERSON_f1": 0.9777777777777779,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9924812030075187,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.0691131055355072,
"eval_overall_accuracy": 0.9875690607734806,
"eval_overall_f1": 0.9385194479297366,
"eval_overall_precision": 0.9373433583959899,
"eval_overall_recall": 0.9396984924623115,
"eval_runtime": 0.6245,
"eval_samples_per_second": 272.208,
"eval_steps_per_second": 4.804,
"step": 2880
},
{
"epoch": 31.0,
"grad_norm": 0.004453280474990606,
"learning_rate": 3.45e-05,
"loss": 0.0032,
"step": 2976
},
{
"epoch": 31.0,
"eval_LOCATION_f1": 0.9166666666666666,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.8979591836734694,
"eval_LOCATION_recall": 0.9361702127659575,
"eval_ORGANIZATION_f1": 0.9235294117647059,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9075144508670521,
"eval_ORGANIZATION_recall": 0.9401197604790419,
"eval_PERSON_f1": 0.9851851851851852,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 1.0,
"eval_PERSON_recall": 0.9708029197080292,
"eval_loss": 0.08723258972167969,
"eval_overall_accuracy": 0.9878453038674033,
"eval_overall_f1": 0.9426433915211971,
"eval_overall_precision": 0.9356435643564357,
"eval_overall_recall": 0.949748743718593,
"eval_runtime": 0.6234,
"eval_samples_per_second": 272.695,
"eval_steps_per_second": 4.812,
"step": 2976
},
{
"epoch": 32.0,
"grad_norm": 0.0032113208435475826,
"learning_rate": 3.4000000000000007e-05,
"loss": 0.0027,
"step": 3072
},
{
"epoch": 32.0,
"eval_LOCATION_f1": 0.9119170984455959,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.8888888888888888,
"eval_LOCATION_recall": 0.9361702127659575,
"eval_ORGANIZATION_f1": 0.9198813056379822,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9117647058823529,
"eval_ORGANIZATION_recall": 0.9281437125748503,
"eval_PERSON_f1": 0.9703703703703703,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9849624060150376,
"eval_PERSON_recall": 0.9562043795620438,
"eval_loss": 0.09214069694280624,
"eval_overall_accuracy": 0.9861878453038674,
"eval_overall_f1": 0.9349999999999999,
"eval_overall_precision": 0.9303482587064676,
"eval_overall_recall": 0.9396984924623115,
"eval_runtime": 0.6805,
"eval_samples_per_second": 249.808,
"eval_steps_per_second": 4.408,
"step": 3072
},
{
"epoch": 33.0,
"grad_norm": 0.0023403808008879423,
"learning_rate": 3.35e-05,
"loss": 0.0017,
"step": 3168
},
{
"epoch": 33.0,
"eval_LOCATION_f1": 0.90625,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.8877551020408163,
"eval_LOCATION_recall": 0.925531914893617,
"eval_ORGANIZATION_f1": 0.9333333333333335,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9447852760736196,
"eval_ORGANIZATION_recall": 0.9221556886227545,
"eval_PERSON_f1": 0.966789667896679,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9776119402985075,
"eval_PERSON_recall": 0.9562043795620438,
"eval_loss": 0.09554101526737213,
"eval_overall_accuracy": 0.9870165745856354,
"eval_overall_f1": 0.9382093316519546,
"eval_overall_precision": 0.9417721518987342,
"eval_overall_recall": 0.9346733668341709,
"eval_runtime": 0.6163,
"eval_samples_per_second": 275.837,
"eval_steps_per_second": 4.868,
"step": 3168
},
{
"epoch": 34.0,
"grad_norm": 0.0025567917618900537,
"learning_rate": 3.3e-05,
"loss": 0.0027,
"step": 3264
},
{
"epoch": 34.0,
"eval_LOCATION_f1": 0.9238578680203046,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.883495145631068,
"eval_LOCATION_recall": 0.9680851063829787,
"eval_ORGANIZATION_f1": 0.9393939393939393,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.950920245398773,
"eval_ORGANIZATION_recall": 0.9281437125748503,
"eval_PERSON_f1": 0.9779411764705882,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9851851851851852,
"eval_PERSON_recall": 0.9708029197080292,
"eval_loss": 0.10889267921447754,
"eval_overall_accuracy": 0.9867403314917127,
"eval_overall_f1": 0.9486858573216519,
"eval_overall_precision": 0.9451371571072319,
"eval_overall_recall": 0.9522613065326633,
"eval_runtime": 0.6143,
"eval_samples_per_second": 276.722,
"eval_steps_per_second": 4.883,
"step": 3264
},
{
"epoch": 35.0,
"grad_norm": 0.003604689845815301,
"learning_rate": 3.2500000000000004e-05,
"loss": 0.0024,
"step": 3360
},
{
"epoch": 35.0,
"eval_LOCATION_f1": 0.9137055837563451,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.8737864077669902,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.9365558912386707,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9451219512195121,
"eval_ORGANIZATION_recall": 0.9281437125748503,
"eval_PERSON_f1": 0.9710144927536232,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9640287769784173,
"eval_PERSON_recall": 0.9781021897810219,
"eval_loss": 0.09201914817094803,
"eval_overall_accuracy": 0.9870165745856354,
"eval_overall_f1": 0.9427860696517413,
"eval_overall_precision": 0.9334975369458128,
"eval_overall_recall": 0.9522613065326633,
"eval_runtime": 0.6128,
"eval_samples_per_second": 277.43,
"eval_steps_per_second": 4.896,
"step": 3360
},
{
"epoch": 36.0,
"grad_norm": 0.009372674860060215,
"learning_rate": 3.2000000000000005e-05,
"loss": 0.0022,
"step": 3456
},
{
"epoch": 36.0,
"eval_LOCATION_f1": 0.9430051813471503,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9191919191919192,
"eval_LOCATION_recall": 0.9680851063829787,
"eval_ORGANIZATION_f1": 0.9418960244648319,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9625,
"eval_ORGANIZATION_recall": 0.9221556886227545,
"eval_PERSON_f1": 0.9672727272727273,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9637681159420289,
"eval_PERSON_recall": 0.9708029197080292,
"eval_loss": 0.07915590703487396,
"eval_overall_accuracy": 0.9897790055248619,
"eval_overall_f1": 0.950943396226415,
"eval_overall_precision": 0.9521410579345088,
"eval_overall_recall": 0.949748743718593,
"eval_runtime": 0.6137,
"eval_samples_per_second": 277.022,
"eval_steps_per_second": 4.889,
"step": 3456
},
{
"epoch": 37.0,
"grad_norm": 0.008921943604946136,
"learning_rate": 3.15e-05,
"loss": 0.0013,
"step": 3552
},
{
"epoch": 37.0,
"eval_LOCATION_f1": 0.9230769230769231,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.8910891089108911,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.9393939393939393,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.950920245398773,
"eval_ORGANIZATION_recall": 0.9281437125748503,
"eval_PERSON_f1": 0.981549815498155,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9925373134328358,
"eval_PERSON_recall": 0.9708029197080292,
"eval_loss": 0.09620564430952072,
"eval_overall_accuracy": 0.9883977900552486,
"eval_overall_f1": 0.949748743718593,
"eval_overall_precision": 0.949748743718593,
"eval_overall_recall": 0.949748743718593,
"eval_runtime": 0.6579,
"eval_samples_per_second": 258.391,
"eval_steps_per_second": 4.56,
"step": 3552
},
{
"epoch": 38.0,
"grad_norm": 0.0019985612016171217,
"learning_rate": 3.1e-05,
"loss": 0.0028,
"step": 3648
},
{
"epoch": 38.0,
"eval_LOCATION_f1": 0.9326424870466321,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9090909090909091,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.923076923076923,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9122807017543859,
"eval_ORGANIZATION_recall": 0.9341317365269461,
"eval_PERSON_f1": 0.9703703703703703,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9849624060150376,
"eval_PERSON_recall": 0.9562043795620438,
"eval_loss": 0.0810953676700592,
"eval_overall_accuracy": 0.9875690607734806,
"eval_overall_f1": 0.9413233458177278,
"eval_overall_precision": 0.9354838709677419,
"eval_overall_recall": 0.9472361809045227,
"eval_runtime": 0.6203,
"eval_samples_per_second": 274.044,
"eval_steps_per_second": 4.836,
"step": 3648
},
{
"epoch": 39.0,
"grad_norm": 0.0019018716411665082,
"learning_rate": 3.05e-05,
"loss": 0.0022,
"step": 3744
},
{
"epoch": 39.0,
"eval_LOCATION_f1": 0.9015544041450778,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.8787878787878788,
"eval_LOCATION_recall": 0.925531914893617,
"eval_ORGANIZATION_f1": 0.9161676646706587,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9161676646706587,
"eval_ORGANIZATION_recall": 0.9161676646706587,
"eval_PERSON_f1": 0.9703703703703703,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9849624060150376,
"eval_PERSON_recall": 0.9562043795620438,
"eval_loss": 0.1018829345703125,
"eval_overall_accuracy": 0.9859116022099448,
"eval_overall_f1": 0.9309912170639899,
"eval_overall_precision": 0.9298245614035088,
"eval_overall_recall": 0.9321608040201005,
"eval_runtime": 0.6176,
"eval_samples_per_second": 275.269,
"eval_steps_per_second": 4.858,
"step": 3744
},
{
"epoch": 40.0,
"grad_norm": 0.06729024648666382,
"learning_rate": 3e-05,
"loss": 0.0012,
"step": 3840
},
{
"epoch": 40.0,
"eval_LOCATION_f1": 0.9119170984455959,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.8888888888888888,
"eval_LOCATION_recall": 0.9361702127659575,
"eval_ORGANIZATION_f1": 0.9181286549707602,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.8971428571428571,
"eval_ORGANIZATION_recall": 0.9401197604790419,
"eval_PERSON_f1": 0.9777777777777779,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9924812030075187,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.096034474670887,
"eval_overall_accuracy": 0.9867403314917127,
"eval_overall_f1": 0.9366459627329192,
"eval_overall_precision": 0.9262899262899262,
"eval_overall_recall": 0.9472361809045227,
"eval_runtime": 0.612,
"eval_samples_per_second": 277.787,
"eval_steps_per_second": 4.902,
"step": 3840
},
{
"epoch": 41.0,
"grad_norm": 0.0005613254033960402,
"learning_rate": 2.95e-05,
"loss": 0.0008,
"step": 3936
},
{
"epoch": 41.0,
"eval_LOCATION_f1": 0.9285714285714286,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.8921568627450981,
"eval_LOCATION_recall": 0.9680851063829787,
"eval_ORGANIZATION_f1": 0.9382716049382717,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9681528662420382,
"eval_ORGANIZATION_recall": 0.9101796407185628,
"eval_PERSON_f1": 0.9779411764705882,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9851851851851852,
"eval_PERSON_recall": 0.9708029197080292,
"eval_loss": 0.0963701382279396,
"eval_overall_accuracy": 0.988950276243094,
"eval_overall_f1": 0.9494949494949495,
"eval_overall_precision": 0.9543147208121827,
"eval_overall_recall": 0.9447236180904522,
"eval_runtime": 0.6226,
"eval_samples_per_second": 273.045,
"eval_steps_per_second": 4.818,
"step": 3936
},
{
"epoch": 42.0,
"grad_norm": 0.0030692138243466616,
"learning_rate": 2.9e-05,
"loss": 0.0015,
"step": 4032
},
{
"epoch": 42.0,
"eval_LOCATION_f1": 0.9319371727748691,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9175257731958762,
"eval_LOCATION_recall": 0.9468085106382979,
"eval_ORGANIZATION_f1": 0.9074626865671641,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9047619047619048,
"eval_ORGANIZATION_recall": 0.9101796407185628,
"eval_PERSON_f1": 0.9708029197080292,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9708029197080292,
"eval_PERSON_recall": 0.9708029197080292,
"eval_loss": 0.07825793325901031,
"eval_overall_accuracy": 0.9881215469613259,
"eval_overall_f1": 0.9349999999999999,
"eval_overall_precision": 0.9303482587064676,
"eval_overall_recall": 0.9396984924623115,
"eval_runtime": 0.6264,
"eval_samples_per_second": 271.375,
"eval_steps_per_second": 4.789,
"step": 4032
},
{
"epoch": 43.0,
"grad_norm": 0.0004494467575568706,
"learning_rate": 2.8499999999999998e-05,
"loss": 0.0019,
"step": 4128
},
{
"epoch": 43.0,
"eval_LOCATION_f1": 0.934010152284264,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.8932038834951457,
"eval_LOCATION_recall": 0.9787234042553191,
"eval_ORGANIZATION_f1": 0.9272727272727274,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9386503067484663,
"eval_ORGANIZATION_recall": 0.9161676646706587,
"eval_PERSON_f1": 0.981549815498155,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9925373134328358,
"eval_PERSON_recall": 0.9708029197080292,
"eval_loss": 0.07773718982934952,
"eval_overall_accuracy": 0.9883977900552486,
"eval_overall_f1": 0.9473684210526316,
"eval_overall_precision": 0.945,
"eval_overall_recall": 0.949748743718593,
"eval_runtime": 0.6145,
"eval_samples_per_second": 276.668,
"eval_steps_per_second": 4.882,
"step": 4128
},
{
"epoch": 44.0,
"grad_norm": 0.0007905985112302005,
"learning_rate": 2.8000000000000003e-05,
"loss": 0.0011,
"step": 4224
},
{
"epoch": 44.0,
"eval_LOCATION_f1": 0.9246231155778896,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.8761904761904762,
"eval_LOCATION_recall": 0.9787234042553191,
"eval_ORGANIZATION_f1": 0.9422492401215805,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9567901234567902,
"eval_ORGANIZATION_recall": 0.9281437125748503,
"eval_PERSON_f1": 0.9741697416974171,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9850746268656716,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.08259343355894089,
"eval_overall_accuracy": 0.9892265193370166,
"eval_overall_f1": 0.9486858573216519,
"eval_overall_precision": 0.9451371571072319,
"eval_overall_recall": 0.9522613065326633,
"eval_runtime": 0.731,
"eval_samples_per_second": 232.542,
"eval_steps_per_second": 4.104,
"step": 4224
},
{
"epoch": 45.0,
"grad_norm": 0.00027426957967691123,
"learning_rate": 2.7500000000000004e-05,
"loss": 0.0007,
"step": 4320
},
{
"epoch": 45.0,
"eval_LOCATION_f1": 0.9387755102040817,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9019607843137255,
"eval_LOCATION_recall": 0.9787234042553191,
"eval_ORGANIZATION_f1": 0.9259259259259259,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9554140127388535,
"eval_ORGANIZATION_recall": 0.8982035928143712,
"eval_PERSON_f1": 0.9705882352941176,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9777777777777777,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.07949012517929077,
"eval_overall_accuracy": 0.9867403314917127,
"eval_overall_f1": 0.9444444444444445,
"eval_overall_precision": 0.949238578680203,
"eval_overall_recall": 0.9396984924623115,
"eval_runtime": 0.6776,
"eval_samples_per_second": 250.88,
"eval_steps_per_second": 4.427,
"step": 4320
},
{
"epoch": 46.0,
"grad_norm": 6.9263811111450195,
"learning_rate": 2.7000000000000002e-05,
"loss": 0.0025,
"step": 4416
},
{
"epoch": 46.0,
"eval_LOCATION_f1": 0.9435897435897436,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9108910891089109,
"eval_LOCATION_recall": 0.9787234042553191,
"eval_ORGANIZATION_f1": 0.9144542772861356,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9011627906976745,
"eval_ORGANIZATION_recall": 0.9281437125748503,
"eval_PERSON_f1": 0.9739776951672863,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9924242424242424,
"eval_PERSON_recall": 0.9562043795620438,
"eval_loss": 0.08157689869403839,
"eval_overall_accuracy": 0.9878453038674033,
"eval_overall_f1": 0.9414694894146949,
"eval_overall_precision": 0.9333333333333333,
"eval_overall_recall": 0.949748743718593,
"eval_runtime": 0.6189,
"eval_samples_per_second": 274.66,
"eval_steps_per_second": 4.847,
"step": 4416
},
{
"epoch": 47.0,
"grad_norm": 0.001023626420646906,
"learning_rate": 2.6500000000000004e-05,
"loss": 0.0012,
"step": 4512
},
{
"epoch": 47.0,
"eval_LOCATION_f1": 0.9253731343283582,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.8691588785046729,
"eval_LOCATION_recall": 0.9893617021276596,
"eval_ORGANIZATION_f1": 0.9353846153846154,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9620253164556962,
"eval_ORGANIZATION_recall": 0.9101796407185628,
"eval_PERSON_f1": 0.9777777777777779,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9924812030075187,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.09457841515541077,
"eval_overall_accuracy": 0.9875690607734806,
"eval_overall_f1": 0.9472361809045227,
"eval_overall_precision": 0.9472361809045227,
"eval_overall_recall": 0.9472361809045227,
"eval_runtime": 0.6136,
"eval_samples_per_second": 277.045,
"eval_steps_per_second": 4.889,
"step": 4512
},
{
"epoch": 48.0,
"grad_norm": 0.0005152701633051038,
"learning_rate": 2.6000000000000002e-05,
"loss": 0.0016,
"step": 4608
},
{
"epoch": 48.0,
"eval_LOCATION_f1": 0.9246231155778896,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.8761904761904762,
"eval_LOCATION_recall": 0.9787234042553191,
"eval_ORGANIZATION_f1": 0.924924924924925,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.927710843373494,
"eval_ORGANIZATION_recall": 0.9221556886227545,
"eval_PERSON_f1": 0.9777777777777779,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9924812030075187,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.0960976779460907,
"eval_overall_accuracy": 0.987292817679558,
"eval_overall_f1": 0.9426433915211971,
"eval_overall_precision": 0.9356435643564357,
"eval_overall_recall": 0.949748743718593,
"eval_runtime": 0.6176,
"eval_samples_per_second": 275.273,
"eval_steps_per_second": 4.858,
"step": 4608
},
{
"epoch": 49.0,
"grad_norm": 0.0012280733790248632,
"learning_rate": 2.5500000000000003e-05,
"loss": 0.001,
"step": 4704
},
{
"epoch": 49.0,
"eval_LOCATION_f1": 0.9333333333333335,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.900990099009901,
"eval_LOCATION_recall": 0.9680851063829787,
"eval_ORGANIZATION_f1": 0.9285714285714287,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9230769230769231,
"eval_ORGANIZATION_recall": 0.9341317365269461,
"eval_PERSON_f1": 0.981549815498155,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9925373134328358,
"eval_PERSON_recall": 0.9708029197080292,
"eval_loss": 0.09950720518827438,
"eval_overall_accuracy": 0.9864640883977901,
"eval_overall_f1": 0.9476309226932669,
"eval_overall_precision": 0.9405940594059405,
"eval_overall_recall": 0.9547738693467337,
"eval_runtime": 0.6234,
"eval_samples_per_second": 272.715,
"eval_steps_per_second": 4.813,
"step": 4704
},
{
"epoch": 50.0,
"grad_norm": 0.00443949643522501,
"learning_rate": 2.5e-05,
"loss": 0.001,
"step": 4800
},
{
"epoch": 50.0,
"eval_LOCATION_f1": 0.934010152284264,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.8932038834951457,
"eval_LOCATION_recall": 0.9787234042553191,
"eval_ORGANIZATION_f1": 0.9259259259259259,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9554140127388535,
"eval_ORGANIZATION_recall": 0.8982035928143712,
"eval_PERSON_f1": 0.9703703703703703,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9849624060150376,
"eval_PERSON_recall": 0.9562043795620438,
"eval_loss": 0.0988643616437912,
"eval_overall_accuracy": 0.9870165745856354,
"eval_overall_f1": 0.943109987357775,
"eval_overall_precision": 0.9491094147582697,
"eval_overall_recall": 0.9371859296482412,
"eval_runtime": 0.6234,
"eval_samples_per_second": 272.715,
"eval_steps_per_second": 4.813,
"step": 4800
},
{
"epoch": 51.0,
"grad_norm": 0.0002302059147041291,
"learning_rate": 2.45e-05,
"loss": 0.0004,
"step": 4896
},
{
"epoch": 51.0,
"eval_LOCATION_f1": 0.9387755102040817,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9019607843137255,
"eval_LOCATION_recall": 0.9787234042553191,
"eval_ORGANIZATION_f1": 0.9151515151515152,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9263803680981595,
"eval_ORGANIZATION_recall": 0.9041916167664671,
"eval_PERSON_f1": 0.9743589743589743,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9779411764705882,
"eval_PERSON_recall": 0.9708029197080292,
"eval_loss": 0.11296043545007706,
"eval_overall_accuracy": 0.9870165745856354,
"eval_overall_f1": 0.9411764705882354,
"eval_overall_precision": 0.9376558603491272,
"eval_overall_recall": 0.9447236180904522,
"eval_runtime": 0.6148,
"eval_samples_per_second": 276.493,
"eval_steps_per_second": 4.879,
"step": 4896
},
{
"epoch": 52.0,
"grad_norm": 0.0004114691982977092,
"learning_rate": 2.4e-05,
"loss": 0.0007,
"step": 4992
},
{
"epoch": 52.0,
"eval_LOCATION_f1": 0.9381443298969071,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.91,
"eval_LOCATION_recall": 0.9680851063829787,
"eval_ORGANIZATION_f1": 0.9212121212121211,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9325153374233128,
"eval_ORGANIZATION_recall": 0.9101796407185628,
"eval_PERSON_f1": 0.9743589743589743,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9779411764705882,
"eval_PERSON_recall": 0.9708029197080292,
"eval_loss": 0.10785677284002304,
"eval_overall_accuracy": 0.9878453038674033,
"eval_overall_f1": 0.9435382685069008,
"eval_overall_precision": 0.9423558897243107,
"eval_overall_recall": 0.9447236180904522,
"eval_runtime": 0.6113,
"eval_samples_per_second": 278.074,
"eval_steps_per_second": 4.907,
"step": 4992
},
{
"epoch": 53.0,
"grad_norm": 0.0016004899516701698,
"learning_rate": 2.35e-05,
"loss": 0.0011,
"step": 5088
},
{
"epoch": 53.0,
"eval_LOCATION_f1": 0.9479166666666666,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9285714285714286,
"eval_LOCATION_recall": 0.9680851063829787,
"eval_ORGANIZATION_f1": 0.9235474006116209,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.94375,
"eval_ORGANIZATION_recall": 0.9041916167664671,
"eval_PERSON_f1": 0.9705882352941176,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9777777777777777,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.10214179754257202,
"eval_overall_accuracy": 0.9878453038674033,
"eval_overall_f1": 0.9456384323640961,
"eval_overall_precision": 0.9516539440203562,
"eval_overall_recall": 0.9396984924623115,
"eval_runtime": 0.6154,
"eval_samples_per_second": 276.238,
"eval_steps_per_second": 4.875,
"step": 5088
},
{
"epoch": 54.0,
"grad_norm": 0.00200115074403584,
"learning_rate": 2.3000000000000003e-05,
"loss": 0.0009,
"step": 5184
},
{
"epoch": 54.0,
"eval_LOCATION_f1": 0.8958333333333333,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.8775510204081632,
"eval_LOCATION_recall": 0.9148936170212766,
"eval_ORGANIZATION_f1": 0.8979591836734695,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.875,
"eval_ORGANIZATION_recall": 0.9221556886227545,
"eval_PERSON_f1": 0.9705882352941176,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9777777777777777,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.12426385283470154,
"eval_overall_accuracy": 0.9825966850828729,
"eval_overall_f1": 0.9219330855018587,
"eval_overall_precision": 0.9095354523227384,
"eval_overall_recall": 0.9346733668341709,
"eval_runtime": 0.6204,
"eval_samples_per_second": 273.999,
"eval_steps_per_second": 4.835,
"step": 5184
},
{
"epoch": 55.0,
"grad_norm": 0.006822248920798302,
"learning_rate": 2.25e-05,
"loss": 0.0011,
"step": 5280
},
{
"epoch": 55.0,
"eval_LOCATION_f1": 0.9381443298969071,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.91,
"eval_LOCATION_recall": 0.9680851063829787,
"eval_ORGANIZATION_f1": 0.9161676646706587,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9161676646706587,
"eval_ORGANIZATION_recall": 0.9161676646706587,
"eval_PERSON_f1": 0.9741697416974171,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9850746268656716,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.08817728608846664,
"eval_overall_accuracy": 0.9883977900552486,
"eval_overall_f1": 0.9411764705882354,
"eval_overall_precision": 0.9376558603491272,
"eval_overall_recall": 0.9447236180904522,
"eval_runtime": 0.6164,
"eval_samples_per_second": 275.795,
"eval_steps_per_second": 4.867,
"step": 5280
},
{
"epoch": 56.0,
"grad_norm": 0.002012253738939762,
"learning_rate": 2.2000000000000003e-05,
"loss": 0.0004,
"step": 5376
},
{
"epoch": 56.0,
"eval_LOCATION_f1": 0.9479166666666666,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9285714285714286,
"eval_LOCATION_recall": 0.9680851063829787,
"eval_ORGANIZATION_f1": 0.9235474006116209,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.94375,
"eval_ORGANIZATION_recall": 0.9041916167664671,
"eval_PERSON_f1": 0.9741697416974171,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9850746268656716,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.08795258402824402,
"eval_overall_accuracy": 0.9900552486187846,
"eval_overall_f1": 0.9468354430379746,
"eval_overall_precision": 0.9540816326530612,
"eval_overall_recall": 0.9396984924623115,
"eval_runtime": 0.6131,
"eval_samples_per_second": 277.291,
"eval_steps_per_second": 4.893,
"step": 5376
},
{
"epoch": 57.0,
"grad_norm": 0.001478194841183722,
"learning_rate": 2.15e-05,
"loss": 0.0006,
"step": 5472
},
{
"epoch": 57.0,
"eval_LOCATION_f1": 0.9333333333333335,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.900990099009901,
"eval_LOCATION_recall": 0.9680851063829787,
"eval_ORGANIZATION_f1": 0.913946587537092,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9058823529411765,
"eval_ORGANIZATION_recall": 0.9221556886227545,
"eval_PERSON_f1": 0.9741697416974171,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9850746268656716,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.10102926194667816,
"eval_overall_accuracy": 0.987292817679558,
"eval_overall_f1": 0.9389788293897883,
"eval_overall_precision": 0.9308641975308642,
"eval_overall_recall": 0.9472361809045227,
"eval_runtime": 0.6159,
"eval_samples_per_second": 276.031,
"eval_steps_per_second": 4.871,
"step": 5472
},
{
"epoch": 58.0,
"grad_norm": 0.0009641240467317402,
"learning_rate": 2.1e-05,
"loss": 0.0006,
"step": 5568
},
{
"epoch": 58.0,
"eval_LOCATION_f1": 0.9333333333333335,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.900990099009901,
"eval_LOCATION_recall": 0.9680851063829787,
"eval_ORGANIZATION_f1": 0.9166666666666667,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9112426035502958,
"eval_ORGANIZATION_recall": 0.9221556886227545,
"eval_PERSON_f1": 0.9779411764705882,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9851851851851852,
"eval_PERSON_recall": 0.9708029197080292,
"eval_loss": 0.09803132712841034,
"eval_overall_accuracy": 0.9875690607734806,
"eval_overall_f1": 0.9414694894146949,
"eval_overall_precision": 0.9333333333333333,
"eval_overall_recall": 0.949748743718593,
"eval_runtime": 0.7109,
"eval_samples_per_second": 239.12,
"eval_steps_per_second": 4.22,
"step": 5568
},
{
"epoch": 59.0,
"grad_norm": 0.00035870648571290076,
"learning_rate": 2.05e-05,
"loss": 0.0003,
"step": 5664
},
{
"epoch": 59.0,
"eval_LOCATION_f1": 0.9430051813471503,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9191919191919192,
"eval_LOCATION_recall": 0.9680851063829787,
"eval_ORGANIZATION_f1": 0.9263803680981595,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.949685534591195,
"eval_ORGANIZATION_recall": 0.9041916167664671,
"eval_PERSON_f1": 0.9705882352941176,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9777777777777777,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.09932650625705719,
"eval_overall_accuracy": 0.9883977900552486,
"eval_overall_f1": 0.9456384323640961,
"eval_overall_precision": 0.9516539440203562,
"eval_overall_recall": 0.9396984924623115,
"eval_runtime": 0.6278,
"eval_samples_per_second": 270.773,
"eval_steps_per_second": 4.778,
"step": 5664
},
{
"epoch": 60.0,
"grad_norm": 0.005340063478797674,
"learning_rate": 2e-05,
"loss": 0.0003,
"step": 5760
},
{
"epoch": 60.0,
"eval_LOCATION_f1": 0.9278350515463918,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.9216867469879517,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9272727272727272,
"eval_ORGANIZATION_recall": 0.9161676646706587,
"eval_PERSON_f1": 0.9779411764705882,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9851851851851852,
"eval_PERSON_recall": 0.9708029197080292,
"eval_loss": 0.09833351522684097,
"eval_overall_accuracy": 0.9883977900552486,
"eval_overall_f1": 0.9423558897243106,
"eval_overall_precision": 0.94,
"eval_overall_recall": 0.9447236180904522,
"eval_runtime": 0.6201,
"eval_samples_per_second": 274.141,
"eval_steps_per_second": 4.838,
"step": 5760
},
{
"epoch": 61.0,
"grad_norm": 0.0003080039459746331,
"learning_rate": 1.9500000000000003e-05,
"loss": 0.0003,
"step": 5856
},
{
"epoch": 61.0,
"eval_LOCATION_f1": 0.9381443298969071,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.91,
"eval_LOCATION_recall": 0.9680851063829787,
"eval_ORGANIZATION_f1": 0.906906906906907,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9096385542168675,
"eval_ORGANIZATION_recall": 0.9041916167664671,
"eval_PERSON_f1": 0.9741697416974171,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9850746268656716,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.09371061623096466,
"eval_overall_accuracy": 0.9886740331491712,
"eval_overall_f1": 0.93734335839599,
"eval_overall_precision": 0.935,
"eval_overall_recall": 0.9396984924623115,
"eval_runtime": 0.6239,
"eval_samples_per_second": 272.497,
"eval_steps_per_second": 4.809,
"step": 5856
},
{
"epoch": 62.0,
"grad_norm": 0.0016579064540565014,
"learning_rate": 1.9e-05,
"loss": 0.0011,
"step": 5952
},
{
"epoch": 62.0,
"eval_LOCATION_f1": 0.9238578680203046,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.883495145631068,
"eval_LOCATION_recall": 0.9680851063829787,
"eval_ORGANIZATION_f1": 0.9263803680981595,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.949685534591195,
"eval_ORGANIZATION_recall": 0.9041916167664671,
"eval_PERSON_f1": 0.981549815498155,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9925373134328358,
"eval_PERSON_recall": 0.9708029197080292,
"eval_loss": 0.1108747124671936,
"eval_overall_accuracy": 0.9867403314917127,
"eval_overall_f1": 0.9445843828715367,
"eval_overall_precision": 0.946969696969697,
"eval_overall_recall": 0.9422110552763819,
"eval_runtime": 0.6246,
"eval_samples_per_second": 272.177,
"eval_steps_per_second": 4.803,
"step": 5952
},
{
"epoch": 63.0,
"grad_norm": 0.0014240954769775271,
"learning_rate": 1.85e-05,
"loss": 0.0009,
"step": 6048
},
{
"epoch": 63.0,
"eval_LOCATION_f1": 0.9479166666666666,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9285714285714286,
"eval_LOCATION_recall": 0.9680851063829787,
"eval_ORGANIZATION_f1": 0.9161676646706587,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9161676646706587,
"eval_ORGANIZATION_recall": 0.9161676646706587,
"eval_PERSON_f1": 0.9777777777777779,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9924812030075187,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.0866396427154541,
"eval_overall_accuracy": 0.9897790055248619,
"eval_overall_f1": 0.9447236180904522,
"eval_overall_precision": 0.9447236180904522,
"eval_overall_recall": 0.9447236180904522,
"eval_runtime": 0.6176,
"eval_samples_per_second": 275.269,
"eval_steps_per_second": 4.858,
"step": 6048
},
{
"epoch": 64.0,
"grad_norm": 0.0007542133680544794,
"learning_rate": 1.8e-05,
"loss": 0.0004,
"step": 6144
},
{
"epoch": 64.0,
"eval_LOCATION_f1": 0.9072164948453608,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.88,
"eval_LOCATION_recall": 0.9361702127659575,
"eval_ORGANIZATION_f1": 0.9221556886227545,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9221556886227545,
"eval_ORGANIZATION_recall": 0.9221556886227545,
"eval_PERSON_f1": 0.9777777777777779,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9924812030075187,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.1202077716588974,
"eval_overall_accuracy": 0.9848066298342542,
"eval_overall_f1": 0.93734335839599,
"eval_overall_precision": 0.935,
"eval_overall_recall": 0.9396984924623115,
"eval_runtime": 0.628,
"eval_samples_per_second": 270.7,
"eval_steps_per_second": 4.777,
"step": 6144
},
{
"epoch": 65.0,
"grad_norm": 0.0002191825769841671,
"learning_rate": 1.75e-05,
"loss": 0.0023,
"step": 6240
},
{
"epoch": 65.0,
"eval_LOCATION_f1": 0.9533678756476683,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9292929292929293,
"eval_LOCATION_recall": 0.9787234042553191,
"eval_ORGANIZATION_f1": 0.9189189189189191,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9216867469879518,
"eval_ORGANIZATION_recall": 0.9161676646706587,
"eval_PERSON_f1": 0.9852941176470589,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9925925925925926,
"eval_PERSON_recall": 0.9781021897810219,
"eval_loss": 0.09679195284843445,
"eval_overall_accuracy": 0.9883977900552486,
"eval_overall_f1": 0.9498746867167919,
"eval_overall_precision": 0.9475,
"eval_overall_recall": 0.9522613065326633,
"eval_runtime": 0.6251,
"eval_samples_per_second": 271.962,
"eval_steps_per_second": 4.799,
"step": 6240
},
{
"epoch": 66.0,
"grad_norm": 0.0010986309498548508,
"learning_rate": 1.7000000000000003e-05,
"loss": 0.0017,
"step": 6336
},
{
"epoch": 66.0,
"eval_LOCATION_f1": 0.9430051813471503,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9191919191919192,
"eval_LOCATION_recall": 0.9680851063829787,
"eval_ORGANIZATION_f1": 0.9300911854103343,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9444444444444444,
"eval_ORGANIZATION_recall": 0.9161676646706587,
"eval_PERSON_f1": 0.981549815498155,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9925373134328358,
"eval_PERSON_recall": 0.9708029197080292,
"eval_loss": 0.10312038660049438,
"eval_overall_accuracy": 0.9875690607734806,
"eval_overall_f1": 0.9508196721311476,
"eval_overall_precision": 0.9544303797468354,
"eval_overall_recall": 0.9472361809045227,
"eval_runtime": 0.7092,
"eval_samples_per_second": 239.702,
"eval_steps_per_second": 4.23,
"step": 6336
},
{
"epoch": 67.0,
"grad_norm": 0.0005643566255457699,
"learning_rate": 1.65e-05,
"loss": 0.0014,
"step": 6432
},
{
"epoch": 67.0,
"eval_LOCATION_f1": 0.9326424870466321,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9090909090909091,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.9263803680981595,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.949685534591195,
"eval_ORGANIZATION_recall": 0.9041916167664671,
"eval_PERSON_f1": 0.981549815498155,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9925373134328358,
"eval_PERSON_recall": 0.9708029197080292,
"eval_loss": 0.10499503463506699,
"eval_overall_accuracy": 0.9881215469613259,
"eval_overall_f1": 0.9468354430379746,
"eval_overall_precision": 0.9540816326530612,
"eval_overall_recall": 0.9396984924623115,
"eval_runtime": 0.6298,
"eval_samples_per_second": 269.943,
"eval_steps_per_second": 4.764,
"step": 6432
},
{
"epoch": 68.0,
"grad_norm": 0.0005254722782410681,
"learning_rate": 1.6000000000000003e-05,
"loss": 0.0007,
"step": 6528
},
{
"epoch": 68.0,
"eval_LOCATION_f1": 0.9430051813471503,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9191919191919192,
"eval_LOCATION_recall": 0.9680851063829787,
"eval_ORGANIZATION_f1": 0.9259259259259259,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9554140127388535,
"eval_ORGANIZATION_recall": 0.8982035928143712,
"eval_PERSON_f1": 0.9851851851851852,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 1.0,
"eval_PERSON_recall": 0.9708029197080292,
"eval_loss": 0.10490843653678894,
"eval_overall_accuracy": 0.9892265193370166,
"eval_overall_f1": 0.9504447268106734,
"eval_overall_precision": 0.961439588688946,
"eval_overall_recall": 0.9396984924623115,
"eval_runtime": 0.61,
"eval_samples_per_second": 278.701,
"eval_steps_per_second": 4.918,
"step": 6528
},
{
"epoch": 69.0,
"grad_norm": 0.018979080021381378,
"learning_rate": 1.55e-05,
"loss": 0.0005,
"step": 6624
},
{
"epoch": 69.0,
"eval_LOCATION_f1": 0.9375000000000001,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9183673469387755,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.9166666666666667,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9112426035502958,
"eval_ORGANIZATION_recall": 0.9221556886227545,
"eval_PERSON_f1": 0.9741697416974171,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9850746268656716,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.09969516843557358,
"eval_overall_accuracy": 0.9859116022099448,
"eval_overall_f1": 0.9411764705882354,
"eval_overall_precision": 0.9376558603491272,
"eval_overall_recall": 0.9447236180904522,
"eval_runtime": 0.6163,
"eval_samples_per_second": 275.818,
"eval_steps_per_second": 4.867,
"step": 6624
},
{
"epoch": 70.0,
"grad_norm": 0.00027675795718096197,
"learning_rate": 1.5e-05,
"loss": 0.001,
"step": 6720
},
{
"epoch": 70.0,
"eval_LOCATION_f1": 0.9375000000000001,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9183673469387755,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.9198813056379822,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9117647058823529,
"eval_ORGANIZATION_recall": 0.9281437125748503,
"eval_PERSON_f1": 0.9741697416974171,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9850746268656716,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.1053897961974144,
"eval_overall_accuracy": 0.9875690607734806,
"eval_overall_f1": 0.9425,
"eval_overall_precision": 0.9378109452736318,
"eval_overall_recall": 0.9472361809045227,
"eval_runtime": 0.6397,
"eval_samples_per_second": 265.745,
"eval_steps_per_second": 4.69,
"step": 6720
},
{
"epoch": 71.0,
"grad_norm": 0.00024086404300760478,
"learning_rate": 1.45e-05,
"loss": 0.0005,
"step": 6816
},
{
"epoch": 71.0,
"eval_LOCATION_f1": 0.9430051813471503,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9191919191919192,
"eval_LOCATION_recall": 0.9680851063829787,
"eval_ORGANIZATION_f1": 0.9357798165137615,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.95625,
"eval_ORGANIZATION_recall": 0.9161676646706587,
"eval_PERSON_f1": 0.9741697416974171,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9850746268656716,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.09782951325178146,
"eval_overall_accuracy": 0.9900552486187846,
"eval_overall_f1": 0.9506953223767383,
"eval_overall_precision": 0.9567430025445293,
"eval_overall_recall": 0.9447236180904522,
"eval_runtime": 0.6144,
"eval_samples_per_second": 276.707,
"eval_steps_per_second": 4.883,
"step": 6816
},
{
"epoch": 72.0,
"grad_norm": 0.005460801534354687,
"learning_rate": 1.4000000000000001e-05,
"loss": 0.0008,
"step": 6912
},
{
"epoch": 72.0,
"eval_LOCATION_f1": 0.9368421052631578,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9270833333333334,
"eval_LOCATION_recall": 0.9468085106382979,
"eval_ORGANIZATION_f1": 0.9272727272727274,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9386503067484663,
"eval_ORGANIZATION_recall": 0.9161676646706587,
"eval_PERSON_f1": 0.9741697416974171,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9850746268656716,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.0954757034778595,
"eval_overall_accuracy": 0.9886740331491712,
"eval_overall_f1": 0.9456384323640961,
"eval_overall_precision": 0.9516539440203562,
"eval_overall_recall": 0.9396984924623115,
"eval_runtime": 0.6066,
"eval_samples_per_second": 280.257,
"eval_steps_per_second": 4.946,
"step": 6912
},
{
"epoch": 73.0,
"grad_norm": 0.0004871623241342604,
"learning_rate": 1.3500000000000001e-05,
"loss": 0.0005,
"step": 7008
},
{
"epoch": 73.0,
"eval_LOCATION_f1": 0.9424083769633509,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9278350515463918,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.9329268292682927,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9503105590062112,
"eval_ORGANIZATION_recall": 0.9161676646706587,
"eval_PERSON_f1": 0.9741697416974171,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9850746268656716,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.10084227472543716,
"eval_overall_accuracy": 0.9892265193370166,
"eval_overall_f1": 0.949367088607595,
"eval_overall_precision": 0.9566326530612245,
"eval_overall_recall": 0.9422110552763819,
"eval_runtime": 0.6223,
"eval_samples_per_second": 273.189,
"eval_steps_per_second": 4.821,
"step": 7008
},
{
"epoch": 74.0,
"grad_norm": 0.00226827641017735,
"learning_rate": 1.3000000000000001e-05,
"loss": 0.0004,
"step": 7104
},
{
"epoch": 74.0,
"eval_LOCATION_f1": 0.9424083769633509,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9278350515463918,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.929663608562691,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.95,
"eval_ORGANIZATION_recall": 0.9101796407185628,
"eval_PERSON_f1": 0.966789667896679,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9776119402985075,
"eval_PERSON_recall": 0.9562043795620438,
"eval_loss": 0.1032579094171524,
"eval_overall_accuracy": 0.9883977900552486,
"eval_overall_f1": 0.9455006337135614,
"eval_overall_precision": 0.9539641943734015,
"eval_overall_recall": 0.9371859296482412,
"eval_runtime": 0.657,
"eval_samples_per_second": 258.764,
"eval_steps_per_second": 4.566,
"step": 7104
},
{
"epoch": 75.0,
"grad_norm": 0.0031442521139979362,
"learning_rate": 1.25e-05,
"loss": 0.0005,
"step": 7200
},
{
"epoch": 75.0,
"eval_LOCATION_f1": 0.9424083769633509,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9278350515463918,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.9320987654320988,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9617834394904459,
"eval_ORGANIZATION_recall": 0.9041916167664671,
"eval_PERSON_f1": 0.9703703703703703,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9849624060150376,
"eval_PERSON_recall": 0.9562043795620438,
"eval_loss": 0.11296577751636505,
"eval_overall_accuracy": 0.9886740331491712,
"eval_overall_f1": 0.9477707006369427,
"eval_overall_precision": 0.9612403100775194,
"eval_overall_recall": 0.9346733668341709,
"eval_runtime": 0.6204,
"eval_samples_per_second": 274.019,
"eval_steps_per_second": 4.836,
"step": 7200
},
{
"epoch": 76.0,
"grad_norm": 0.001323927310295403,
"learning_rate": 1.2e-05,
"loss": 0.0007,
"step": 7296
},
{
"epoch": 76.0,
"eval_LOCATION_f1": 0.9424083769633509,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9278350515463918,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.9244712990936556,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9329268292682927,
"eval_ORGANIZATION_recall": 0.9161676646706587,
"eval_PERSON_f1": 0.966789667896679,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9776119402985075,
"eval_PERSON_recall": 0.9562043795620438,
"eval_loss": 0.1114824041724205,
"eval_overall_accuracy": 0.9883977900552486,
"eval_overall_f1": 0.9432534678436318,
"eval_overall_precision": 0.9468354430379747,
"eval_overall_recall": 0.9396984924623115,
"eval_runtime": 0.6209,
"eval_samples_per_second": 273.776,
"eval_steps_per_second": 4.831,
"step": 7296
},
{
"epoch": 77.0,
"grad_norm": 0.003065042197704315,
"learning_rate": 1.1500000000000002e-05,
"loss": 0.0006,
"step": 7392
},
{
"epoch": 77.0,
"eval_LOCATION_f1": 0.9424083769633509,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9278350515463918,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.9259259259259259,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9554140127388535,
"eval_ORGANIZATION_recall": 0.8982035928143712,
"eval_PERSON_f1": 0.9779411764705882,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9851851851851852,
"eval_PERSON_recall": 0.9708029197080292,
"eval_loss": 0.112979955971241,
"eval_overall_accuracy": 0.988950276243094,
"eval_overall_f1": 0.9479034307496823,
"eval_overall_precision": 0.9588688946015425,
"eval_overall_recall": 0.9371859296482412,
"eval_runtime": 0.6315,
"eval_samples_per_second": 269.218,
"eval_steps_per_second": 4.751,
"step": 7392
},
{
"epoch": 78.0,
"grad_norm": 7.085573196411133,
"learning_rate": 1.1000000000000001e-05,
"loss": 0.0005,
"step": 7488
},
{
"epoch": 78.0,
"eval_LOCATION_f1": 0.9424083769633509,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9278350515463918,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.9141104294478527,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9371069182389937,
"eval_ORGANIZATION_recall": 0.8922155688622755,
"eval_PERSON_f1": 0.9632352941176471,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9703703703703703,
"eval_PERSON_recall": 0.9562043795620438,
"eval_loss": 0.11508027464151382,
"eval_overall_accuracy": 0.9875690607734806,
"eval_overall_f1": 0.9378960709759189,
"eval_overall_precision": 0.9462915601023018,
"eval_overall_recall": 0.9296482412060302,
"eval_runtime": 0.6139,
"eval_samples_per_second": 276.907,
"eval_steps_per_second": 4.887,
"step": 7488
},
{
"epoch": 79.0,
"grad_norm": 0.0023044480476528406,
"learning_rate": 1.05e-05,
"loss": 0.0003,
"step": 7584
},
{
"epoch": 79.0,
"eval_LOCATION_f1": 0.9424083769633509,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9278350515463918,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.9268292682926829,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9440993788819876,
"eval_ORGANIZATION_recall": 0.9101796407185628,
"eval_PERSON_f1": 0.9741697416974171,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9850746268656716,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.11096746474504471,
"eval_overall_accuracy": 0.9886740331491712,
"eval_overall_f1": 0.9468354430379746,
"eval_overall_precision": 0.9540816326530612,
"eval_overall_recall": 0.9396984924623115,
"eval_runtime": 0.6643,
"eval_samples_per_second": 255.917,
"eval_steps_per_second": 4.516,
"step": 7584
},
{
"epoch": 80.0,
"grad_norm": 0.00011201861343579367,
"learning_rate": 1e-05,
"loss": 0.0002,
"step": 7680
},
{
"epoch": 80.0,
"eval_LOCATION_f1": 0.9424083769633509,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9278350515463918,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.9268292682926829,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9440993788819876,
"eval_ORGANIZATION_recall": 0.9101796407185628,
"eval_PERSON_f1": 0.9741697416974171,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9850746268656716,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.11268793046474457,
"eval_overall_accuracy": 0.9886740331491712,
"eval_overall_f1": 0.9468354430379746,
"eval_overall_precision": 0.9540816326530612,
"eval_overall_recall": 0.9396984924623115,
"eval_runtime": 0.6122,
"eval_samples_per_second": 277.679,
"eval_steps_per_second": 4.9,
"step": 7680
},
{
"epoch": 81.0,
"grad_norm": 0.0002784592506941408,
"learning_rate": 9.5e-06,
"loss": 0.0003,
"step": 7776
},
{
"epoch": 81.0,
"eval_LOCATION_f1": 0.9424083769633509,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9278350515463918,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.9268292682926829,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9440993788819876,
"eval_ORGANIZATION_recall": 0.9101796407185628,
"eval_PERSON_f1": 0.9741697416974171,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9850746268656716,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.11348237097263336,
"eval_overall_accuracy": 0.9886740331491712,
"eval_overall_f1": 0.9468354430379746,
"eval_overall_precision": 0.9540816326530612,
"eval_overall_recall": 0.9396984924623115,
"eval_runtime": 0.6095,
"eval_samples_per_second": 278.928,
"eval_steps_per_second": 4.922,
"step": 7776
},
{
"epoch": 82.0,
"grad_norm": 0.00022091029677540064,
"learning_rate": 9e-06,
"loss": 0.0003,
"step": 7872
},
{
"epoch": 82.0,
"eval_LOCATION_f1": 0.9424083769633509,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9278350515463918,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.9268292682926829,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9440993788819876,
"eval_ORGANIZATION_recall": 0.9101796407185628,
"eval_PERSON_f1": 0.9741697416974171,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9850746268656716,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.10818831622600555,
"eval_overall_accuracy": 0.9886740331491712,
"eval_overall_f1": 0.9468354430379746,
"eval_overall_precision": 0.9540816326530612,
"eval_overall_recall": 0.9396984924623115,
"eval_runtime": 0.6203,
"eval_samples_per_second": 274.071,
"eval_steps_per_second": 4.837,
"step": 7872
},
{
"epoch": 83.0,
"grad_norm": 0.00032480747904628515,
"learning_rate": 8.500000000000002e-06,
"loss": 0.0006,
"step": 7968
},
{
"epoch": 83.0,
"eval_LOCATION_f1": 0.9430051813471503,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9191919191919192,
"eval_LOCATION_recall": 0.9680851063829787,
"eval_ORGANIZATION_f1": 0.937888198757764,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9741935483870968,
"eval_ORGANIZATION_recall": 0.9041916167664671,
"eval_PERSON_f1": 0.9779411764705882,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9851851851851852,
"eval_PERSON_recall": 0.9708029197080292,
"eval_loss": 0.11552965641021729,
"eval_overall_accuracy": 0.9895027624309393,
"eval_overall_f1": 0.9529860228716646,
"eval_overall_precision": 0.9640102827763496,
"eval_overall_recall": 0.9422110552763819,
"eval_runtime": 0.623,
"eval_samples_per_second": 272.886,
"eval_steps_per_second": 4.816,
"step": 7968
},
{
"epoch": 84.0,
"grad_norm": 0.0005326655227690935,
"learning_rate": 8.000000000000001e-06,
"loss": 0.0003,
"step": 8064
},
{
"epoch": 84.0,
"eval_LOCATION_f1": 0.9479166666666666,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9285714285714286,
"eval_LOCATION_recall": 0.9680851063829787,
"eval_ORGANIZATION_f1": 0.9386503067484663,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9622641509433962,
"eval_ORGANIZATION_recall": 0.9161676646706587,
"eval_PERSON_f1": 0.9741697416974171,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9850746268656716,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.10718917846679688,
"eval_overall_accuracy": 0.9897790055248619,
"eval_overall_f1": 0.9531051964512041,
"eval_overall_precision": 0.9616368286445013,
"eval_overall_recall": 0.9447236180904522,
"eval_runtime": 0.616,
"eval_samples_per_second": 275.964,
"eval_steps_per_second": 4.87,
"step": 8064
},
{
"epoch": 85.0,
"grad_norm": 0.0004018662730231881,
"learning_rate": 7.5e-06,
"loss": 0.0007,
"step": 8160
},
{
"epoch": 85.0,
"eval_LOCATION_f1": 0.9424083769633509,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9278350515463918,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.9272727272727274,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9386503067484663,
"eval_ORGANIZATION_recall": 0.9161676646706587,
"eval_PERSON_f1": 0.9741697416974171,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9850746268656716,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.10133817046880722,
"eval_overall_accuracy": 0.9895027624309393,
"eval_overall_f1": 0.946969696969697,
"eval_overall_precision": 0.9517766497461929,
"eval_overall_recall": 0.9422110552763819,
"eval_runtime": 0.6043,
"eval_samples_per_second": 281.311,
"eval_steps_per_second": 4.964,
"step": 8160
},
{
"epoch": 86.0,
"grad_norm": 0.002058778889477253,
"learning_rate": 7.000000000000001e-06,
"loss": 0.0003,
"step": 8256
},
{
"epoch": 86.0,
"eval_LOCATION_f1": 0.9424083769633509,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9278350515463918,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.9300911854103343,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9444444444444444,
"eval_ORGANIZATION_recall": 0.9161676646706587,
"eval_PERSON_f1": 0.9741697416974171,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9850746268656716,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.10222224146127701,
"eval_overall_accuracy": 0.9897790055248619,
"eval_overall_f1": 0.9481668773704173,
"eval_overall_precision": 0.9541984732824428,
"eval_overall_recall": 0.9422110552763819,
"eval_runtime": 0.6385,
"eval_samples_per_second": 266.268,
"eval_steps_per_second": 4.699,
"step": 8256
},
{
"epoch": 87.0,
"grad_norm": 0.00029380357591435313,
"learning_rate": 6.5000000000000004e-06,
"loss": 0.0002,
"step": 8352
},
{
"epoch": 87.0,
"eval_LOCATION_f1": 0.9424083769633509,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9278350515463918,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.9300911854103343,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9444444444444444,
"eval_ORGANIZATION_recall": 0.9161676646706587,
"eval_PERSON_f1": 0.9741697416974171,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9850746268656716,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.10264620184898376,
"eval_overall_accuracy": 0.9897790055248619,
"eval_overall_f1": 0.9481668773704173,
"eval_overall_precision": 0.9541984732824428,
"eval_overall_recall": 0.9422110552763819,
"eval_runtime": 0.6718,
"eval_samples_per_second": 253.056,
"eval_steps_per_second": 4.466,
"step": 8352
},
{
"epoch": 88.0,
"grad_norm": 0.00025997136253863573,
"learning_rate": 6e-06,
"loss": 0.0002,
"step": 8448
},
{
"epoch": 88.0,
"eval_LOCATION_f1": 0.9424083769633509,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9278350515463918,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.9300911854103343,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9444444444444444,
"eval_ORGANIZATION_recall": 0.9161676646706587,
"eval_PERSON_f1": 0.9741697416974171,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9850746268656716,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.10285894572734833,
"eval_overall_accuracy": 0.9897790055248619,
"eval_overall_f1": 0.9481668773704173,
"eval_overall_precision": 0.9541984732824428,
"eval_overall_recall": 0.9422110552763819,
"eval_runtime": 0.6216,
"eval_samples_per_second": 273.509,
"eval_steps_per_second": 4.827,
"step": 8448
},
{
"epoch": 89.0,
"grad_norm": 0.19176463782787323,
"learning_rate": 5.500000000000001e-06,
"loss": 0.0003,
"step": 8544
},
{
"epoch": 89.0,
"eval_LOCATION_f1": 0.9424083769633509,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9278350515463918,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.9300911854103343,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9444444444444444,
"eval_ORGANIZATION_recall": 0.9161676646706587,
"eval_PERSON_f1": 0.9741697416974171,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9850746268656716,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.1034075915813446,
"eval_overall_accuracy": 0.9897790055248619,
"eval_overall_f1": 0.9481668773704173,
"eval_overall_precision": 0.9541984732824428,
"eval_overall_recall": 0.9422110552763819,
"eval_runtime": 0.6284,
"eval_samples_per_second": 270.534,
"eval_steps_per_second": 4.774,
"step": 8544
},
{
"epoch": 90.0,
"grad_norm": 9.726906137075275e-05,
"learning_rate": 5e-06,
"loss": 0.0003,
"step": 8640
},
{
"epoch": 90.0,
"eval_LOCATION_f1": 0.9424083769633509,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9278350515463918,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.9357798165137615,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.95625,
"eval_ORGANIZATION_recall": 0.9161676646706587,
"eval_PERSON_f1": 0.9741697416974171,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9850746268656716,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.10428432375192642,
"eval_overall_accuracy": 0.9897790055248619,
"eval_overall_f1": 0.9505703422053232,
"eval_overall_precision": 0.959079283887468,
"eval_overall_recall": 0.9422110552763819,
"eval_runtime": 0.6211,
"eval_samples_per_second": 273.713,
"eval_steps_per_second": 4.83,
"step": 8640
},
{
"epoch": 91.0,
"grad_norm": 0.0001318985887337476,
"learning_rate": 4.5e-06,
"loss": 0.0002,
"step": 8736
},
{
"epoch": 91.0,
"eval_LOCATION_f1": 0.9424083769633509,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9278350515463918,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.929663608562691,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.95,
"eval_ORGANIZATION_recall": 0.9101796407185628,
"eval_PERSON_f1": 0.9741697416974171,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9850746268656716,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.10446962714195251,
"eval_overall_accuracy": 0.9892265193370166,
"eval_overall_f1": 0.9480354879594423,
"eval_overall_precision": 0.9565217391304348,
"eval_overall_recall": 0.9396984924623115,
"eval_runtime": 0.6186,
"eval_samples_per_second": 274.801,
"eval_steps_per_second": 4.849,
"step": 8736
},
{
"epoch": 92.0,
"grad_norm": 0.0003957097651436925,
"learning_rate": 4.000000000000001e-06,
"loss": 0.0002,
"step": 8832
},
{
"epoch": 92.0,
"eval_LOCATION_f1": 0.9424083769633509,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9278350515463918,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.9329268292682927,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9503105590062112,
"eval_ORGANIZATION_recall": 0.9161676646706587,
"eval_PERSON_f1": 0.9741697416974171,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9850746268656716,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.10467536002397537,
"eval_overall_accuracy": 0.9895027624309393,
"eval_overall_f1": 0.949367088607595,
"eval_overall_precision": 0.9566326530612245,
"eval_overall_recall": 0.9422110552763819,
"eval_runtime": 0.6214,
"eval_samples_per_second": 273.573,
"eval_steps_per_second": 4.828,
"step": 8832
},
{
"epoch": 93.0,
"grad_norm": 0.00048287183744832873,
"learning_rate": 3.5000000000000004e-06,
"loss": 0.0003,
"step": 8928
},
{
"epoch": 93.0,
"eval_LOCATION_f1": 0.9424083769633509,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9278350515463918,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.929663608562691,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.95,
"eval_ORGANIZATION_recall": 0.9101796407185628,
"eval_PERSON_f1": 0.9741697416974171,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9850746268656716,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.10538303107023239,
"eval_overall_accuracy": 0.9897790055248619,
"eval_overall_f1": 0.9480354879594423,
"eval_overall_precision": 0.9565217391304348,
"eval_overall_recall": 0.9396984924623115,
"eval_runtime": 0.6144,
"eval_samples_per_second": 276.699,
"eval_steps_per_second": 4.883,
"step": 8928
},
{
"epoch": 94.0,
"grad_norm": 0.00010792938701342791,
"learning_rate": 3e-06,
"loss": 0.0009,
"step": 9024
},
{
"epoch": 94.0,
"eval_LOCATION_f1": 0.9424083769633509,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9278350515463918,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.9325153374233129,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9559748427672956,
"eval_ORGANIZATION_recall": 0.9101796407185628,
"eval_PERSON_f1": 0.9741697416974171,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9850746268656716,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.10885108262300491,
"eval_overall_accuracy": 0.9895027624309393,
"eval_overall_f1": 0.9492385786802031,
"eval_overall_precision": 0.958974358974359,
"eval_overall_recall": 0.9396984924623115,
"eval_runtime": 0.6137,
"eval_samples_per_second": 277.001,
"eval_steps_per_second": 4.888,
"step": 9024
},
{
"epoch": 95.0,
"grad_norm": 0.00041213424992747605,
"learning_rate": 2.5e-06,
"loss": 0.0004,
"step": 9120
},
{
"epoch": 95.0,
"eval_LOCATION_f1": 0.9424083769633509,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9278350515463918,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.9268292682926829,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9440993788819876,
"eval_ORGANIZATION_recall": 0.9101796407185628,
"eval_PERSON_f1": 0.9741697416974171,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9850746268656716,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.10332932323217392,
"eval_overall_accuracy": 0.9895027624309393,
"eval_overall_f1": 0.9468354430379746,
"eval_overall_precision": 0.9540816326530612,
"eval_overall_recall": 0.9396984924623115,
"eval_runtime": 0.6203,
"eval_samples_per_second": 274.044,
"eval_steps_per_second": 4.836,
"step": 9120
},
{
"epoch": 96.0,
"grad_norm": 0.0002837861829902977,
"learning_rate": 2.0000000000000003e-06,
"loss": 0.0002,
"step": 9216
},
{
"epoch": 96.0,
"eval_LOCATION_f1": 0.9424083769633509,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9278350515463918,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.9268292682926829,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9440993788819876,
"eval_ORGANIZATION_recall": 0.9101796407185628,
"eval_PERSON_f1": 0.9741697416974171,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9850746268656716,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.10279857367277145,
"eval_overall_accuracy": 0.9895027624309393,
"eval_overall_f1": 0.9468354430379746,
"eval_overall_precision": 0.9540816326530612,
"eval_overall_recall": 0.9396984924623115,
"eval_runtime": 0.6235,
"eval_samples_per_second": 272.654,
"eval_steps_per_second": 4.812,
"step": 9216
},
{
"epoch": 97.0,
"grad_norm": 0.0002584067406132817,
"learning_rate": 1.5e-06,
"loss": 0.0002,
"step": 9312
},
{
"epoch": 97.0,
"eval_LOCATION_f1": 0.9424083769633509,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9278350515463918,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.9268292682926829,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.9440993788819876,
"eval_ORGANIZATION_recall": 0.9101796407185628,
"eval_PERSON_f1": 0.9741697416974171,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9850746268656716,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.10300398617982864,
"eval_overall_accuracy": 0.9895027624309393,
"eval_overall_f1": 0.9468354430379746,
"eval_overall_precision": 0.9540816326530612,
"eval_overall_recall": 0.9396984924623115,
"eval_runtime": 0.6161,
"eval_samples_per_second": 275.938,
"eval_steps_per_second": 4.869,
"step": 9312
},
{
"epoch": 98.0,
"grad_norm": 0.00020491515169851482,
"learning_rate": 1.0000000000000002e-06,
"loss": 0.0003,
"step": 9408
},
{
"epoch": 98.0,
"eval_LOCATION_f1": 0.9424083769633509,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9278350515463918,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.929663608562691,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.95,
"eval_ORGANIZATION_recall": 0.9101796407185628,
"eval_PERSON_f1": 0.9741697416974171,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9850746268656716,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.10345587879419327,
"eval_overall_accuracy": 0.9892265193370166,
"eval_overall_f1": 0.9480354879594423,
"eval_overall_precision": 0.9565217391304348,
"eval_overall_recall": 0.9396984924623115,
"eval_runtime": 0.6258,
"eval_samples_per_second": 271.659,
"eval_steps_per_second": 4.794,
"step": 9408
},
{
"epoch": 99.0,
"grad_norm": 0.0002451244508847594,
"learning_rate": 5.000000000000001e-07,
"loss": 0.0002,
"step": 9504
},
{
"epoch": 99.0,
"eval_LOCATION_f1": 0.9424083769633509,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9278350515463918,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.929663608562691,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.95,
"eval_ORGANIZATION_recall": 0.9101796407185628,
"eval_PERSON_f1": 0.9741697416974171,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9850746268656716,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.10355650633573532,
"eval_overall_accuracy": 0.9892265193370166,
"eval_overall_f1": 0.9480354879594423,
"eval_overall_precision": 0.9565217391304348,
"eval_overall_recall": 0.9396984924623115,
"eval_runtime": 0.6161,
"eval_samples_per_second": 275.943,
"eval_steps_per_second": 4.87,
"step": 9504
},
{
"epoch": 100.0,
"grad_norm": 0.0001467197434976697,
"learning_rate": 0.0,
"loss": 0.0002,
"step": 9600
},
{
"epoch": 100.0,
"eval_LOCATION_f1": 0.9424083769633509,
"eval_LOCATION_number": 94,
"eval_LOCATION_precision": 0.9278350515463918,
"eval_LOCATION_recall": 0.9574468085106383,
"eval_ORGANIZATION_f1": 0.929663608562691,
"eval_ORGANIZATION_number": 167,
"eval_ORGANIZATION_precision": 0.95,
"eval_ORGANIZATION_recall": 0.9101796407185628,
"eval_PERSON_f1": 0.9741697416974171,
"eval_PERSON_number": 137,
"eval_PERSON_precision": 0.9850746268656716,
"eval_PERSON_recall": 0.9635036496350365,
"eval_loss": 0.10357167571783066,
"eval_overall_accuracy": 0.9892265193370166,
"eval_overall_f1": 0.9480354879594423,
"eval_overall_precision": 0.9565217391304348,
"eval_overall_recall": 0.9396984924623115,
"eval_runtime": 0.6779,
"eval_samples_per_second": 250.774,
"eval_steps_per_second": 4.425,
"step": 9600
},
{
"epoch": 100.0,
"step": 9600,
"total_flos": 3851325939318660.0,
"train_loss": 0.005652450745304426,
"train_runtime": 2268.3568,
"train_samples_per_second": 67.45,
"train_steps_per_second": 4.232
}
],
"logging_steps": 500,
"max_steps": 9600,
"num_input_tokens_seen": 0,
"num_train_epochs": 100,
"save_steps": 500,
"total_flos": 3851325939318660.0,
"train_batch_size": 16,
"trial_name": null,
"trial_params": null
}