|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 100.0, |
|
"eval_steps": 500, |
|
"global_step": 10600, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"grad_norm": 3.6827080249786377, |
|
"learning_rate": 4.9500000000000004e-05, |
|
"loss": 0.3501, |
|
"step": 106 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_LOCATION_f1": 0.7483870967741935, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6904761904761905, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.6709677419354838, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5777777777777777, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8679245283018867, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8214285714285714, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7123287671232875, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.65, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.896551724137931, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.13337989151477814, |
|
"eval_overall_accuracy": 0.953443258971872, |
|
"eval_overall_f1": 0.7905138339920948, |
|
"eval_overall_precision": 0.7281553398058253, |
|
"eval_overall_recall": 0.8645533141210374, |
|
"eval_runtime": 0.9448, |
|
"eval_samples_per_second": 197.919, |
|
"eval_steps_per_second": 3.175, |
|
"step": 106 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"grad_norm": 2.115112781524658, |
|
"learning_rate": 4.9e-05, |
|
"loss": 0.1148, |
|
"step": 212 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_LOCATION_f1": 0.7612903225806451, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7023809523809523, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.697986577181208, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6190476190476191, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8996763754045306, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8742138364779874, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.6329113924050633, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5434782608695652, |
|
"eval_QUANTITY_recall": 0.7575757575757576, |
|
"eval_TIME_f1": 0.7692307692307693, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.6756756756756757, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1362091302871704, |
|
"eval_overall_accuracy": 0.9558680892337537, |
|
"eval_overall_f1": 0.7926023778071334, |
|
"eval_overall_precision": 0.7317073170731707, |
|
"eval_overall_recall": 0.8645533141210374, |
|
"eval_runtime": 0.9986, |
|
"eval_samples_per_second": 187.27, |
|
"eval_steps_per_second": 3.004, |
|
"step": 212 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"grad_norm": 2.7631375789642334, |
|
"learning_rate": 4.85e-05, |
|
"loss": 0.0732, |
|
"step": 318 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_LOCATION_f1": 0.7662337662337662, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7108433734939759, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7702702702702702, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6867469879518072, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8766233766233766, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8544303797468354, |
|
"eval_PERSON_recall": 0.9, |
|
"eval_QUANTITY_f1": 0.8285714285714285, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7837837837837838, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.806451612903226, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7352941176470589, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.14412528276443481, |
|
"eval_overall_accuracy": 0.9573229873908826, |
|
"eval_overall_f1": 0.8221024258760108, |
|
"eval_overall_precision": 0.7721518987341772, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.9223, |
|
"eval_samples_per_second": 202.756, |
|
"eval_steps_per_second": 3.253, |
|
"step": 318 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"grad_norm": 1.3901716470718384, |
|
"learning_rate": 4.8e-05, |
|
"loss": 0.0453, |
|
"step": 424 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_LOCATION_f1": 0.8079470198675496, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7625, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7123287671232877, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6419753086419753, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8996763754045306, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8742138364779874, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8214285714285714, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8214285714285714, |
|
"eval_TIME_recall": 0.8214285714285714, |
|
"eval_loss": 0.1702796369791031, |
|
"eval_overall_accuracy": 0.9570805043646945, |
|
"eval_overall_f1": 0.8260869565217391, |
|
"eval_overall_precision": 0.781491002570694, |
|
"eval_overall_recall": 0.8760806916426513, |
|
"eval_runtime": 0.94, |
|
"eval_samples_per_second": 198.941, |
|
"eval_steps_per_second": 3.192, |
|
"step": 424 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"grad_norm": 0.532292902469635, |
|
"learning_rate": 4.75e-05, |
|
"loss": 0.0312, |
|
"step": 530 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_LOCATION_f1": 0.8051948051948051, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7469879518072289, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7832167832167831, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.717948717948718, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8810289389067525, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8509316770186336, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.17514730989933014, |
|
"eval_overall_accuracy": 0.9612027158098934, |
|
"eval_overall_f1": 0.8324324324324324, |
|
"eval_overall_precision": 0.7837150127226463, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.9647, |
|
"eval_samples_per_second": 193.847, |
|
"eval_steps_per_second": 3.11, |
|
"step": 530 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"grad_norm": 5.477240085601807, |
|
"learning_rate": 4.7e-05, |
|
"loss": 0.0236, |
|
"step": 636 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_LOCATION_f1": 0.7712418300653594, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7195121951219512, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7482993197278912, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6707317073170732, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.90032154340836, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8695652173913043, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.75, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.6666666666666666, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.20889906585216522, |
|
"eval_overall_accuracy": 0.9570805043646945, |
|
"eval_overall_f1": 0.8197596795727637, |
|
"eval_overall_precision": 0.763681592039801, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.9433, |
|
"eval_samples_per_second": 198.231, |
|
"eval_steps_per_second": 3.18, |
|
"step": 636 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"grad_norm": 2.7495665550231934, |
|
"learning_rate": 4.6500000000000005e-05, |
|
"loss": 0.017, |
|
"step": 742 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_LOCATION_f1": 0.8275862068965518, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.8108108108108109, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.763888888888889, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6962025316455697, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8925081433224756, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8726114649681529, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.8108108108108109, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7317073170731707, |
|
"eval_QUANTITY_recall": 0.9090909090909091, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.21119879186153412, |
|
"eval_overall_accuracy": 0.957807953443259, |
|
"eval_overall_f1": 0.8406593406593407, |
|
"eval_overall_precision": 0.8031496062992126, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.9486, |
|
"eval_samples_per_second": 197.142, |
|
"eval_steps_per_second": 3.163, |
|
"step": 742 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"grad_norm": 0.43028321862220764, |
|
"learning_rate": 4.600000000000001e-05, |
|
"loss": 0.0133, |
|
"step": 848 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_LOCATION_f1": 0.8211920529801324, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.775, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7862068965517242, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7125, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8996763754045306, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8742138364779874, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.8108108108108109, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7317073170731707, |
|
"eval_QUANTITY_recall": 0.9090909090909091, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.21715472638607025, |
|
"eval_overall_accuracy": 0.9602327837051406, |
|
"eval_overall_f1": 0.8466757123473542, |
|
"eval_overall_precision": 0.8, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.9553, |
|
"eval_samples_per_second": 195.744, |
|
"eval_steps_per_second": 3.14, |
|
"step": 848 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"grad_norm": 0.03873327746987343, |
|
"learning_rate": 4.55e-05, |
|
"loss": 0.0096, |
|
"step": 954 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_LOCATION_f1": 0.8079470198675496, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7625, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7482993197278912, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6707317073170732, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.9019607843137256, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8846153846153846, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7887323943661972, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7368421052631579, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.23949624598026276, |
|
"eval_overall_accuracy": 0.9585354025218235, |
|
"eval_overall_f1": 0.8365122615803814, |
|
"eval_overall_precision": 0.7932816537467701, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 1.0163, |
|
"eval_samples_per_second": 183.996, |
|
"eval_steps_per_second": 2.952, |
|
"step": 954 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"grad_norm": 1.984230875968933, |
|
"learning_rate": 4.5e-05, |
|
"loss": 0.0077, |
|
"step": 1060 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_LOCATION_f1": 0.7922077922077921, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7297297297297298, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6506024096385542, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8996763754045306, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8742138364779874, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.806451612903226, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7352941176470589, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.26252666115760803, |
|
"eval_overall_accuracy": 0.9568380213385063, |
|
"eval_overall_f1": 0.8268456375838926, |
|
"eval_overall_precision": 0.7738693467336684, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.952, |
|
"eval_samples_per_second": 196.421, |
|
"eval_steps_per_second": 3.151, |
|
"step": 1060 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"grad_norm": 0.09802401065826416, |
|
"learning_rate": 4.4500000000000004e-05, |
|
"loss": 0.0059, |
|
"step": 1166 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_LOCATION_f1": 0.8400000000000001, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7974683544303798, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7659574468085107, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7105263157894737, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8823529411764707, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8653846153846154, |
|
"eval_PERSON_recall": 0.9, |
|
"eval_QUANTITY_f1": 0.8169014084507042, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7631578947368421, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.235382542014122, |
|
"eval_overall_accuracy": 0.9648399612027158, |
|
"eval_overall_f1": 0.8418156808803301, |
|
"eval_overall_precision": 0.8052631578947368, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.9545, |
|
"eval_samples_per_second": 195.917, |
|
"eval_steps_per_second": 3.143, |
|
"step": 1166 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"grad_norm": 0.4382927417755127, |
|
"learning_rate": 4.4000000000000006e-05, |
|
"loss": 0.0078, |
|
"step": 1272 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_LOCATION_f1": 0.8251748251748252, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.8194444444444444, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.8201438848920863, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7702702702702703, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.896103896103896, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8734177215189873, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.8115942028985507, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7777777777777778, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8771929824561403, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.21610549092292786, |
|
"eval_overall_accuracy": 0.9675072744907857, |
|
"eval_overall_f1": 0.8575418994413407, |
|
"eval_overall_precision": 0.8319783197831978, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.9504, |
|
"eval_samples_per_second": 196.751, |
|
"eval_steps_per_second": 3.156, |
|
"step": 1272 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"grad_norm": 2.4125523567199707, |
|
"learning_rate": 4.35e-05, |
|
"loss": 0.0044, |
|
"step": 1378 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_LOCATION_f1": 0.8181818181818181, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7590361445783133, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7552447552447553, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6923076923076923, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.9042904290429042, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8954248366013072, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.821917808219178, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.75, |
|
"eval_QUANTITY_recall": 0.9090909090909091, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.26299452781677246, |
|
"eval_overall_accuracy": 0.962172647914646, |
|
"eval_overall_f1": 0.8469945355191256, |
|
"eval_overall_precision": 0.8051948051948052, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.9454, |
|
"eval_samples_per_second": 197.792, |
|
"eval_steps_per_second": 3.173, |
|
"step": 1378 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"grad_norm": 0.6766614317893982, |
|
"learning_rate": 4.3e-05, |
|
"loss": 0.0047, |
|
"step": 1484 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_LOCATION_f1": 0.8493150684931506, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.8266666666666667, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7862068965517242, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7125, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8802588996763754, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8553459119496856, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.9090909090909091, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9259259259259259, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.25089046359062195, |
|
"eval_overall_accuracy": 0.9638700290979632, |
|
"eval_overall_f1": 0.8500687757909215, |
|
"eval_overall_precision": 0.8131578947368421, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.9494, |
|
"eval_samples_per_second": 196.976, |
|
"eval_steps_per_second": 3.16, |
|
"step": 1484 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"grad_norm": 2.052441358566284, |
|
"learning_rate": 4.25e-05, |
|
"loss": 0.0041, |
|
"step": 1590 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_LOCATION_f1": 0.8104575163398693, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7560975609756098, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7755102040816327, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6951219512195121, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8831168831168831, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8607594936708861, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.821917808219178, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.75, |
|
"eval_QUANTITY_recall": 0.9090909090909091, |
|
"eval_TIME_f1": 0.7619047619047619, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.6857142857142857, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.2882152795791626, |
|
"eval_overall_accuracy": 0.9580504364694471, |
|
"eval_overall_f1": 0.8306451612903226, |
|
"eval_overall_precision": 0.7783375314861462, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.9611, |
|
"eval_samples_per_second": 194.573, |
|
"eval_steps_per_second": 3.121, |
|
"step": 1590 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"grad_norm": 0.014275839552283287, |
|
"learning_rate": 4.2e-05, |
|
"loss": 0.0044, |
|
"step": 1696 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_LOCATION_f1": 0.8053691275167785, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7692307692307693, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7945205479452054, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7160493827160493, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.8910891089108911, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8823529411764706, |
|
"eval_PERSON_recall": 0.9, |
|
"eval_QUANTITY_f1": 0.8169014084507042, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7631578947368421, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.7741935483870968, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7058823529411765, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.26748523116111755, |
|
"eval_overall_accuracy": 0.9604752667313288, |
|
"eval_overall_f1": 0.8372093023255814, |
|
"eval_overall_precision": 0.796875, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.9645, |
|
"eval_samples_per_second": 193.888, |
|
"eval_steps_per_second": 3.111, |
|
"step": 1696 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"grad_norm": 0.5238301157951355, |
|
"learning_rate": 4.15e-05, |
|
"loss": 0.0032, |
|
"step": 1802 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_LOCATION_f1": 0.8299319727891157, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.8026315789473685, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7746478873239436, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7142857142857143, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8896103896103896, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8670886075949367, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.8000000000000002, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7567567567567568, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.7619047619047619, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.6857142857142857, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.28771573305130005, |
|
"eval_overall_accuracy": 0.9612027158098934, |
|
"eval_overall_f1": 0.8356164383561643, |
|
"eval_overall_precision": 0.7963446475195822, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.9538, |
|
"eval_samples_per_second": 196.063, |
|
"eval_steps_per_second": 3.145, |
|
"step": 1802 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"grad_norm": 0.005304540041834116, |
|
"learning_rate": 4.1e-05, |
|
"loss": 0.0034, |
|
"step": 1908 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_LOCATION_f1": 0.8133333333333335, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7721518987341772, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7552447552447553, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6923076923076923, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.894736842105263, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8831168831168831, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.821917808219178, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.75, |
|
"eval_QUANTITY_recall": 0.9090909090909091, |
|
"eval_TIME_f1": 0.8928571428571429, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8928571428571429, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.28492802381515503, |
|
"eval_overall_accuracy": 0.9614451988360815, |
|
"eval_overall_f1": 0.8429752066115703, |
|
"eval_overall_precision": 0.8073878627968337, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.9617, |
|
"eval_samples_per_second": 194.443, |
|
"eval_steps_per_second": 3.119, |
|
"step": 1908 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"grad_norm": 0.05048967897891998, |
|
"learning_rate": 4.05e-05, |
|
"loss": 0.0051, |
|
"step": 2014 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_LOCATION_f1": 0.8026315789473684, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7530864197530864, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7832167832167831, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.717948717948718, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8990228013029316, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8789808917197452, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.8571428571428571, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.8108108108108109, |
|
"eval_QUANTITY_recall": 0.9090909090909091, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.2656005918979645, |
|
"eval_overall_accuracy": 0.9643549951503395, |
|
"eval_overall_f1": 0.8493150684931507, |
|
"eval_overall_precision": 0.8093994778067886, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.9518, |
|
"eval_samples_per_second": 196.476, |
|
"eval_steps_per_second": 3.152, |
|
"step": 2014 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"grad_norm": 0.005232055671513081, |
|
"learning_rate": 4e-05, |
|
"loss": 0.0029, |
|
"step": 2120 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_LOCATION_f1": 0.7948717948717949, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7294117647058823, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7482014388489208, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7027027027027027, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.9032258064516129, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.875, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.823529411764706, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.8, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.819672131147541, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7575757575757576, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.2749578654766083, |
|
"eval_overall_accuracy": 0.9638700290979632, |
|
"eval_overall_f1": 0.8365122615803814, |
|
"eval_overall_precision": 0.7932816537467701, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.9399, |
|
"eval_samples_per_second": 198.964, |
|
"eval_steps_per_second": 3.192, |
|
"step": 2120 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"grad_norm": 20.893596649169922, |
|
"learning_rate": 3.9500000000000005e-05, |
|
"loss": 0.0051, |
|
"step": 2226 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"eval_LOCATION_f1": 0.8026315789473684, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7530864197530864, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7464788732394366, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6883116883116883, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.9084967320261438, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8910256410256411, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.8115942028985507, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7777777777777778, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8771929824561403, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.2634299099445343, |
|
"eval_overall_accuracy": 0.9643549951503395, |
|
"eval_overall_f1": 0.8429752066115703, |
|
"eval_overall_precision": 0.8073878627968337, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.9692, |
|
"eval_samples_per_second": 192.946, |
|
"eval_steps_per_second": 3.095, |
|
"step": 2226 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"grad_norm": 0.013275664299726486, |
|
"learning_rate": 3.9000000000000006e-05, |
|
"loss": 0.003, |
|
"step": 2332 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"eval_LOCATION_f1": 0.8243243243243243, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7922077922077922, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7417218543046358, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6511627906976745, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.9061488673139159, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8805031446540881, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.8333333333333333, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7692307692307693, |
|
"eval_QUANTITY_recall": 0.9090909090909091, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.2914196252822876, |
|
"eval_overall_accuracy": 0.9614451988360815, |
|
"eval_overall_f1": 0.8455284552845529, |
|
"eval_overall_precision": 0.7979539641943734, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.9669, |
|
"eval_samples_per_second": 193.405, |
|
"eval_steps_per_second": 3.103, |
|
"step": 2332 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"grad_norm": 0.05714813619852066, |
|
"learning_rate": 3.85e-05, |
|
"loss": 0.0035, |
|
"step": 2438 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"eval_LOCATION_f1": 0.8435374149659864, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.8157894736842105, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.76056338028169, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7012987012987013, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.9084967320261438, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8910256410256411, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.8115942028985507, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7777777777777778, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8771929824561403, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.2690264582633972, |
|
"eval_overall_accuracy": 0.9645974781765276, |
|
"eval_overall_f1": 0.8543689320388349, |
|
"eval_overall_precision": 0.8235294117647058, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.943, |
|
"eval_samples_per_second": 198.31, |
|
"eval_steps_per_second": 3.181, |
|
"step": 2438 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"grad_norm": 8.982757568359375, |
|
"learning_rate": 3.8e-05, |
|
"loss": 0.0024, |
|
"step": 2544 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_LOCATION_f1": 0.7924528301886792, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7159090909090909, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7549668874172185, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6627906976744186, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.9108910891089109, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.9019607843137255, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.8333333333333333, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7692307692307693, |
|
"eval_QUANTITY_recall": 0.9090909090909091, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.301530122756958, |
|
"eval_overall_accuracy": 0.9602327837051406, |
|
"eval_overall_f1": 0.8425302826379543, |
|
"eval_overall_precision": 0.7904040404040404, |
|
"eval_overall_recall": 0.9020172910662824, |
|
"eval_runtime": 0.9593, |
|
"eval_samples_per_second": 194.925, |
|
"eval_steps_per_second": 3.127, |
|
"step": 2544 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"grad_norm": 0.10265465825796127, |
|
"learning_rate": 3.7500000000000003e-05, |
|
"loss": 0.0032, |
|
"step": 2650 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_LOCATION_f1": 0.8157894736842104, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7654320987654321, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7971014492753623, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7534246575342466, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.9, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.9, |
|
"eval_PERSON_recall": 0.9, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8771929824561403, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.2815525233745575, |
|
"eval_overall_accuracy": 0.9636275460717749, |
|
"eval_overall_f1": 0.851182197496523, |
|
"eval_overall_precision": 0.8225806451612904, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.9507, |
|
"eval_samples_per_second": 196.688, |
|
"eval_steps_per_second": 3.155, |
|
"step": 2650 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"grad_norm": 0.0032238499261438847, |
|
"learning_rate": 3.7e-05, |
|
"loss": 0.003, |
|
"step": 2756 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"eval_LOCATION_f1": 0.8344370860927152, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7875, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7659574468085107, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7105263157894737, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.9042904290429042, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8954248366013072, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.8333333333333333, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7692307692307693, |
|
"eval_QUANTITY_recall": 0.9090909090909091, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.28177666664123535, |
|
"eval_overall_accuracy": 0.9636275460717749, |
|
"eval_overall_f1": 0.8508287292817679, |
|
"eval_overall_precision": 0.8169761273209549, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.9649, |
|
"eval_samples_per_second": 193.801, |
|
"eval_steps_per_second": 3.109, |
|
"step": 2756 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"grad_norm": 0.03518635779619217, |
|
"learning_rate": 3.65e-05, |
|
"loss": 0.0016, |
|
"step": 2862 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"eval_LOCATION_f1": 0.8133333333333335, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7721518987341772, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7777777777777778, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7088607594936709, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.9144736842105262, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.9025974025974026, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8771929824561403, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.2842986285686493, |
|
"eval_overall_accuracy": 0.9648399612027158, |
|
"eval_overall_f1": 0.8528198074277854, |
|
"eval_overall_precision": 0.8157894736842105, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 1.03, |
|
"eval_samples_per_second": 181.562, |
|
"eval_steps_per_second": 2.913, |
|
"step": 2862 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"grad_norm": 0.01968814805150032, |
|
"learning_rate": 3.6e-05, |
|
"loss": 0.0025, |
|
"step": 2968 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"eval_LOCATION_f1": 0.8366013071895425, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7804878048780488, |
|
"eval_LOCATION_recall": 0.9014084507042254, |
|
"eval_ORGANIZATION_f1": 0.8028169014084509, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7402597402597403, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.9042904290429042, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8954248366013072, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7714285714285715, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7297297297297297, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.3238835334777832, |
|
"eval_overall_accuracy": 0.960717749757517, |
|
"eval_overall_f1": 0.8512396694214875, |
|
"eval_overall_precision": 0.8153034300791556, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.9375, |
|
"eval_samples_per_second": 199.463, |
|
"eval_steps_per_second": 3.2, |
|
"step": 2968 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"grad_norm": 0.005619656760245562, |
|
"learning_rate": 3.55e-05, |
|
"loss": 0.0026, |
|
"step": 3074 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"eval_LOCATION_f1": 0.8421052631578947, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7901234567901234, |
|
"eval_LOCATION_recall": 0.9014084507042254, |
|
"eval_ORGANIZATION_f1": 0.8111888111888114, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7435897435897436, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.9042904290429042, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8954248366013072, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.3090417683124542, |
|
"eval_overall_accuracy": 0.965082444228904, |
|
"eval_overall_f1": 0.8575342465753425, |
|
"eval_overall_precision": 0.8172323759791122, |
|
"eval_overall_recall": 0.9020172910662824, |
|
"eval_runtime": 0.9535, |
|
"eval_samples_per_second": 196.122, |
|
"eval_steps_per_second": 3.146, |
|
"step": 3074 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"grad_norm": 0.0475270040333271, |
|
"learning_rate": 3.5e-05, |
|
"loss": 0.0041, |
|
"step": 3180 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"eval_LOCATION_f1": 0.8211920529801324, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.775, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7703703703703704, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7428571428571429, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.9114754098360656, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.896774193548387, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.30209869146347046, |
|
"eval_overall_accuracy": 0.9626576139670223, |
|
"eval_overall_f1": 0.8464730290456433, |
|
"eval_overall_precision": 0.8138297872340425, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.9526, |
|
"eval_samples_per_second": 196.299, |
|
"eval_steps_per_second": 3.149, |
|
"step": 3180 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"grad_norm": 0.6186401844024658, |
|
"learning_rate": 3.45e-05, |
|
"loss": 0.0054, |
|
"step": 3286 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"eval_LOCATION_f1": 0.8181818181818181, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7590361445783133, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.759124087591241, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7222222222222222, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.9025974025974027, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.879746835443038, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.75, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.6666666666666666, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.3126040995121002, |
|
"eval_overall_accuracy": 0.9595053346265762, |
|
"eval_overall_f1": 0.8353741496598639, |
|
"eval_overall_precision": 0.7912371134020618, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.9488, |
|
"eval_samples_per_second": 197.092, |
|
"eval_steps_per_second": 3.162, |
|
"step": 3286 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"grad_norm": 0.001890498329885304, |
|
"learning_rate": 3.4000000000000007e-05, |
|
"loss": 0.002, |
|
"step": 3392 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"eval_LOCATION_f1": 0.8243243243243243, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7922077922077922, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7737226277372263, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7361111111111112, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.9078947368421053, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8961038961038961, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.31118687987327576, |
|
"eval_overall_accuracy": 0.9629000969932104, |
|
"eval_overall_f1": 0.8448753462603877, |
|
"eval_overall_precision": 0.8133333333333334, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.9533, |
|
"eval_samples_per_second": 196.155, |
|
"eval_steps_per_second": 3.147, |
|
"step": 3392 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"grad_norm": 0.4719323217868805, |
|
"learning_rate": 3.35e-05, |
|
"loss": 0.0023, |
|
"step": 3498 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"eval_LOCATION_f1": 0.8476821192052981, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.8, |
|
"eval_LOCATION_recall": 0.9014084507042254, |
|
"eval_ORGANIZATION_f1": 0.7703703703703704, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7428571428571429, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.9078947368421053, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8961038961038961, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.3178064227104187, |
|
"eval_overall_accuracy": 0.9638700290979632, |
|
"eval_overall_f1": 0.853185595567867, |
|
"eval_overall_precision": 0.8213333333333334, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.9706, |
|
"eval_samples_per_second": 192.671, |
|
"eval_steps_per_second": 3.091, |
|
"step": 3498 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"grad_norm": 0.008191280998289585, |
|
"learning_rate": 3.3e-05, |
|
"loss": 0.0045, |
|
"step": 3604 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"eval_LOCATION_f1": 0.8456375838926176, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7777777777777778, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7088607594936709, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8859934853420196, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8662420382165605, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.8450704225352113, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7894736842105263, |
|
"eval_QUANTITY_recall": 0.9090909090909091, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.2925824224948883, |
|
"eval_overall_accuracy": 0.9638700290979632, |
|
"eval_overall_f1": 0.8454172366621068, |
|
"eval_overall_precision": 0.8046875, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.9524, |
|
"eval_samples_per_second": 196.348, |
|
"eval_steps_per_second": 3.15, |
|
"step": 3604 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"grad_norm": 0.005140832159668207, |
|
"learning_rate": 3.2500000000000004e-05, |
|
"loss": 0.0026, |
|
"step": 3710 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"eval_LOCATION_f1": 0.8387096774193548, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7738095238095238, |
|
"eval_LOCATION_recall": 0.9154929577464789, |
|
"eval_ORGANIZATION_f1": 0.7375, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6210526315789474, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.9114754098360656, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.896774193548387, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.78125, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.6944444444444444, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.3151751160621643, |
|
"eval_overall_accuracy": 0.9580504364694471, |
|
"eval_overall_f1": 0.8375165125495376, |
|
"eval_overall_precision": 0.7731707317073171, |
|
"eval_overall_recall": 0.9135446685878963, |
|
"eval_runtime": 0.9517, |
|
"eval_samples_per_second": 196.484, |
|
"eval_steps_per_second": 3.152, |
|
"step": 3710 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"grad_norm": 0.002234996994957328, |
|
"learning_rate": 3.2000000000000005e-05, |
|
"loss": 0.0017, |
|
"step": 3816 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"eval_LOCATION_f1": 0.8356164383561644, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.8133333333333334, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.8059701492537313, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.782608695652174, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.9114754098360656, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.896774193548387, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.8285714285714285, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7837837837837838, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8571428571428571, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8571428571428571, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.27503567934036255, |
|
"eval_overall_accuracy": 0.9670223084384093, |
|
"eval_overall_f1": 0.8635724331926864, |
|
"eval_overall_precision": 0.8434065934065934, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 1.0319, |
|
"eval_samples_per_second": 181.221, |
|
"eval_steps_per_second": 2.907, |
|
"step": 3816 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"grad_norm": 2.4394583702087402, |
|
"learning_rate": 3.15e-05, |
|
"loss": 0.0016, |
|
"step": 3922 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"eval_LOCATION_f1": 0.8456375838926176, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7755102040816327, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6951219512195121, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8867313915857605, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8616352201257862, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.3136846423149109, |
|
"eval_overall_accuracy": 0.9595053346265762, |
|
"eval_overall_f1": 0.8439620081411126, |
|
"eval_overall_precision": 0.7974358974358975, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.9561, |
|
"eval_samples_per_second": 195.586, |
|
"eval_steps_per_second": 3.138, |
|
"step": 3922 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"grad_norm": 0.02068762294948101, |
|
"learning_rate": 3.1e-05, |
|
"loss": 0.002, |
|
"step": 4028 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"eval_LOCATION_f1": 0.8163265306122449, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7894736842105263, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7619047619047619, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6829268292682927, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.9114754098360656, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.896774193548387, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.31167086958885193, |
|
"eval_overall_accuracy": 0.9609602327837051, |
|
"eval_overall_f1": 0.8431105047748976, |
|
"eval_overall_precision": 0.8005181347150259, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.9533, |
|
"eval_samples_per_second": 196.17, |
|
"eval_steps_per_second": 3.147, |
|
"step": 4028 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"grad_norm": 0.004659323953092098, |
|
"learning_rate": 3.05e-05, |
|
"loss": 0.0031, |
|
"step": 4134 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"eval_LOCATION_f1": 0.8421052631578947, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7901234567901234, |
|
"eval_LOCATION_recall": 0.9014084507042254, |
|
"eval_ORGANIZATION_f1": 0.7682119205298013, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6744186046511628, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.9114754098360656, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.896774193548387, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.823529411764706, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.8, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.819672131147541, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7575757575757576, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.3022630512714386, |
|
"eval_overall_accuracy": 0.9609602327837051, |
|
"eval_overall_f1": 0.8521031207598372, |
|
"eval_overall_precision": 0.8051282051282052, |
|
"eval_overall_recall": 0.9048991354466859, |
|
"eval_runtime": 0.9507, |
|
"eval_samples_per_second": 196.705, |
|
"eval_steps_per_second": 3.156, |
|
"step": 4134 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"grad_norm": 0.5910449624061584, |
|
"learning_rate": 3e-05, |
|
"loss": 0.0018, |
|
"step": 4240 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"eval_LOCATION_f1": 0.8079470198675496, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7625, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7763157894736842, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6781609195402298, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.9055374592833875, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8853503184713376, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.8000000000000002, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7567567567567568, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.31180375814437866, |
|
"eval_overall_accuracy": 0.9619301648884578, |
|
"eval_overall_f1": 0.8416779431664412, |
|
"eval_overall_precision": 0.7933673469387755, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.9409, |
|
"eval_samples_per_second": 198.747, |
|
"eval_steps_per_second": 3.188, |
|
"step": 4240 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"grad_norm": 0.0014322897186502814, |
|
"learning_rate": 2.95e-05, |
|
"loss": 0.0022, |
|
"step": 4346 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"eval_LOCATION_f1": 0.8187919463087248, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.782051282051282, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7832167832167831, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.717948717948718, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.9036544850498339, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.9006622516556292, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.8285714285714285, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7837837837837838, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.2662249207496643, |
|
"eval_overall_accuracy": 0.9636275460717749, |
|
"eval_overall_f1": 0.8515950069348127, |
|
"eval_overall_precision": 0.820855614973262, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.9578, |
|
"eval_samples_per_second": 195.232, |
|
"eval_steps_per_second": 3.132, |
|
"step": 4346 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"grad_norm": 0.0011240842286497355, |
|
"learning_rate": 2.9e-05, |
|
"loss": 0.0006, |
|
"step": 4452 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"eval_LOCATION_f1": 0.7866666666666666, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7468354430379747, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7712418300653594, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6704545454545454, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.9019607843137256, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8846153846153846, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.3214167058467865, |
|
"eval_overall_accuracy": 0.9597478176527643, |
|
"eval_overall_f1": 0.8373983739837398, |
|
"eval_overall_precision": 0.7902813299232737, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.9589, |
|
"eval_samples_per_second": 195.011, |
|
"eval_steps_per_second": 3.129, |
|
"step": 4452 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"grad_norm": 0.0019562048837542534, |
|
"learning_rate": 2.8499999999999998e-05, |
|
"loss": 0.0011, |
|
"step": 4558 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"eval_LOCATION_f1": 0.7712418300653594, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7195121951219512, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7785234899328859, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6904761904761905, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.9144736842105262, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.9025974025974026, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.8169014084507042, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7631578947368421, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.3223561942577362, |
|
"eval_overall_accuracy": 0.9616876818622696, |
|
"eval_overall_f1": 0.8408163265306122, |
|
"eval_overall_precision": 0.7963917525773195, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.9419, |
|
"eval_samples_per_second": 198.529, |
|
"eval_steps_per_second": 3.185, |
|
"step": 4558 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"grad_norm": 0.004401817452162504, |
|
"learning_rate": 2.8000000000000003e-05, |
|
"loss": 0.0015, |
|
"step": 4664 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"eval_LOCATION_f1": 0.8344370860927152, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7875, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7402597402597403, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6404494382022472, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.9013157894736842, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8896103896103896, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.8571428571428571, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.8108108108108109, |
|
"eval_QUANTITY_recall": 0.9090909090909091, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.30491575598716736, |
|
"eval_overall_accuracy": 0.9619301648884578, |
|
"eval_overall_f1": 0.8428184281842819, |
|
"eval_overall_precision": 0.7953964194373402, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.9628, |
|
"eval_samples_per_second": 194.222, |
|
"eval_steps_per_second": 3.116, |
|
"step": 4664 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"grad_norm": 0.032622966915369034, |
|
"learning_rate": 2.7500000000000004e-05, |
|
"loss": 0.0023, |
|
"step": 4770 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"eval_LOCATION_f1": 0.8187919463087248, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.782051282051282, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.763888888888889, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6962025316455697, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8933333333333333, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8933333333333333, |
|
"eval_PERSON_recall": 0.8933333333333333, |
|
"eval_QUANTITY_f1": 0.8529411764705883, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.8285714285714286, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.26732492446899414, |
|
"eval_overall_accuracy": 0.9648399612027158, |
|
"eval_overall_f1": 0.8440111420612814, |
|
"eval_overall_precision": 0.816711590296496, |
|
"eval_overall_recall": 0.8731988472622478, |
|
"eval_runtime": 1.0306, |
|
"eval_samples_per_second": 181.45, |
|
"eval_steps_per_second": 2.911, |
|
"step": 4770 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"grad_norm": 0.009263483807444572, |
|
"learning_rate": 2.7000000000000002e-05, |
|
"loss": 0.0015, |
|
"step": 4876 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"eval_LOCATION_f1": 0.8435374149659864, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.8157894736842105, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7769784172661871, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7297297297297297, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.913907284768212, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.9078947368421053, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.8285714285714285, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7837837837837838, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.2788328230381012, |
|
"eval_overall_accuracy": 0.9662948593598448, |
|
"eval_overall_f1": 0.8587412587412588, |
|
"eval_overall_precision": 0.8342391304347826, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.9441, |
|
"eval_samples_per_second": 198.082, |
|
"eval_steps_per_second": 3.178, |
|
"step": 4876 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"grad_norm": 0.016023587435483932, |
|
"learning_rate": 2.6500000000000004e-05, |
|
"loss": 0.0019, |
|
"step": 4982 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"eval_LOCATION_f1": 0.8513513513513514, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.8235294117647058, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7887323943661971, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.9169435215946843, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.9139072847682119, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.2903594672679901, |
|
"eval_overall_accuracy": 0.9670223084384093, |
|
"eval_overall_f1": 0.8671328671328672, |
|
"eval_overall_precision": 0.842391304347826, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.9543, |
|
"eval_samples_per_second": 195.955, |
|
"eval_steps_per_second": 3.144, |
|
"step": 4982 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"grad_norm": 0.0013861858751624823, |
|
"learning_rate": 2.6000000000000002e-05, |
|
"loss": 0.0016, |
|
"step": 5088 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.759493670886076, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7755102040816327, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6951219512195121, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.9174917491749175, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.9084967320261438, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.30562856793403625, |
|
"eval_overall_accuracy": 0.962172647914646, |
|
"eval_overall_f1": 0.8454172366621068, |
|
"eval_overall_precision": 0.8046875, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.953, |
|
"eval_samples_per_second": 196.222, |
|
"eval_steps_per_second": 3.148, |
|
"step": 5088 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"grad_norm": 0.004494914319366217, |
|
"learning_rate": 2.5500000000000003e-05, |
|
"loss": 0.0021, |
|
"step": 5194 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"eval_LOCATION_f1": 0.8266666666666665, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7848101265822784, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7913669064748202, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7432432432432432, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.913907284768212, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.9078947368421053, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.8285714285714285, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7837837837837838, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.30186086893081665, |
|
"eval_overall_accuracy": 0.9643549951503395, |
|
"eval_overall_f1": 0.8583333333333334, |
|
"eval_overall_precision": 0.8284182305630027, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.9632, |
|
"eval_samples_per_second": 194.143, |
|
"eval_steps_per_second": 3.115, |
|
"step": 5194 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"grad_norm": 0.07165616750717163, |
|
"learning_rate": 2.5e-05, |
|
"loss": 0.0013, |
|
"step": 5300 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"eval_LOCATION_f1": 0.794701986754967, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.75, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.76056338028169, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7012987012987013, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.9084967320261438, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8910256410256411, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.8285714285714285, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7837837837837838, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.3192538917064667, |
|
"eval_overall_accuracy": 0.9604752667313288, |
|
"eval_overall_f1": 0.8395061728395062, |
|
"eval_overall_precision": 0.8010471204188482, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.9477, |
|
"eval_samples_per_second": 197.324, |
|
"eval_steps_per_second": 3.166, |
|
"step": 5300 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"grad_norm": 0.0017693530535325408, |
|
"learning_rate": 2.45e-05, |
|
"loss": 0.0013, |
|
"step": 5406 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"eval_LOCATION_f1": 0.8187919463087248, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.782051282051282, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7808219178082192, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7037037037037037, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.9055374592833875, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8853503184713376, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.8285714285714285, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7837837837837838, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.3206080496311188, |
|
"eval_overall_accuracy": 0.9616876818622696, |
|
"eval_overall_f1": 0.850480109739369, |
|
"eval_overall_precision": 0.8115183246073299, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.9406, |
|
"eval_samples_per_second": 198.804, |
|
"eval_steps_per_second": 3.189, |
|
"step": 5406 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"grad_norm": 0.077069491147995, |
|
"learning_rate": 2.4e-05, |
|
"loss": 0.0014, |
|
"step": 5512 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"eval_LOCATION_f1": 0.8299319727891157, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.8026315789473685, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7801418439716312, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7236842105263158, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.9144736842105262, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.9025974025974026, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.8285714285714285, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7837837837837838, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.29891258478164673, |
|
"eval_overall_accuracy": 0.9653249272550921, |
|
"eval_overall_f1": 0.8567454798331016, |
|
"eval_overall_precision": 0.8279569892473119, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.9575, |
|
"eval_samples_per_second": 195.296, |
|
"eval_steps_per_second": 3.133, |
|
"step": 5512 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"grad_norm": 0.002096625277772546, |
|
"learning_rate": 2.35e-05, |
|
"loss": 0.0007, |
|
"step": 5618 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"eval_LOCATION_f1": 0.8194444444444445, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.8082191780821918, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7913669064748202, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7432432432432432, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.9042904290429042, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8954248366013072, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.8405797101449276, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.8055555555555556, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8928571428571429, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8928571428571429, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.30264776945114136, |
|
"eval_overall_accuracy": 0.9672647914645974, |
|
"eval_overall_f1": 0.8579465541490857, |
|
"eval_overall_precision": 0.8379120879120879, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.951, |
|
"eval_samples_per_second": 196.632, |
|
"eval_steps_per_second": 3.155, |
|
"step": 5618 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"grad_norm": 0.001791234826669097, |
|
"learning_rate": 2.3000000000000003e-05, |
|
"loss": 0.0014, |
|
"step": 5724 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"eval_LOCATION_f1": 0.8243243243243243, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7922077922077922, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.8055555555555556, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7341772151898734, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.8983606557377048, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8838709677419355, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.8529411764705883, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.8285714285714286, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8771929824561403, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.305812805891037, |
|
"eval_overall_accuracy": 0.9670223084384093, |
|
"eval_overall_f1": 0.8587257617728532, |
|
"eval_overall_precision": 0.8266666666666667, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.9512, |
|
"eval_samples_per_second": 196.589, |
|
"eval_steps_per_second": 3.154, |
|
"step": 5724 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"grad_norm": 0.0006963410996831954, |
|
"learning_rate": 2.25e-05, |
|
"loss": 0.0013, |
|
"step": 5830 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"eval_LOCATION_f1": 0.8133333333333335, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7721518987341772, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7826086956521738, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7397260273972602, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.9084967320261438, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8910256410256411, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7714285714285715, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7297297297297297, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.31985101103782654, |
|
"eval_overall_accuracy": 0.9619301648884578, |
|
"eval_overall_f1": 0.8448753462603877, |
|
"eval_overall_precision": 0.8133333333333334, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.9536, |
|
"eval_samples_per_second": 196.106, |
|
"eval_steps_per_second": 3.146, |
|
"step": 5830 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"grad_norm": 0.004016083665192127, |
|
"learning_rate": 2.2000000000000003e-05, |
|
"loss": 0.002, |
|
"step": 5936 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"eval_LOCATION_f1": 0.8266666666666665, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7848101265822784, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7971014492753623, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7534246575342466, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.9084967320261438, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8910256410256411, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.33322784304618835, |
|
"eval_overall_accuracy": 0.962172647914646, |
|
"eval_overall_f1": 0.8524137931034482, |
|
"eval_overall_precision": 0.8174603174603174, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.9475, |
|
"eval_samples_per_second": 197.363, |
|
"eval_steps_per_second": 3.166, |
|
"step": 5936 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"grad_norm": 0.002730452921241522, |
|
"learning_rate": 2.15e-05, |
|
"loss": 0.0006, |
|
"step": 6042 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"eval_LOCATION_f1": 0.8211920529801324, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.775, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7862068965517242, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7125, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.9084967320261438, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8910256410256411, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.8169014084507042, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7631578947368421, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.3458655774593353, |
|
"eval_overall_accuracy": 0.9612027158098934, |
|
"eval_overall_f1": 0.8497267759562841, |
|
"eval_overall_precision": 0.8077922077922078, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.9455, |
|
"eval_samples_per_second": 197.779, |
|
"eval_steps_per_second": 3.173, |
|
"step": 6042 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"grad_norm": 0.0037386000622063875, |
|
"learning_rate": 2.1e-05, |
|
"loss": 0.0014, |
|
"step": 6148 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"eval_LOCATION_f1": 0.8079470198675496, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7625, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.802721088435374, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7195121951219512, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.9049180327868852, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8903225806451613, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.8169014084507042, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7631578947368421, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.32678091526031494, |
|
"eval_overall_accuracy": 0.9614451988360815, |
|
"eval_overall_f1": 0.8485675306957708, |
|
"eval_overall_precision": 0.805699481865285, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.9604, |
|
"eval_samples_per_second": 194.708, |
|
"eval_steps_per_second": 3.124, |
|
"step": 6148 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"grad_norm": 0.0023347027599811554, |
|
"learning_rate": 2.05e-05, |
|
"loss": 0.0012, |
|
"step": 6254 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"eval_LOCATION_f1": 0.8181818181818181, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7590361445783133, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7631578947368421, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.9042904290429042, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8954248366013072, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.8450704225352113, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7894736842105263, |
|
"eval_QUANTITY_recall": 0.9090909090909091, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.3488438129425049, |
|
"eval_overall_accuracy": 0.9604752667313288, |
|
"eval_overall_f1": 0.8455284552845529, |
|
"eval_overall_precision": 0.7979539641943734, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.9526, |
|
"eval_samples_per_second": 196.312, |
|
"eval_steps_per_second": 3.149, |
|
"step": 6254 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"grad_norm": 0.0007857033051550388, |
|
"learning_rate": 2e-05, |
|
"loss": 0.0015, |
|
"step": 6360 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"eval_LOCATION_f1": 0.8133333333333335, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7721518987341772, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7724137931034483, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.9108910891089109, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.9019607843137255, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.8285714285714285, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7837837837837838, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.3345150947570801, |
|
"eval_overall_accuracy": 0.962172647914646, |
|
"eval_overall_f1": 0.8528198074277854, |
|
"eval_overall_precision": 0.8157894736842105, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.9473, |
|
"eval_samples_per_second": 197.404, |
|
"eval_steps_per_second": 3.167, |
|
"step": 6360 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"grad_norm": 0.0016401028260588646, |
|
"learning_rate": 1.9500000000000003e-05, |
|
"loss": 0.0005, |
|
"step": 6466 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"eval_LOCATION_f1": 0.8157894736842104, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7654320987654321, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.8, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7466666666666667, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.9078947368421053, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8961038961038961, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.8450704225352113, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7894736842105263, |
|
"eval_QUANTITY_recall": 0.9090909090909091, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.3476317226886749, |
|
"eval_overall_accuracy": 0.9624151309408342, |
|
"eval_overall_f1": 0.8539944903581268, |
|
"eval_overall_precision": 0.8179419525065963, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.9315, |
|
"eval_samples_per_second": 200.75, |
|
"eval_steps_per_second": 3.221, |
|
"step": 6466 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"grad_norm": 0.02758892811834812, |
|
"learning_rate": 1.9e-05, |
|
"loss": 0.001, |
|
"step": 6572 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"eval_LOCATION_f1": 0.8211920529801324, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.775, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.8028169014084509, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7402597402597403, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.9078947368421053, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8961038961038961, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.8285714285714285, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7837837837837838, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.3546055257320404, |
|
"eval_overall_accuracy": 0.9633850630455868, |
|
"eval_overall_f1": 0.8539944903581268, |
|
"eval_overall_precision": 0.8179419525065963, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.9503, |
|
"eval_samples_per_second": 196.775, |
|
"eval_steps_per_second": 3.157, |
|
"step": 6572 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"grad_norm": 0.32324543595314026, |
|
"learning_rate": 1.85e-05, |
|
"loss": 0.0008, |
|
"step": 6678 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"eval_LOCATION_f1": 0.8026315789473684, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7530864197530864, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7862068965517242, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7125, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.9049180327868852, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8903225806451613, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.8571428571428571, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.8108108108108109, |
|
"eval_QUANTITY_recall": 0.9090909090909091, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.3560656011104584, |
|
"eval_overall_accuracy": 0.9616876818622696, |
|
"eval_overall_f1": 0.8481532147742818, |
|
"eval_overall_precision": 0.8072916666666666, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.9525, |
|
"eval_samples_per_second": 196.325, |
|
"eval_steps_per_second": 3.15, |
|
"step": 6678 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"grad_norm": 0.0021076402626931667, |
|
"learning_rate": 1.8e-05, |
|
"loss": 0.0012, |
|
"step": 6784 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"eval_LOCATION_f1": 0.8344370860927152, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7875, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7887323943661972, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7272727272727273, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.9144736842105262, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.9025974025974026, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.8285714285714285, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7837837837837838, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.33117640018463135, |
|
"eval_overall_accuracy": 0.9624151309408342, |
|
"eval_overall_f1": 0.8567493112947657, |
|
"eval_overall_precision": 0.820580474934037, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.9576, |
|
"eval_samples_per_second": 195.279, |
|
"eval_steps_per_second": 3.133, |
|
"step": 6784 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"grad_norm": 0.27350062131881714, |
|
"learning_rate": 1.75e-05, |
|
"loss": 0.0017, |
|
"step": 6890 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"eval_LOCATION_f1": 0.7894736842105262, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7407407407407407, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7913669064748202, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7432432432432432, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.9055374592833875, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8853503184713376, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.8450704225352113, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7894736842105263, |
|
"eval_QUANTITY_recall": 0.9090909090909091, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.3442927598953247, |
|
"eval_overall_accuracy": 0.9602327837051406, |
|
"eval_overall_f1": 0.8461538461538461, |
|
"eval_overall_precision": 0.8083989501312336, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.953, |
|
"eval_samples_per_second": 196.22, |
|
"eval_steps_per_second": 3.148, |
|
"step": 6890 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"grad_norm": 0.7737051248550415, |
|
"learning_rate": 1.7000000000000003e-05, |
|
"loss": 0.0005, |
|
"step": 6996 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"eval_LOCATION_f1": 0.7763157894736843, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7283950617283951, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7913669064748202, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7432432432432432, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.9055374592833875, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8853503184713376, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.8169014084507042, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7631578947368421, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.7868852459016394, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.3465050756931305, |
|
"eval_overall_accuracy": 0.9602327837051406, |
|
"eval_overall_f1": 0.8383561643835616, |
|
"eval_overall_precision": 0.7989556135770235, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.9746, |
|
"eval_samples_per_second": 191.87, |
|
"eval_steps_per_second": 3.078, |
|
"step": 6996 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"grad_norm": 0.0003085023781750351, |
|
"learning_rate": 1.65e-05, |
|
"loss": 0.0004, |
|
"step": 7102 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"eval_LOCATION_f1": 0.8266666666666665, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7848101265822784, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.8115942028985507, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7671232876712328, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.9114754098360656, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.896774193548387, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.8450704225352113, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7894736842105263, |
|
"eval_QUANTITY_recall": 0.9090909090909091, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.3288689851760864, |
|
"eval_overall_accuracy": 0.9638700290979632, |
|
"eval_overall_f1": 0.8591160220994475, |
|
"eval_overall_precision": 0.8249336870026526, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.9508, |
|
"eval_samples_per_second": 196.673, |
|
"eval_steps_per_second": 3.155, |
|
"step": 7102 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"grad_norm": 0.0015671561704948545, |
|
"learning_rate": 1.6000000000000003e-05, |
|
"loss": 0.0002, |
|
"step": 7208 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"eval_LOCATION_f1": 0.832214765100671, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7948717948717948, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.8, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7466666666666667, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.9144736842105262, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.9025974025974026, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.8450704225352113, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7894736842105263, |
|
"eval_QUANTITY_recall": 0.9090909090909091, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.33385857939720154, |
|
"eval_overall_accuracy": 0.9641125121241513, |
|
"eval_overall_f1": 0.8591160220994475, |
|
"eval_overall_precision": 0.8249336870026526, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.9543, |
|
"eval_samples_per_second": 195.947, |
|
"eval_steps_per_second": 3.144, |
|
"step": 7208 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"grad_norm": 0.0012689490104094148, |
|
"learning_rate": 1.55e-05, |
|
"loss": 0.0006, |
|
"step": 7314 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"eval_LOCATION_f1": 0.8400000000000001, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7974683544303798, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7215189873417722, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6129032258064516, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.9078947368421053, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8961038961038961, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.8285714285714285, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7837837837837838, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.35171428322792053, |
|
"eval_overall_accuracy": 0.9580504364694471, |
|
"eval_overall_f1": 0.8382749326145552, |
|
"eval_overall_precision": 0.7873417721518987, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.953, |
|
"eval_samples_per_second": 196.232, |
|
"eval_steps_per_second": 3.148, |
|
"step": 7314 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"grad_norm": 0.00089789874618873, |
|
"learning_rate": 1.5e-05, |
|
"loss": 0.001, |
|
"step": 7420 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"eval_LOCATION_f1": 0.8378378378378378, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.8051948051948052, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7913669064748202, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7432432432432432, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.9049180327868852, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8903225806451613, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.8285714285714285, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7837837837837838, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.32278671860694885, |
|
"eval_overall_accuracy": 0.9648399612027158, |
|
"eval_overall_f1": 0.853185595567867, |
|
"eval_overall_precision": 0.8213333333333334, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 1.0201, |
|
"eval_samples_per_second": 183.317, |
|
"eval_steps_per_second": 2.941, |
|
"step": 7420 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"grad_norm": 0.001998705556616187, |
|
"learning_rate": 1.45e-05, |
|
"loss": 0.0002, |
|
"step": 7526 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"eval_LOCATION_f1": 0.8400000000000001, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7974683544303798, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.8111888111888114, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7435897435897436, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.9049180327868852, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8903225806451613, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.8285714285714285, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7837837837837838, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.3305073380470276, |
|
"eval_overall_accuracy": 0.9633850630455868, |
|
"eval_overall_f1": 0.8571428571428571, |
|
"eval_overall_precision": 0.8188976377952756, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.9607, |
|
"eval_samples_per_second": 194.654, |
|
"eval_steps_per_second": 3.123, |
|
"step": 7526 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"grad_norm": 0.0005069375038146973, |
|
"learning_rate": 1.4000000000000001e-05, |
|
"loss": 0.0006, |
|
"step": 7632 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"eval_LOCATION_f1": 0.8356164383561644, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.8133333333333334, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7826086956521738, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7397260273972602, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.9271523178807947, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.9210526315789473, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.8000000000000002, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7567567567567568, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.30825239419937134, |
|
"eval_overall_accuracy": 0.9675072744907857, |
|
"eval_overall_f1": 0.8575418994413407, |
|
"eval_overall_precision": 0.8319783197831978, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.9597, |
|
"eval_samples_per_second": 194.861, |
|
"eval_steps_per_second": 3.126, |
|
"step": 7632 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"grad_norm": 0.0007079507340677083, |
|
"learning_rate": 1.3500000000000001e-05, |
|
"loss": 0.0003, |
|
"step": 7738 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"eval_LOCATION_f1": 0.8266666666666665, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7848101265822784, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7857142857142856, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7333333333333333, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.9205298013245033, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.9144736842105263, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.8000000000000002, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7567567567567568, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.3165390193462372, |
|
"eval_overall_accuracy": 0.9667798254122212, |
|
"eval_overall_f1": 0.853185595567867, |
|
"eval_overall_precision": 0.8213333333333334, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.9558, |
|
"eval_samples_per_second": 195.657, |
|
"eval_steps_per_second": 3.139, |
|
"step": 7738 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"grad_norm": 0.00018394706421531737, |
|
"learning_rate": 1.3000000000000001e-05, |
|
"loss": 0.0002, |
|
"step": 7844 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"eval_LOCATION_f1": 0.8053691275167785, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7692307692307693, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.8085106382978723, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.75, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.9235880398671096, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.9205298013245033, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.8000000000000002, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7567567567567568, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.31818944215774536, |
|
"eval_overall_accuracy": 0.967992240543162, |
|
"eval_overall_f1": 0.8555555555555555, |
|
"eval_overall_precision": 0.8257372654155496, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.9609, |
|
"eval_samples_per_second": 194.606, |
|
"eval_steps_per_second": 3.122, |
|
"step": 7844 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"grad_norm": 0.00024878690601326525, |
|
"learning_rate": 1.25e-05, |
|
"loss": 0.0012, |
|
"step": 7950 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"eval_LOCATION_f1": 0.8026315789473684, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7530864197530864, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.8082191780821918, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7283950617283951, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.9180327868852459, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.9032258064516129, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.8169014084507042, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7631578947368421, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.34358134865760803, |
|
"eval_overall_accuracy": 0.9641125121241513, |
|
"eval_overall_f1": 0.8528610354223433, |
|
"eval_overall_precision": 0.8087855297157622, |
|
"eval_overall_recall": 0.9020172910662824, |
|
"eval_runtime": 0.9518, |
|
"eval_samples_per_second": 196.477, |
|
"eval_steps_per_second": 3.152, |
|
"step": 7950 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"grad_norm": 0.0002495927328709513, |
|
"learning_rate": 1.2e-05, |
|
"loss": 0.0002, |
|
"step": 8056 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"eval_LOCATION_f1": 0.8026315789473684, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7530864197530864, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.802721088435374, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7195121951219512, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.9210526315789475, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.9090909090909091, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.8285714285714285, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7837837837837838, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.34999027848243713, |
|
"eval_overall_accuracy": 0.9636275460717749, |
|
"eval_overall_f1": 0.854024556616644, |
|
"eval_overall_precision": 0.810880829015544, |
|
"eval_overall_recall": 0.9020172910662824, |
|
"eval_runtime": 0.9639, |
|
"eval_samples_per_second": 194.004, |
|
"eval_steps_per_second": 3.112, |
|
"step": 8056 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"grad_norm": 0.000243131464230828, |
|
"learning_rate": 1.1500000000000002e-05, |
|
"loss": 0.0007, |
|
"step": 8162 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"eval_LOCATION_f1": 0.8079470198675496, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7625, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.8137931034482759, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7375, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.9210526315789475, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.9090909090909091, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.8285714285714285, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7837837837837838, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.3344757556915283, |
|
"eval_overall_accuracy": 0.9645974781765276, |
|
"eval_overall_f1": 0.8575342465753425, |
|
"eval_overall_precision": 0.8172323759791122, |
|
"eval_overall_recall": 0.9020172910662824, |
|
"eval_runtime": 0.9601, |
|
"eval_samples_per_second": 194.77, |
|
"eval_steps_per_second": 3.125, |
|
"step": 8162 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"grad_norm": 0.00021198501053731889, |
|
"learning_rate": 1.1000000000000001e-05, |
|
"loss": 0.0006, |
|
"step": 8268 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"eval_LOCATION_f1": 0.8079470198675496, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7625, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.802919708029197, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7638888888888888, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.9210526315789475, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.9090909090909091, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.8285714285714285, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7837837837837838, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.3224840760231018, |
|
"eval_overall_accuracy": 0.9655674102812803, |
|
"eval_overall_f1": 0.8559556786703602, |
|
"eval_overall_precision": 0.824, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.9532, |
|
"eval_samples_per_second": 196.177, |
|
"eval_steps_per_second": 3.147, |
|
"step": 8268 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"grad_norm": 0.0016178454970940948, |
|
"learning_rate": 1.05e-05, |
|
"loss": 0.0002, |
|
"step": 8374 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"eval_LOCATION_f1": 0.8079470198675496, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7625, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7913669064748202, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7432432432432432, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.9180327868852459, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.9032258064516129, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.8285714285714285, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7837837837837838, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.3340538740158081, |
|
"eval_overall_accuracy": 0.965082444228904, |
|
"eval_overall_f1": 0.8547717842323651, |
|
"eval_overall_precision": 0.8218085106382979, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 1.013, |
|
"eval_samples_per_second": 184.602, |
|
"eval_steps_per_second": 2.962, |
|
"step": 8374 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"grad_norm": 0.0010399464517831802, |
|
"learning_rate": 1e-05, |
|
"loss": 0.0005, |
|
"step": 8480 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"eval_LOCATION_f1": 0.8133333333333335, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7721518987341772, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7913669064748202, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7432432432432432, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.9144736842105262, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.9025974025974026, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.8285714285714285, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7837837837837838, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.3451690971851349, |
|
"eval_overall_accuracy": 0.965082444228904, |
|
"eval_overall_f1": 0.8543689320388349, |
|
"eval_overall_precision": 0.8235294117647058, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.9594, |
|
"eval_samples_per_second": 194.923, |
|
"eval_steps_per_second": 3.127, |
|
"step": 8480 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"grad_norm": 0.0004898614133708179, |
|
"learning_rate": 9.5e-06, |
|
"loss": 0.0002, |
|
"step": 8586 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"eval_LOCATION_f1": 0.8133333333333335, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7721518987341772, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7857142857142856, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7333333333333333, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.9144736842105262, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.9025974025974026, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.8285714285714285, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7837837837837838, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.3453369140625, |
|
"eval_overall_accuracy": 0.965082444228904, |
|
"eval_overall_f1": 0.853185595567867, |
|
"eval_overall_precision": 0.8213333333333334, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.9528, |
|
"eval_samples_per_second": 196.26, |
|
"eval_steps_per_second": 3.149, |
|
"step": 8586 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"grad_norm": 0.0012529068626463413, |
|
"learning_rate": 9e-06, |
|
"loss": 0.0002, |
|
"step": 8692 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"eval_LOCATION_f1": 0.8076923076923077, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7411764705882353, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7943262411347517, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7368421052631579, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.9049180327868852, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8903225806451613, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.8285714285714285, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7837837837837838, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.3554005026817322, |
|
"eval_overall_accuracy": 0.9641125121241513, |
|
"eval_overall_f1": 0.8481532147742818, |
|
"eval_overall_precision": 0.8072916666666666, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.9565, |
|
"eval_samples_per_second": 195.504, |
|
"eval_steps_per_second": 3.136, |
|
"step": 8692 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"grad_norm": 0.0037664775736629963, |
|
"learning_rate": 8.500000000000002e-06, |
|
"loss": 0.0005, |
|
"step": 8798 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"eval_LOCATION_f1": 0.8079470198675496, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7625, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7681159420289856, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.726027397260274, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.9102990033222591, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.9072847682119205, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.8285714285714285, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7837837837837838, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8571428571428571, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8571428571428571, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.33550789952278137, |
|
"eval_overall_accuracy": 0.965082444228904, |
|
"eval_overall_f1": 0.8491620111731844, |
|
"eval_overall_precision": 0.8238482384823849, |
|
"eval_overall_recall": 0.8760806916426513, |
|
"eval_runtime": 0.9544, |
|
"eval_samples_per_second": 195.933, |
|
"eval_steps_per_second": 3.143, |
|
"step": 8798 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"grad_norm": 0.00019280197739135474, |
|
"learning_rate": 8.000000000000001e-06, |
|
"loss": 0.0002, |
|
"step": 8904 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"eval_LOCATION_f1": 0.7922077922077921, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7659574468085107, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7105263157894737, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.9049180327868852, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8903225806451613, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.8571428571428571, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.8108108108108109, |
|
"eval_QUANTITY_recall": 0.9090909090909091, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.3492893576622009, |
|
"eval_overall_accuracy": 0.9633850630455868, |
|
"eval_overall_f1": 0.8422496570644719, |
|
"eval_overall_precision": 0.8036649214659686, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.9553, |
|
"eval_samples_per_second": 195.753, |
|
"eval_steps_per_second": 3.14, |
|
"step": 8904 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"grad_norm": 0.0007057705661281943, |
|
"learning_rate": 7.5e-06, |
|
"loss": 0.0003, |
|
"step": 9010 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"eval_LOCATION_f1": 0.7973856209150327, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7714285714285715, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.72, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.9049180327868852, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8903225806451613, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.8285714285714285, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7837837837837838, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.3493691086769104, |
|
"eval_overall_accuracy": 0.9636275460717749, |
|
"eval_overall_f1": 0.8418156808803301, |
|
"eval_overall_precision": 0.8052631578947368, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.9473, |
|
"eval_samples_per_second": 197.399, |
|
"eval_steps_per_second": 3.167, |
|
"step": 9010 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"grad_norm": 0.00023777979367878288, |
|
"learning_rate": 7.000000000000001e-06, |
|
"loss": 0.0002, |
|
"step": 9116 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"eval_LOCATION_f1": 0.7973856209150327, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7801418439716312, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7236842105263158, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.9049180327868852, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8903225806451613, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.8285714285714285, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7837837837837838, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.35241079330444336, |
|
"eval_overall_accuracy": 0.9641125121241513, |
|
"eval_overall_f1": 0.8434065934065933, |
|
"eval_overall_precision": 0.8057742782152231, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.9506, |
|
"eval_samples_per_second": 196.717, |
|
"eval_steps_per_second": 3.156, |
|
"step": 9116 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"grad_norm": 0.0003070076636504382, |
|
"learning_rate": 6.5000000000000004e-06, |
|
"loss": 0.0002, |
|
"step": 9222 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"eval_LOCATION_f1": 0.8104575163398693, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7560975609756098, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7785234899328859, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6904761904761905, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.9084967320261438, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8910256410256411, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.8285714285714285, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7837837837837838, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.3664219081401825, |
|
"eval_overall_accuracy": 0.9629000969932104, |
|
"eval_overall_f1": 0.8466757123473542, |
|
"eval_overall_precision": 0.8, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.9567, |
|
"eval_samples_per_second": 195.468, |
|
"eval_steps_per_second": 3.136, |
|
"step": 9222 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"grad_norm": 0.0003128907410427928, |
|
"learning_rate": 6e-06, |
|
"loss": 0.0002, |
|
"step": 9328 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"eval_LOCATION_f1": 0.8053691275167785, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7692307692307693, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7792207792207791, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6741573033707865, |
|
"eval_ORGANIZATION_recall": 0.9230769230769231, |
|
"eval_PERSON_f1": 0.9180327868852459, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.9032258064516129, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.8450704225352113, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7894736842105263, |
|
"eval_QUANTITY_recall": 0.9090909090909091, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.3721804618835449, |
|
"eval_overall_accuracy": 0.9626576139670223, |
|
"eval_overall_f1": 0.8509485094850948, |
|
"eval_overall_precision": 0.80306905370844, |
|
"eval_overall_recall": 0.9048991354466859, |
|
"eval_runtime": 0.9518, |
|
"eval_samples_per_second": 196.461, |
|
"eval_steps_per_second": 3.152, |
|
"step": 9328 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"grad_norm": 0.0002441601827740669, |
|
"learning_rate": 5.500000000000001e-06, |
|
"loss": 0.0002, |
|
"step": 9434 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"eval_LOCATION_f1": 0.7894736842105262, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7407407407407407, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7837837837837838, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6987951807228916, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.9180327868852459, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.9032258064516129, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.8571428571428571, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.8108108108108109, |
|
"eval_QUANTITY_recall": 0.9090909090909091, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.3669990599155426, |
|
"eval_overall_accuracy": 0.9629000969932104, |
|
"eval_overall_f1": 0.8501362397820164, |
|
"eval_overall_precision": 0.8062015503875969, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.968, |
|
"eval_samples_per_second": 193.188, |
|
"eval_steps_per_second": 3.099, |
|
"step": 9434 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"grad_norm": 0.001270479173399508, |
|
"learning_rate": 5e-06, |
|
"loss": 0.0002, |
|
"step": 9540 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"eval_LOCATION_f1": 0.7894736842105262, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7407407407407407, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7837837837837838, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6987951807228916, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.9180327868852459, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.9032258064516129, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.8571428571428571, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.8108108108108109, |
|
"eval_QUANTITY_recall": 0.9090909090909091, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.36801740527153015, |
|
"eval_overall_accuracy": 0.9629000969932104, |
|
"eval_overall_f1": 0.8501362397820164, |
|
"eval_overall_precision": 0.8062015503875969, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.9464, |
|
"eval_samples_per_second": 197.59, |
|
"eval_steps_per_second": 3.17, |
|
"step": 9540 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"grad_norm": 0.00022247471497394145, |
|
"learning_rate": 4.5e-06, |
|
"loss": 0.0002, |
|
"step": 9646 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"eval_LOCATION_f1": 0.7894736842105262, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7407407407407407, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7837837837837838, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6987951807228916, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.9084967320261438, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8910256410256411, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.8571428571428571, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.8108108108108109, |
|
"eval_QUANTITY_recall": 0.9090909090909091, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.3627462089061737, |
|
"eval_overall_accuracy": 0.9629000969932104, |
|
"eval_overall_f1": 0.8462585034013606, |
|
"eval_overall_precision": 0.8015463917525774, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.9545, |
|
"eval_samples_per_second": 195.918, |
|
"eval_steps_per_second": 3.143, |
|
"step": 9646 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"grad_norm": 0.00013813188706990331, |
|
"learning_rate": 4.000000000000001e-06, |
|
"loss": 0.0002, |
|
"step": 9752 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"eval_LOCATION_f1": 0.7973856209150327, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7785234899328859, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6904761904761905, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.9180327868852459, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.9032258064516129, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.8571428571428571, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.8108108108108109, |
|
"eval_QUANTITY_recall": 0.9090909090909091, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.3727177083492279, |
|
"eval_overall_accuracy": 0.9629000969932104, |
|
"eval_overall_f1": 0.8493894165535958, |
|
"eval_overall_precision": 0.8025641025641026, |
|
"eval_overall_recall": 0.9020172910662824, |
|
"eval_runtime": 0.954, |
|
"eval_samples_per_second": 196.013, |
|
"eval_steps_per_second": 3.145, |
|
"step": 9752 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"grad_norm": 0.000215419742744416, |
|
"learning_rate": 3.5000000000000004e-06, |
|
"loss": 0.0002, |
|
"step": 9858 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"eval_LOCATION_f1": 0.7894736842105262, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7407407407407407, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7837837837837838, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6987951807228916, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.9084967320261438, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8910256410256411, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.8571428571428571, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.8108108108108109, |
|
"eval_QUANTITY_recall": 0.9090909090909091, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.37157806754112244, |
|
"eval_overall_accuracy": 0.962172647914646, |
|
"eval_overall_f1": 0.8451086956521738, |
|
"eval_overall_precision": 0.7994858611825193, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.9451, |
|
"eval_samples_per_second": 197.862, |
|
"eval_steps_per_second": 3.174, |
|
"step": 9858 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"grad_norm": 0.0003316714719403535, |
|
"learning_rate": 3e-06, |
|
"loss": 0.0002, |
|
"step": 9964 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"eval_LOCATION_f1": 0.7894736842105262, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7407407407407407, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.8082191780821918, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7283950617283951, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.9205298013245033, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.9144736842105263, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.8571428571428571, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.8108108108108109, |
|
"eval_QUANTITY_recall": 0.9090909090909091, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.35780400037765503, |
|
"eval_overall_accuracy": 0.9643549951503395, |
|
"eval_overall_f1": 0.8559670781893004, |
|
"eval_overall_precision": 0.8167539267015707, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.9435, |
|
"eval_samples_per_second": 198.203, |
|
"eval_steps_per_second": 3.18, |
|
"step": 9964 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"grad_norm": 0.005569119472056627, |
|
"learning_rate": 2.5e-06, |
|
"loss": 0.0002, |
|
"step": 10070 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"eval_LOCATION_f1": 0.7894736842105262, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7407407407407407, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.8082191780821918, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7283950617283951, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.9205298013245033, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.9144736842105263, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.8571428571428571, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.8108108108108109, |
|
"eval_QUANTITY_recall": 0.9090909090909091, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.3565683662891388, |
|
"eval_overall_accuracy": 0.9645974781765276, |
|
"eval_overall_f1": 0.8559670781893004, |
|
"eval_overall_precision": 0.8167539267015707, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.9611, |
|
"eval_samples_per_second": 194.577, |
|
"eval_steps_per_second": 3.122, |
|
"step": 10070 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"grad_norm": 0.00045707172830589116, |
|
"learning_rate": 2.0000000000000003e-06, |
|
"loss": 0.0006, |
|
"step": 10176 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"eval_LOCATION_f1": 0.7894736842105262, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7407407407407407, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7945205479452054, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7160493827160493, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.9180327868852459, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.9032258064516129, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.8571428571428571, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.8108108108108109, |
|
"eval_QUANTITY_recall": 0.9090909090909091, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.3609143793582916, |
|
"eval_overall_accuracy": 0.9641125121241513, |
|
"eval_overall_f1": 0.8524590163934427, |
|
"eval_overall_precision": 0.8103896103896104, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.9457, |
|
"eval_samples_per_second": 197.739, |
|
"eval_steps_per_second": 3.172, |
|
"step": 10176 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"grad_norm": 0.0002619586593937129, |
|
"learning_rate": 1.5e-06, |
|
"loss": 0.0003, |
|
"step": 10282 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"eval_LOCATION_f1": 0.7894736842105262, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7407407407407407, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7945205479452054, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7160493827160493, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.9180327868852459, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.9032258064516129, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.8571428571428571, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.8108108108108109, |
|
"eval_QUANTITY_recall": 0.9090909090909091, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.3629205524921417, |
|
"eval_overall_accuracy": 0.9641125121241513, |
|
"eval_overall_f1": 0.8524590163934427, |
|
"eval_overall_precision": 0.8103896103896104, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.9477, |
|
"eval_samples_per_second": 197.31, |
|
"eval_steps_per_second": 3.165, |
|
"step": 10282 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"grad_norm": 0.0001948641292983666, |
|
"learning_rate": 1.0000000000000002e-06, |
|
"loss": 0.0002, |
|
"step": 10388 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"eval_LOCATION_f1": 0.7894736842105262, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7407407407407407, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7945205479452054, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7160493827160493, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.9180327868852459, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.9032258064516129, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.8571428571428571, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.8108108108108109, |
|
"eval_QUANTITY_recall": 0.9090909090909091, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.35546010732650757, |
|
"eval_overall_accuracy": 0.9645974781765276, |
|
"eval_overall_f1": 0.8524590163934427, |
|
"eval_overall_precision": 0.8103896103896104, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.9637, |
|
"eval_samples_per_second": 194.037, |
|
"eval_steps_per_second": 3.113, |
|
"step": 10388 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"grad_norm": 0.023726776242256165, |
|
"learning_rate": 5.000000000000001e-07, |
|
"loss": 0.0002, |
|
"step": 10494 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"eval_LOCATION_f1": 0.7894736842105262, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7407407407407407, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7945205479452054, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7160493827160493, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.9180327868852459, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.9032258064516129, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.8571428571428571, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.8108108108108109, |
|
"eval_QUANTITY_recall": 0.9090909090909091, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.35447004437446594, |
|
"eval_overall_accuracy": 0.9648399612027158, |
|
"eval_overall_f1": 0.8524590163934427, |
|
"eval_overall_precision": 0.8103896103896104, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.951, |
|
"eval_samples_per_second": 196.644, |
|
"eval_steps_per_second": 3.155, |
|
"step": 10494 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"grad_norm": 0.0003471510426606983, |
|
"learning_rate": 0.0, |
|
"loss": 0.0004, |
|
"step": 10600 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"eval_LOCATION_f1": 0.7894736842105262, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7407407407407407, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7945205479452054, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7160493827160493, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.9180327868852459, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.9032258064516129, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.8571428571428571, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.8108108108108109, |
|
"eval_QUANTITY_recall": 0.9090909090909091, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.3544124364852905, |
|
"eval_overall_accuracy": 0.9645974781765276, |
|
"eval_overall_f1": 0.8524590163934427, |
|
"eval_overall_precision": 0.8103896103896104, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.9623, |
|
"eval_samples_per_second": 194.318, |
|
"eval_steps_per_second": 3.117, |
|
"step": 10600 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"step": 10600, |
|
"total_flos": 4591573981087056.0, |
|
"train_loss": 0.008363780669411118, |
|
"train_runtime": 2646.2436, |
|
"train_samples_per_second": 63.789, |
|
"train_steps_per_second": 4.006 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 10600, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 100, |
|
"save_steps": 500, |
|
"total_flos": 4591573981087056.0, |
|
"train_batch_size": 16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|