|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 100.0, |
|
"eval_steps": 500, |
|
"global_step": 10600, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"grad_norm": 1.5824520587921143, |
|
"learning_rate": 4.9500000000000004e-05, |
|
"loss": 0.9315, |
|
"step": 106 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_LOCATION_f1": 0.0, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.0, |
|
"eval_LOCATION_recall": 0.0, |
|
"eval_ORGANIZATION_f1": 0.0, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.0, |
|
"eval_ORGANIZATION_recall": 0.0, |
|
"eval_PERSON_f1": 0.012987012987012988, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.25, |
|
"eval_PERSON_recall": 0.006666666666666667, |
|
"eval_QUANTITY_f1": 0.0, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.0, |
|
"eval_QUANTITY_recall": 0.0, |
|
"eval_TIME_f1": 0.0, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.0, |
|
"eval_TIME_recall": 0.0, |
|
"eval_loss": 0.6119179725646973, |
|
"eval_overall_accuracy": 0.8370662072360325, |
|
"eval_overall_f1": 0.005633802816901409, |
|
"eval_overall_precision": 0.25, |
|
"eval_overall_recall": 0.002849002849002849, |
|
"eval_runtime": 0.3369, |
|
"eval_samples_per_second": 555.024, |
|
"eval_steps_per_second": 8.904, |
|
"step": 106 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"grad_norm": 1.5226932764053345, |
|
"learning_rate": 4.9e-05, |
|
"loss": 0.5353, |
|
"step": 212 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_LOCATION_f1": 0.40983606557377056, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.5102040816326531, |
|
"eval_LOCATION_recall": 0.3424657534246575, |
|
"eval_ORGANIZATION_f1": 0.08695652173913043, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.1, |
|
"eval_ORGANIZATION_recall": 0.07692307692307693, |
|
"eval_PERSON_f1": 0.574468085106383, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.4778761061946903, |
|
"eval_PERSON_recall": 0.72, |
|
"eval_QUANTITY_f1": 0.0, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.0, |
|
"eval_QUANTITY_recall": 0.0, |
|
"eval_TIME_f1": 0.5483870967741935, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.6071428571428571, |
|
"eval_TIME_recall": 0.5, |
|
"eval_loss": 0.411459743976593, |
|
"eval_overall_accuracy": 0.8924440068914595, |
|
"eval_overall_f1": 0.4397163120567376, |
|
"eval_overall_precision": 0.4378531073446328, |
|
"eval_overall_recall": 0.4415954415954416, |
|
"eval_runtime": 0.3252, |
|
"eval_samples_per_second": 574.99, |
|
"eval_steps_per_second": 9.224, |
|
"step": 212 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"grad_norm": 1.2673431634902954, |
|
"learning_rate": 4.85e-05, |
|
"loss": 0.3686, |
|
"step": 318 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_LOCATION_f1": 0.5747126436781609, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.49504950495049505, |
|
"eval_LOCATION_recall": 0.684931506849315, |
|
"eval_ORGANIZATION_f1": 0.45528455284552843, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.4827586206896552, |
|
"eval_ORGANIZATION_recall": 0.4307692307692308, |
|
"eval_PERSON_f1": 0.7507163323782233, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.6582914572864321, |
|
"eval_PERSON_recall": 0.8733333333333333, |
|
"eval_QUANTITY_f1": 0.3934426229508197, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.375, |
|
"eval_QUANTITY_recall": 0.41379310344827586, |
|
"eval_TIME_f1": 0.8115942028985507, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8235294117647058, |
|
"eval_loss": 0.29026341438293457, |
|
"eval_overall_accuracy": 0.9288702928870293, |
|
"eval_overall_f1": 0.6417525773195876, |
|
"eval_overall_precision": 0.5858823529411765, |
|
"eval_overall_recall": 0.7094017094017094, |
|
"eval_runtime": 0.3326, |
|
"eval_samples_per_second": 562.209, |
|
"eval_steps_per_second": 9.019, |
|
"step": 318 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"grad_norm": 1.4100310802459717, |
|
"learning_rate": 4.8e-05, |
|
"loss": 0.2668, |
|
"step": 424 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_LOCATION_f1": 0.5664739884393063, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.49, |
|
"eval_LOCATION_recall": 0.6712328767123288, |
|
"eval_ORGANIZATION_f1": 0.4878048780487805, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5172413793103449, |
|
"eval_ORGANIZATION_recall": 0.46153846153846156, |
|
"eval_PERSON_f1": 0.8246153846153845, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.7657142857142857, |
|
"eval_PERSON_recall": 0.8933333333333333, |
|
"eval_QUANTITY_f1": 0.5245901639344263, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5, |
|
"eval_QUANTITY_recall": 0.5517241379310345, |
|
"eval_TIME_f1": 0.8823529411764706, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.8823529411764706, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.207948699593544, |
|
"eval_overall_accuracy": 0.9401919763721388, |
|
"eval_overall_f1": 0.6906666666666667, |
|
"eval_overall_precision": 0.6491228070175439, |
|
"eval_overall_recall": 0.7378917378917379, |
|
"eval_runtime": 0.3333, |
|
"eval_samples_per_second": 560.99, |
|
"eval_steps_per_second": 9.0, |
|
"step": 424 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"grad_norm": 2.0687103271484375, |
|
"learning_rate": 4.75e-05, |
|
"loss": 0.2091, |
|
"step": 530 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_LOCATION_f1": 0.7195121951219512, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.6483516483516484, |
|
"eval_LOCATION_recall": 0.8082191780821918, |
|
"eval_ORGANIZATION_f1": 0.5714285714285715, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5588235294117647, |
|
"eval_ORGANIZATION_recall": 0.5846153846153846, |
|
"eval_PERSON_f1": 0.8369230769230769, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.7771428571428571, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.5846153846153845, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5277777777777778, |
|
"eval_QUANTITY_recall": 0.6551724137931034, |
|
"eval_TIME_f1": 0.8333333333333333, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7894736842105263, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.17728105187416077, |
|
"eval_overall_accuracy": 0.9451144474526212, |
|
"eval_overall_f1": 0.7430830039525692, |
|
"eval_overall_precision": 0.6911764705882353, |
|
"eval_overall_recall": 0.8034188034188035, |
|
"eval_runtime": 0.3284, |
|
"eval_samples_per_second": 569.476, |
|
"eval_steps_per_second": 9.136, |
|
"step": 530 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"grad_norm": 2.4117839336395264, |
|
"learning_rate": 4.7e-05, |
|
"loss": 0.1833, |
|
"step": 636 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_LOCATION_f1": 0.6971428571428572, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.5980392156862745, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.5818181818181819, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.48, |
|
"eval_ORGANIZATION_recall": 0.7384615384615385, |
|
"eval_PERSON_f1": 0.8353658536585366, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.7696629213483146, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.5555555555555556, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.46511627906976744, |
|
"eval_QUANTITY_recall": 0.6896551724137931, |
|
"eval_TIME_f1": 0.7837837837837837, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.725, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.189751997590065, |
|
"eval_overall_accuracy": 0.9424070883583558, |
|
"eval_overall_f1": 0.7248157248157246, |
|
"eval_overall_precision": 0.6371490280777538, |
|
"eval_overall_recall": 0.8404558404558404, |
|
"eval_runtime": 0.3281, |
|
"eval_samples_per_second": 569.94, |
|
"eval_steps_per_second": 9.143, |
|
"step": 636 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"grad_norm": 1.2822880744934082, |
|
"learning_rate": 4.6500000000000005e-05, |
|
"loss": 0.1653, |
|
"step": 742 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_LOCATION_f1": 0.7607361963190183, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.6888888888888889, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.5857142857142857, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5466666666666666, |
|
"eval_ORGANIZATION_recall": 0.6307692307692307, |
|
"eval_PERSON_f1": 0.8616352201257862, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8154761904761905, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.6666666666666667, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5945945945945946, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8450704225352113, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.8108108108108109, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.15423187613487244, |
|
"eval_overall_accuracy": 0.9512675363032242, |
|
"eval_overall_f1": 0.770448548812665, |
|
"eval_overall_precision": 0.7174447174447175, |
|
"eval_overall_recall": 0.8319088319088319, |
|
"eval_runtime": 0.3338, |
|
"eval_samples_per_second": 560.152, |
|
"eval_steps_per_second": 8.986, |
|
"step": 742 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"grad_norm": 1.469247817993164, |
|
"learning_rate": 4.600000000000001e-05, |
|
"loss": 0.1529, |
|
"step": 848 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_LOCATION_f1": 0.7590361445783131, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.6774193548387096, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.5915492957746479, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5454545454545454, |
|
"eval_ORGANIZATION_recall": 0.6461538461538462, |
|
"eval_PERSON_f1": 0.8500000000000001, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7619047619047619, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.7058823529411765, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.861111111111111, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.8157894736842105, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.14763768017292023, |
|
"eval_overall_accuracy": 0.9527442776273689, |
|
"eval_overall_f1": 0.7758846657929228, |
|
"eval_overall_precision": 0.7184466019417476, |
|
"eval_overall_recall": 0.8433048433048433, |
|
"eval_runtime": 0.3346, |
|
"eval_samples_per_second": 558.898, |
|
"eval_steps_per_second": 8.966, |
|
"step": 848 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"grad_norm": 1.5628341436386108, |
|
"learning_rate": 4.55e-05, |
|
"loss": 0.1428, |
|
"step": 954 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_LOCATION_f1": 0.7544910179640719, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.6702127659574468, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6225165562913907, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5465116279069767, |
|
"eval_ORGANIZATION_recall": 0.7230769230769231, |
|
"eval_PERSON_f1": 0.879746835443038, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8373493975903614, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.6666666666666666, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.575, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8266666666666665, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7560975609756098, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.14981509745121002, |
|
"eval_overall_accuracy": 0.9497907949790795, |
|
"eval_overall_f1": 0.7789203084832904, |
|
"eval_overall_precision": 0.7096018735362998, |
|
"eval_overall_recall": 0.8632478632478633, |
|
"eval_runtime": 0.3338, |
|
"eval_samples_per_second": 560.163, |
|
"eval_steps_per_second": 8.987, |
|
"step": 954 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"grad_norm": 1.2276618480682373, |
|
"learning_rate": 4.5e-05, |
|
"loss": 0.132, |
|
"step": 1060 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_LOCATION_f1": 0.779874213836478, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7209302325581395, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.5925925925925927, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5714285714285714, |
|
"eval_ORGANIZATION_recall": 0.6153846153846154, |
|
"eval_PERSON_f1": 0.8616352201257862, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8154761904761905, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.746268656716418, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.8108108108108107, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.14296573400497437, |
|
"eval_overall_accuracy": 0.9532365247354172, |
|
"eval_overall_f1": 0.7808764940239045, |
|
"eval_overall_precision": 0.7313432835820896, |
|
"eval_overall_recall": 0.8376068376068376, |
|
"eval_runtime": 0.3274, |
|
"eval_samples_per_second": 571.224, |
|
"eval_steps_per_second": 9.164, |
|
"step": 1060 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"grad_norm": 1.8262553215026855, |
|
"learning_rate": 4.4500000000000004e-05, |
|
"loss": 0.1288, |
|
"step": 1166 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_LOCATION_f1": 0.7515151515151515, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.6739130434782609, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.6330935251798562, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5945945945945946, |
|
"eval_ORGANIZATION_recall": 0.676923076923077, |
|
"eval_PERSON_f1": 0.8698412698412699, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8303030303030303, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.6956521739130435, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.7631578947368423, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.6904761904761905, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.1460973471403122, |
|
"eval_overall_accuracy": 0.9515136598572483, |
|
"eval_overall_f1": 0.774869109947644, |
|
"eval_overall_precision": 0.7167070217917676, |
|
"eval_overall_recall": 0.8433048433048433, |
|
"eval_runtime": 0.3342, |
|
"eval_samples_per_second": 559.473, |
|
"eval_steps_per_second": 8.976, |
|
"step": 1166 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"grad_norm": 1.1676838397979736, |
|
"learning_rate": 4.4000000000000006e-05, |
|
"loss": 0.1219, |
|
"step": 1272 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_LOCATION_f1": 0.7590361445783131, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.6774193548387096, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6433566433566433, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5897435897435898, |
|
"eval_ORGANIZATION_recall": 0.7076923076923077, |
|
"eval_PERSON_f1": 0.8734177215189873, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8313253012048193, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7058823529411765, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6153846153846154, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.7631578947368423, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.6904761904761905, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.14986908435821533, |
|
"eval_overall_accuracy": 0.9502830420871278, |
|
"eval_overall_f1": 0.7802340702210663, |
|
"eval_overall_precision": 0.7177033492822966, |
|
"eval_overall_recall": 0.8547008547008547, |
|
"eval_runtime": 0.333, |
|
"eval_samples_per_second": 561.614, |
|
"eval_steps_per_second": 9.01, |
|
"step": 1272 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"grad_norm": 1.25841224193573, |
|
"learning_rate": 4.35e-05, |
|
"loss": 0.1176, |
|
"step": 1378 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_LOCATION_f1": 0.7820512820512822, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.6666666666666666, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5975609756097561, |
|
"eval_ORGANIZATION_recall": 0.7538461538461538, |
|
"eval_PERSON_f1": 0.8789808917197452, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8414634146341463, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7352941176470588, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6410256410256411, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.7945205479452054, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7435897435897436, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.13805125653743744, |
|
"eval_overall_accuracy": 0.9547132660595619, |
|
"eval_overall_f1": 0.7968337730870712, |
|
"eval_overall_precision": 0.742014742014742, |
|
"eval_overall_recall": 0.8603988603988604, |
|
"eval_runtime": 0.3326, |
|
"eval_samples_per_second": 562.243, |
|
"eval_steps_per_second": 9.02, |
|
"step": 1378 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"grad_norm": 1.1619478464126587, |
|
"learning_rate": 4.3e-05, |
|
"loss": 0.1161, |
|
"step": 1484 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_LOCATION_f1": 0.782608695652174, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7159090909090909, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6666666666666666, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5975609756097561, |
|
"eval_ORGANIZATION_recall": 0.7538461538461538, |
|
"eval_PERSON_f1": 0.8761904761904761, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8363636363636363, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7536231884057972, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.65, |
|
"eval_QUANTITY_recall": 0.896551724137931, |
|
"eval_TIME_f1": 0.7631578947368423, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.6904761904761905, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.14077436923980713, |
|
"eval_overall_accuracy": 0.9532365247354172, |
|
"eval_overall_f1": 0.7942708333333333, |
|
"eval_overall_precision": 0.7314148681055156, |
|
"eval_overall_recall": 0.8689458689458689, |
|
"eval_runtime": 0.3264, |
|
"eval_samples_per_second": 572.885, |
|
"eval_steps_per_second": 9.191, |
|
"step": 1484 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"grad_norm": 1.547819972038269, |
|
"learning_rate": 4.25e-05, |
|
"loss": 0.1148, |
|
"step": 1590 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_LOCATION_f1": 0.7777777777777778, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7078651685393258, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.7058823529411765, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6136363636363636, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8726114649681529, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8353658536585366, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7246376811594203, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.625, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.7733333333333334, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7073170731707317, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.1482475847005844, |
|
"eval_overall_accuracy": 0.9537287718434654, |
|
"eval_overall_f1": 0.7968952134540751, |
|
"eval_overall_precision": 0.7298578199052133, |
|
"eval_overall_recall": 0.8774928774928775, |
|
"eval_runtime": 0.3273, |
|
"eval_samples_per_second": 571.301, |
|
"eval_steps_per_second": 9.165, |
|
"step": 1590 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"grad_norm": 3.2295055389404297, |
|
"learning_rate": 4.2e-05, |
|
"loss": 0.1075, |
|
"step": 1696 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_LOCATION_f1": 0.8076923076923077, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7590361445783133, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6268656716417911, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6086956521739131, |
|
"eval_ORGANIZATION_recall": 0.6461538461538462, |
|
"eval_PERSON_f1": 0.8753993610223643, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8404907975460123, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7142857142857144, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6097560975609756, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.7733333333333334, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7073170731707317, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.14014115929603577, |
|
"eval_overall_accuracy": 0.9554516367216342, |
|
"eval_overall_f1": 0.7914438502673797, |
|
"eval_overall_precision": 0.7455919395465995, |
|
"eval_overall_recall": 0.8433048433048433, |
|
"eval_runtime": 0.3353, |
|
"eval_samples_per_second": 557.692, |
|
"eval_steps_per_second": 8.947, |
|
"step": 1696 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"grad_norm": 0.9571211934089661, |
|
"learning_rate": 4.15e-05, |
|
"loss": 0.1058, |
|
"step": 1802 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_LOCATION_f1": 0.7875, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7241379310344828, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.7199999999999999, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6352941176470588, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8761904761904761, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8363636363636363, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7575757575757576, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6756756756756757, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.7631578947368423, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.6904761904761905, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.14074338972568512, |
|
"eval_overall_accuracy": 0.9542210189515137, |
|
"eval_overall_f1": 0.8057366362451107, |
|
"eval_overall_precision": 0.7427884615384616, |
|
"eval_overall_recall": 0.8803418803418803, |
|
"eval_runtime": 0.3268, |
|
"eval_samples_per_second": 572.193, |
|
"eval_steps_per_second": 9.18, |
|
"step": 1802 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"grad_norm": 1.2484526634216309, |
|
"learning_rate": 4.1e-05, |
|
"loss": 0.1021, |
|
"step": 1908 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_LOCATION_f1": 0.8076923076923077, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7590361445783133, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6433566433566433, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5897435897435898, |
|
"eval_ORGANIZATION_recall": 0.7076923076923077, |
|
"eval_PERSON_f1": 0.8789808917197452, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8414634146341463, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6956521739130435, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.7837837837837837, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.725, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.13723434507846832, |
|
"eval_overall_accuracy": 0.9561900073837066, |
|
"eval_overall_f1": 0.7936507936507937, |
|
"eval_overall_precision": 0.7407407407407407, |
|
"eval_overall_recall": 0.8547008547008547, |
|
"eval_runtime": 0.3273, |
|
"eval_samples_per_second": 571.38, |
|
"eval_steps_per_second": 9.167, |
|
"step": 1908 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"grad_norm": 0.977418839931488, |
|
"learning_rate": 4.05e-05, |
|
"loss": 0.1032, |
|
"step": 2014 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_LOCATION_f1": 0.8026315789473685, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7721518987341772, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7066666666666667, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6235294117647059, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7812500000000001, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.7733333333333334, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7073170731707317, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.13176140189170837, |
|
"eval_overall_accuracy": 0.958897366477972, |
|
"eval_overall_f1": 0.8116710875331565, |
|
"eval_overall_precision": 0.7593052109181141, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.3289, |
|
"eval_samples_per_second": 568.639, |
|
"eval_steps_per_second": 9.123, |
|
"step": 2014 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"grad_norm": 1.2055819034576416, |
|
"learning_rate": 4e-05, |
|
"loss": 0.0979, |
|
"step": 2120 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_LOCATION_f1": 0.7974683544303799, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7411764705882353, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.7412587412587412, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6794871794871795, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8789808917197452, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8414634146341463, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.716417910447761, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.631578947368421, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.7945205479452054, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7435897435897436, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.1400451809167862, |
|
"eval_overall_accuracy": 0.956928378045779, |
|
"eval_overall_f1": 0.8132450331125828, |
|
"eval_overall_precision": 0.7599009900990099, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.3266, |
|
"eval_samples_per_second": 572.647, |
|
"eval_steps_per_second": 9.187, |
|
"step": 2120 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"grad_norm": 2.198835611343384, |
|
"learning_rate": 3.9500000000000005e-05, |
|
"loss": 0.098, |
|
"step": 2226 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"eval_LOCATION_f1": 0.8181818181818182, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7777777777777778, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.725925925925926, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7, |
|
"eval_ORGANIZATION_recall": 0.7538461538461538, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.746268656716418, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.7945205479452054, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7435897435897436, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.13511410355567932, |
|
"eval_overall_accuracy": 0.9593896135860202, |
|
"eval_overall_f1": 0.8194070080862534, |
|
"eval_overall_precision": 0.7774936061381074, |
|
"eval_overall_recall": 0.8660968660968661, |
|
"eval_runtime": 0.3268, |
|
"eval_samples_per_second": 572.204, |
|
"eval_steps_per_second": 9.18, |
|
"step": 2226 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"grad_norm": 3.7243123054504395, |
|
"learning_rate": 3.9000000000000006e-05, |
|
"loss": 0.0942, |
|
"step": 2332 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"eval_LOCATION_f1": 0.7820512820512822, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7027027027027027, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6265060240963856, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8810289389067525, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8509316770186336, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6944444444444444, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.1375378519296646, |
|
"eval_overall_accuracy": 0.9574206251538272, |
|
"eval_overall_f1": 0.8085106382978723, |
|
"eval_overall_precision": 0.7581047381546134, |
|
"eval_overall_recall": 0.8660968660968661, |
|
"eval_runtime": 0.3271, |
|
"eval_samples_per_second": 571.696, |
|
"eval_steps_per_second": 9.172, |
|
"step": 2332 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"grad_norm": 1.6769466400146484, |
|
"learning_rate": 3.85e-05, |
|
"loss": 0.0943, |
|
"step": 2438 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"eval_LOCATION_f1": 0.8104575163398693, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.775, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.76, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6705882352941176, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6944444444444444, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.7945205479452054, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7435897435897436, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.13511058688163757, |
|
"eval_overall_accuracy": 0.9591434900319961, |
|
"eval_overall_f1": 0.8249336870026525, |
|
"eval_overall_precision": 0.771712158808933, |
|
"eval_overall_recall": 0.886039886039886, |
|
"eval_runtime": 0.3273, |
|
"eval_samples_per_second": 571.272, |
|
"eval_steps_per_second": 9.165, |
|
"step": 2438 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"grad_norm": 1.9959501028060913, |
|
"learning_rate": 3.8e-05, |
|
"loss": 0.091, |
|
"step": 2544 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_LOCATION_f1": 0.8050314465408805, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7441860465116279, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7682119205298013, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6744186046511628, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.8753993610223643, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8404907975460123, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7352941176470588, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6410256410256411, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.7837837837837837, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.725, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.14082586765289307, |
|
"eval_overall_accuracy": 0.9579128722618755, |
|
"eval_overall_f1": 0.8183006535947712, |
|
"eval_overall_precision": 0.7560386473429952, |
|
"eval_overall_recall": 0.8917378917378918, |
|
"eval_runtime": 0.3276, |
|
"eval_samples_per_second": 570.878, |
|
"eval_steps_per_second": 9.158, |
|
"step": 2544 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"grad_norm": 2.225444793701172, |
|
"learning_rate": 3.7500000000000003e-05, |
|
"loss": 0.089, |
|
"step": 2650 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_LOCATION_f1": 0.8076923076923077, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7590361445783133, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.7464788732394366, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6883116883116883, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8810289389067525, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8509316770186336, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7246376811594203, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.625, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.1414780169725418, |
|
"eval_overall_accuracy": 0.9584051193699237, |
|
"eval_overall_f1": 0.8186666666666667, |
|
"eval_overall_precision": 0.7694235588972431, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.3266, |
|
"eval_samples_per_second": 572.607, |
|
"eval_steps_per_second": 9.186, |
|
"step": 2650 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"grad_norm": 1.2359886169433594, |
|
"learning_rate": 3.7e-05, |
|
"loss": 0.0862, |
|
"step": 2756 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"eval_LOCATION_f1": 0.7898089171974523, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.7194244604316546, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6756756756756757, |
|
"eval_ORGANIZATION_recall": 0.7692307692307693, |
|
"eval_PERSON_f1": 0.8789808917197452, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8414634146341463, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7142857142857144, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6097560975609756, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.7733333333333334, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7073170731707317, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.14282022416591644, |
|
"eval_overall_accuracy": 0.9561900073837066, |
|
"eval_overall_f1": 0.8052980132450331, |
|
"eval_overall_precision": 0.7524752475247525, |
|
"eval_overall_recall": 0.8660968660968661, |
|
"eval_runtime": 0.3275, |
|
"eval_samples_per_second": 570.999, |
|
"eval_steps_per_second": 9.16, |
|
"step": 2756 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"grad_norm": 1.0968230962753296, |
|
"learning_rate": 3.65e-05, |
|
"loss": 0.0836, |
|
"step": 2862 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"eval_LOCATION_f1": 0.7950310559006212, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7272727272727273, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7323943661971831, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6753246753246753, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8846153846153846, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.676056338028169, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5714285714285714, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.7733333333333334, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7073170731707317, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.14485140144824982, |
|
"eval_overall_accuracy": 0.9556977602756583, |
|
"eval_overall_f1": 0.8068331143232589, |
|
"eval_overall_precision": 0.748780487804878, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.3284, |
|
"eval_samples_per_second": 569.433, |
|
"eval_steps_per_second": 9.135, |
|
"step": 2862 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"grad_norm": 1.7558865547180176, |
|
"learning_rate": 3.6e-05, |
|
"loss": 0.0801, |
|
"step": 2968 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"eval_LOCATION_f1": 0.8104575163398693, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.775, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.7338129496402878, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6891891891891891, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8774193548387097, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.85, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.746268656716418, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.7837837837837837, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.725, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.13724297285079956, |
|
"eval_overall_accuracy": 0.9579128722618755, |
|
"eval_overall_f1": 0.8156123822341856, |
|
"eval_overall_precision": 0.7729591836734694, |
|
"eval_overall_recall": 0.8632478632478633, |
|
"eval_runtime": 0.3346, |
|
"eval_samples_per_second": 558.811, |
|
"eval_steps_per_second": 8.965, |
|
"step": 2968 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"grad_norm": 1.0294597148895264, |
|
"learning_rate": 3.55e-05, |
|
"loss": 0.0779, |
|
"step": 3074 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"eval_LOCATION_f1": 0.7974683544303799, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7411764705882353, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.7682119205298013, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6744186046511628, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.8846153846153846, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6944444444444444, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.7837837837837837, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.725, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.1392383724451065, |
|
"eval_overall_accuracy": 0.958897366477972, |
|
"eval_overall_f1": 0.8236842105263158, |
|
"eval_overall_precision": 0.7652811735941321, |
|
"eval_overall_recall": 0.8917378917378918, |
|
"eval_runtime": 0.3338, |
|
"eval_samples_per_second": 560.248, |
|
"eval_steps_per_second": 8.988, |
|
"step": 3074 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"grad_norm": 1.9617377519607544, |
|
"learning_rate": 3.5e-05, |
|
"loss": 0.0776, |
|
"step": 3180 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"eval_LOCATION_f1": 0.8205128205128205, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7710843373493976, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.725925925925926, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7, |
|
"eval_ORGANIZATION_recall": 0.7538461538461538, |
|
"eval_PERSON_f1": 0.8853503184713376, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8475609756097561, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6944444444444444, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.7945205479452054, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7435897435897436, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.13599379360675812, |
|
"eval_overall_accuracy": 0.9593896135860202, |
|
"eval_overall_f1": 0.8236877523553163, |
|
"eval_overall_precision": 0.7806122448979592, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.332, |
|
"eval_samples_per_second": 563.281, |
|
"eval_steps_per_second": 9.037, |
|
"step": 3180 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"grad_norm": 0.6533139944076538, |
|
"learning_rate": 3.45e-05, |
|
"loss": 0.0764, |
|
"step": 3286 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"eval_LOCATION_f1": 0.8101265822784809, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7529411764705882, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7586206896551724, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6875, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8789808917197452, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8414634146341463, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7246376811594203, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.625, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.7733333333333334, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7073170731707317, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.14058609306812286, |
|
"eval_overall_accuracy": 0.9598818606940684, |
|
"eval_overall_f1": 0.8173455978975033, |
|
"eval_overall_precision": 0.7585365853658537, |
|
"eval_overall_recall": 0.886039886039886, |
|
"eval_runtime": 0.3334, |
|
"eval_samples_per_second": 560.883, |
|
"eval_steps_per_second": 8.998, |
|
"step": 3286 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"grad_norm": 0.820826530456543, |
|
"learning_rate": 3.4000000000000007e-05, |
|
"loss": 0.0745, |
|
"step": 3392 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"eval_LOCATION_f1": 0.7974683544303799, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7411764705882353, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.7567567567567568, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6746987951807228, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6857142857142856, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5853658536585366, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8169014084507041, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7837837837837838, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.1464959979057312, |
|
"eval_overall_accuracy": 0.9576667487078513, |
|
"eval_overall_f1": 0.8157894736842105, |
|
"eval_overall_precision": 0.7579462102689487, |
|
"eval_overall_recall": 0.8831908831908832, |
|
"eval_runtime": 0.3329, |
|
"eval_samples_per_second": 561.647, |
|
"eval_steps_per_second": 9.01, |
|
"step": 3392 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"grad_norm": 0.9249401688575745, |
|
"learning_rate": 3.35e-05, |
|
"loss": 0.0729, |
|
"step": 3498 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"eval_LOCATION_f1": 0.8258064516129032, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7804878048780488, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.72992700729927, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6944444444444444, |
|
"eval_ORGANIZATION_recall": 0.7692307692307693, |
|
"eval_PERSON_f1": 0.8782051282051282, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.845679012345679, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7936507936507937, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.7945205479452054, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7435897435897436, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.13697849214076996, |
|
"eval_overall_accuracy": 0.9606202313561408, |
|
"eval_overall_f1": 0.8243243243243243, |
|
"eval_overall_precision": 0.7840616966580977, |
|
"eval_overall_recall": 0.8689458689458689, |
|
"eval_runtime": 0.3343, |
|
"eval_samples_per_second": 559.37, |
|
"eval_steps_per_second": 8.974, |
|
"step": 3498 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"grad_norm": 3.431596040725708, |
|
"learning_rate": 3.3e-05, |
|
"loss": 0.0719, |
|
"step": 3604 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"eval_LOCATION_f1": 0.8311688311688312, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7901234567901234, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.6814814814814816, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6571428571428571, |
|
"eval_ORGANIZATION_recall": 0.7076923076923077, |
|
"eval_PERSON_f1": 0.8838709677419355, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.85625, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7812500000000001, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.1357881724834442, |
|
"eval_overall_accuracy": 0.9616047255722373, |
|
"eval_overall_f1": 0.819047619047619, |
|
"eval_overall_precision": 0.7838541666666666, |
|
"eval_overall_recall": 0.8575498575498576, |
|
"eval_runtime": 0.3327, |
|
"eval_samples_per_second": 562.136, |
|
"eval_steps_per_second": 9.018, |
|
"step": 3604 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"grad_norm": 0.9399017691612244, |
|
"learning_rate": 3.2500000000000004e-05, |
|
"loss": 0.0746, |
|
"step": 3710 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"eval_LOCATION_f1": 0.8050314465408805, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7441860465116279, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7432432432432433, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6626506024096386, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8789808917197452, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8414634146341463, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7352941176470588, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6410256410256411, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.7733333333333334, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7073170731707317, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.14653536677360535, |
|
"eval_overall_accuracy": 0.9574206251538272, |
|
"eval_overall_f1": 0.8141361256544503, |
|
"eval_overall_precision": 0.7530266343825666, |
|
"eval_overall_recall": 0.886039886039886, |
|
"eval_runtime": 0.3328, |
|
"eval_samples_per_second": 561.886, |
|
"eval_steps_per_second": 9.014, |
|
"step": 3710 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"grad_norm": 0.6335604190826416, |
|
"learning_rate": 3.2000000000000005e-05, |
|
"loss": 0.0676, |
|
"step": 3816 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"eval_LOCATION_f1": 0.8258064516129032, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7804878048780488, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7464788732394366, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6883116883116883, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6944444444444444, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.7837837837837837, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.725, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.13876868784427643, |
|
"eval_overall_accuracy": 0.9603741078021166, |
|
"eval_overall_f1": 0.8251001335113485, |
|
"eval_overall_precision": 0.7763819095477387, |
|
"eval_overall_recall": 0.8803418803418803, |
|
"eval_runtime": 0.3328, |
|
"eval_samples_per_second": 561.873, |
|
"eval_steps_per_second": 9.014, |
|
"step": 3816 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"grad_norm": 1.0286895036697388, |
|
"learning_rate": 3.15e-05, |
|
"loss": 0.0674, |
|
"step": 3922 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"eval_LOCATION_f1": 0.8076923076923077, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7590361445783133, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.7432432432432433, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6626506024096386, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8761904761904761, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8363636363636363, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.716417910447761, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.631578947368421, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.7837837837837837, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.725, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.14836791157722473, |
|
"eval_overall_accuracy": 0.9586512429239479, |
|
"eval_overall_f1": 0.8131578947368421, |
|
"eval_overall_precision": 0.7555012224938875, |
|
"eval_overall_recall": 0.8803418803418803, |
|
"eval_runtime": 0.3338, |
|
"eval_samples_per_second": 560.202, |
|
"eval_steps_per_second": 8.987, |
|
"step": 3922 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"grad_norm": 0.754433274269104, |
|
"learning_rate": 3.1e-05, |
|
"loss": 0.0653, |
|
"step": 4028 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"eval_LOCATION_f1": 0.8205128205128205, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7710843373493976, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.6911764705882353, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6619718309859155, |
|
"eval_ORGANIZATION_recall": 0.7230769230769231, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.716417910447761, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.631578947368421, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.7837837837837837, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.725, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.1401306837797165, |
|
"eval_overall_accuracy": 0.9593896135860202, |
|
"eval_overall_f1": 0.8096514745308312, |
|
"eval_overall_precision": 0.7645569620253164, |
|
"eval_overall_recall": 0.8603988603988604, |
|
"eval_runtime": 0.3326, |
|
"eval_samples_per_second": 562.239, |
|
"eval_steps_per_second": 9.02, |
|
"step": 4028 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"grad_norm": 1.2110971212387085, |
|
"learning_rate": 3.05e-05, |
|
"loss": 0.0638, |
|
"step": 4134 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"eval_LOCATION_f1": 0.8104575163398693, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.775, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.7534246575342466, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6790123456790124, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7575757575757576, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6756756756756757, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.7945205479452054, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7435897435897436, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.1372911036014557, |
|
"eval_overall_accuracy": 0.9608663549101649, |
|
"eval_overall_f1": 0.8229027962716379, |
|
"eval_overall_precision": 0.7725, |
|
"eval_overall_recall": 0.8803418803418803, |
|
"eval_runtime": 0.332, |
|
"eval_samples_per_second": 563.249, |
|
"eval_steps_per_second": 9.036, |
|
"step": 4134 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"grad_norm": 0.7484323382377625, |
|
"learning_rate": 3e-05, |
|
"loss": 0.0641, |
|
"step": 4240 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"eval_LOCATION_f1": 0.7875, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7241379310344828, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.7567567567567568, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6746987951807228, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.879746835443038, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8373493975903614, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.6857142857142856, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5853658536585366, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.7837837837837837, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.725, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.15354810655117035, |
|
"eval_overall_accuracy": 0.9566822544917548, |
|
"eval_overall_f1": 0.8098958333333335, |
|
"eval_overall_precision": 0.7458033573141487, |
|
"eval_overall_recall": 0.886039886039886, |
|
"eval_runtime": 0.3264, |
|
"eval_samples_per_second": 572.882, |
|
"eval_steps_per_second": 9.191, |
|
"step": 4240 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"grad_norm": 0.8354088068008423, |
|
"learning_rate": 2.95e-05, |
|
"loss": 0.0632, |
|
"step": 4346 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"eval_LOCATION_f1": 0.8258064516129032, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7804878048780488, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7801418439716312, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7236842105263158, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7575757575757576, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6756756756756757, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.13777735829353333, |
|
"eval_overall_accuracy": 0.9613586020182131, |
|
"eval_overall_f1": 0.8326639892904953, |
|
"eval_overall_precision": 0.7853535353535354, |
|
"eval_overall_recall": 0.886039886039886, |
|
"eval_runtime": 0.333, |
|
"eval_samples_per_second": 561.553, |
|
"eval_steps_per_second": 9.009, |
|
"step": 4346 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"grad_norm": 0.5027186274528503, |
|
"learning_rate": 2.9e-05, |
|
"loss": 0.0607, |
|
"step": 4452 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"eval_LOCATION_f1": 0.8104575163398693, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.775, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.7464788732394366, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6883116883116883, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8782051282051282, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.845679012345679, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.746268656716418, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.7945205479452054, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7435897435897436, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.1403217911720276, |
|
"eval_overall_accuracy": 0.9606202313561408, |
|
"eval_overall_f1": 0.8192771084337349, |
|
"eval_overall_precision": 0.7727272727272727, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.3336, |
|
"eval_samples_per_second": 560.597, |
|
"eval_steps_per_second": 8.994, |
|
"step": 4452 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"grad_norm": 0.9568884968757629, |
|
"learning_rate": 2.8499999999999998e-05, |
|
"loss": 0.0596, |
|
"step": 4558 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"eval_LOCATION_f1": 0.8311688311688312, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7901234567901234, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7323943661971831, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6753246753246753, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8838709677419355, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.85625, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.746268656716418, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.7945205479452054, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7435897435897436, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.1430799663066864, |
|
"eval_overall_accuracy": 0.9616047255722373, |
|
"eval_overall_f1": 0.8230563002680965, |
|
"eval_overall_precision": 0.7772151898734178, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.3331, |
|
"eval_samples_per_second": 561.433, |
|
"eval_steps_per_second": 9.007, |
|
"step": 4558 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"grad_norm": 5.6017351150512695, |
|
"learning_rate": 2.8000000000000003e-05, |
|
"loss": 0.0582, |
|
"step": 4664 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"eval_LOCATION_f1": 0.8258064516129032, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7804878048780488, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7375886524822695, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6842105263157895, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8853503184713376, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8475609756097561, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.746268656716418, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.7837837837837837, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.725, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.14417453110218048, |
|
"eval_overall_accuracy": 0.961112478464189, |
|
"eval_overall_f1": 0.8229027962716379, |
|
"eval_overall_precision": 0.7725, |
|
"eval_overall_recall": 0.8803418803418803, |
|
"eval_runtime": 0.3257, |
|
"eval_samples_per_second": 574.07, |
|
"eval_steps_per_second": 9.21, |
|
"step": 4664 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"grad_norm": 2.356386184692383, |
|
"learning_rate": 2.7500000000000004e-05, |
|
"loss": 0.0606, |
|
"step": 4770 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"eval_LOCATION_f1": 0.8152866242038217, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7619047619047619, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.763888888888889, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6962025316455697, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.879746835443038, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8373493975903614, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7246376811594203, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.625, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.14679183065891266, |
|
"eval_overall_accuracy": 0.9596357371400444, |
|
"eval_overall_f1": 0.8232189973614775, |
|
"eval_overall_precision": 0.7665847665847666, |
|
"eval_overall_recall": 0.8888888888888888, |
|
"eval_runtime": 0.3259, |
|
"eval_samples_per_second": 573.862, |
|
"eval_steps_per_second": 9.206, |
|
"step": 4770 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"grad_norm": 0.9929021000862122, |
|
"learning_rate": 2.7000000000000002e-05, |
|
"loss": 0.0563, |
|
"step": 4876 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"eval_LOCATION_f1": 0.8311688311688312, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7901234567901234, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7285714285714285, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.68, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8789808917197452, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8414634146341463, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.746268656716418, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.14097212255001068, |
|
"eval_overall_accuracy": 0.9608663549101649, |
|
"eval_overall_f1": 0.8219544846050869, |
|
"eval_overall_precision": 0.7752525252525253, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.333, |
|
"eval_samples_per_second": 561.632, |
|
"eval_steps_per_second": 9.01, |
|
"step": 4876 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"grad_norm": 0.8276335597038269, |
|
"learning_rate": 2.6500000000000004e-05, |
|
"loss": 0.0556, |
|
"step": 4982 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"eval_LOCATION_f1": 0.7974683544303799, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7411764705882353, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.7724137931034483, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.879746835443038, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8373493975903614, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.6857142857142856, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5853658536585366, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.15497690439224243, |
|
"eval_overall_accuracy": 0.9579128722618755, |
|
"eval_overall_f1": 0.8173455978975033, |
|
"eval_overall_precision": 0.7585365853658537, |
|
"eval_overall_recall": 0.886039886039886, |
|
"eval_runtime": 0.3319, |
|
"eval_samples_per_second": 563.4, |
|
"eval_steps_per_second": 9.039, |
|
"step": 4982 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"grad_norm": 2.3347344398498535, |
|
"learning_rate": 2.6000000000000002e-05, |
|
"loss": 0.0578, |
|
"step": 5088 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"eval_LOCATION_f1": 0.8152866242038217, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7619047619047619, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7534246575342466, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6790123456790124, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8825396825396825, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8424242424242424, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.6956521739130435, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.7945205479452054, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7435897435897436, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.1532071828842163, |
|
"eval_overall_accuracy": 0.9576667487078513, |
|
"eval_overall_f1": 0.8184210526315789, |
|
"eval_overall_precision": 0.7603911980440098, |
|
"eval_overall_recall": 0.886039886039886, |
|
"eval_runtime": 0.332, |
|
"eval_samples_per_second": 563.241, |
|
"eval_steps_per_second": 9.036, |
|
"step": 5088 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"grad_norm": 0.38269466161727905, |
|
"learning_rate": 2.5500000000000003e-05, |
|
"loss": 0.0559, |
|
"step": 5194 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"eval_LOCATION_f1": 0.8311688311688312, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7901234567901234, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7428571428571429, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6933333333333334, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8825396825396825, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8424242424242424, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.746268656716418, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.14444759488105774, |
|
"eval_overall_accuracy": 0.9618508491262614, |
|
"eval_overall_f1": 0.8262032085561498, |
|
"eval_overall_precision": 0.7783375314861462, |
|
"eval_overall_recall": 0.8803418803418803, |
|
"eval_runtime": 0.332, |
|
"eval_samples_per_second": 563.256, |
|
"eval_steps_per_second": 9.036, |
|
"step": 5194 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"grad_norm": 1.5551215410232544, |
|
"learning_rate": 2.5e-05, |
|
"loss": 0.0544, |
|
"step": 5300 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"eval_LOCATION_f1": 0.8205128205128205, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7710843373493976, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.757142857142857, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7066666666666667, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8853503184713376, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8475609756097561, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7352941176470588, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6410256410256411, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.1467483639717102, |
|
"eval_overall_accuracy": 0.9608663549101649, |
|
"eval_overall_f1": 0.8266666666666667, |
|
"eval_overall_precision": 0.7769423558897243, |
|
"eval_overall_recall": 0.8831908831908832, |
|
"eval_runtime": 0.3328, |
|
"eval_samples_per_second": 561.888, |
|
"eval_steps_per_second": 9.014, |
|
"step": 5300 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"grad_norm": 1.1728203296661377, |
|
"learning_rate": 2.45e-05, |
|
"loss": 0.0511, |
|
"step": 5406 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"eval_LOCATION_f1": 0.8205128205128205, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7710843373493976, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7246376811594203, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.684931506849315, |
|
"eval_ORGANIZATION_recall": 0.7692307692307693, |
|
"eval_PERSON_f1": 0.8853503184713376, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8475609756097561, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.746268656716418, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.14386440813541412, |
|
"eval_overall_accuracy": 0.9608663549101649, |
|
"eval_overall_f1": 0.8219544846050869, |
|
"eval_overall_precision": 0.7752525252525253, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.3262, |
|
"eval_samples_per_second": 573.233, |
|
"eval_steps_per_second": 9.196, |
|
"step": 5406 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"grad_norm": 1.3139925003051758, |
|
"learning_rate": 2.4e-05, |
|
"loss": 0.0516, |
|
"step": 5512 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"eval_LOCATION_f1": 0.8152866242038217, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7619047619047619, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7567567567567568, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6746987951807228, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8734177215189873, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8313253012048193, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7575757575757576, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6756756756756757, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.15267647802829742, |
|
"eval_overall_accuracy": 0.9596357371400444, |
|
"eval_overall_f1": 0.8221343873517786, |
|
"eval_overall_precision": 0.7647058823529411, |
|
"eval_overall_recall": 0.8888888888888888, |
|
"eval_runtime": 0.3328, |
|
"eval_samples_per_second": 561.953, |
|
"eval_steps_per_second": 9.015, |
|
"step": 5512 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"grad_norm": 1.7045568227767944, |
|
"learning_rate": 2.35e-05, |
|
"loss": 0.0524, |
|
"step": 5618 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"eval_LOCATION_f1": 0.8205128205128205, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7710843373493976, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.75, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6835443037974683, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8742138364779874, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8273809523809523, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7246376811594203, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.625, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.15286701917648315, |
|
"eval_overall_accuracy": 0.9598818606940684, |
|
"eval_overall_f1": 0.8194993412384717, |
|
"eval_overall_precision": 0.7622549019607843, |
|
"eval_overall_recall": 0.886039886039886, |
|
"eval_runtime": 0.3345, |
|
"eval_samples_per_second": 559.086, |
|
"eval_steps_per_second": 8.969, |
|
"step": 5618 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"grad_norm": 2.6849210262298584, |
|
"learning_rate": 2.3000000000000003e-05, |
|
"loss": 0.0513, |
|
"step": 5724 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"eval_LOCATION_f1": 0.8205128205128205, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7710843373493976, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7450980392156863, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6477272727272727, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8789808917197452, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8414634146341463, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7058823529411765, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6153846153846154, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.15772588551044464, |
|
"eval_overall_accuracy": 0.9576667487078513, |
|
"eval_overall_f1": 0.817824377457405, |
|
"eval_overall_precision": 0.7572815533980582, |
|
"eval_overall_recall": 0.8888888888888888, |
|
"eval_runtime": 0.3319, |
|
"eval_samples_per_second": 563.4, |
|
"eval_steps_per_second": 9.039, |
|
"step": 5724 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"grad_norm": 0.8173909783363342, |
|
"learning_rate": 2.25e-05, |
|
"loss": 0.0506, |
|
"step": 5830 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"eval_LOCATION_f1": 0.8235294117647058, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7875, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.7428571428571429, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6933333333333334, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8825396825396825, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8424242424242424, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.716417910447761, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.631578947368421, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.15098540484905243, |
|
"eval_overall_accuracy": 0.9603741078021166, |
|
"eval_overall_f1": 0.8219544846050869, |
|
"eval_overall_precision": 0.7752525252525253, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.3334, |
|
"eval_samples_per_second": 560.961, |
|
"eval_steps_per_second": 8.999, |
|
"step": 5830 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"grad_norm": 1.8647905588150024, |
|
"learning_rate": 2.2000000000000003e-05, |
|
"loss": 0.0511, |
|
"step": 5936 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"eval_LOCATION_f1": 0.8205128205128205, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7710843373493976, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7517730496453899, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6973684210526315, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8825396825396825, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8424242424242424, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.746268656716418, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.14845135807991028, |
|
"eval_overall_accuracy": 0.9606202313561408, |
|
"eval_overall_f1": 0.8255659121171771, |
|
"eval_overall_precision": 0.775, |
|
"eval_overall_recall": 0.8831908831908832, |
|
"eval_runtime": 0.3279, |
|
"eval_samples_per_second": 570.365, |
|
"eval_steps_per_second": 9.15, |
|
"step": 5936 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"grad_norm": 0.22929580509662628, |
|
"learning_rate": 2.15e-05, |
|
"loss": 0.0494, |
|
"step": 6042 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"eval_LOCATION_f1": 0.8181818181818182, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7777777777777778, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.7285714285714285, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.68, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8853503184713376, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8475609756097561, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.746268656716418, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.8169014084507041, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7837837837837838, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.14559510350227356, |
|
"eval_overall_accuracy": 0.9618508491262614, |
|
"eval_overall_f1": 0.8230563002680965, |
|
"eval_overall_precision": 0.7772151898734178, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.3268, |
|
"eval_samples_per_second": 572.194, |
|
"eval_steps_per_second": 9.18, |
|
"step": 6042 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"grad_norm": 0.6386439800262451, |
|
"learning_rate": 2.1e-05, |
|
"loss": 0.0494, |
|
"step": 6148 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"eval_LOCATION_f1": 0.8101265822784809, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7529411764705882, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7391304347826088, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6986301369863014, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.716417910447761, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.631578947368421, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.15255826711654663, |
|
"eval_overall_accuracy": 0.9603741078021166, |
|
"eval_overall_f1": 0.8181818181818181, |
|
"eval_overall_precision": 0.7707808564231738, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.3324, |
|
"eval_samples_per_second": 562.613, |
|
"eval_steps_per_second": 9.026, |
|
"step": 6148 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"grad_norm": 19.432247161865234, |
|
"learning_rate": 2.05e-05, |
|
"loss": 0.0478, |
|
"step": 6254 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"eval_LOCATION_f1": 0.8258064516129032, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7804878048780488, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7432432432432433, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6626506024096386, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6956521739130435, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.1611391305923462, |
|
"eval_overall_accuracy": 0.9586512429239479, |
|
"eval_overall_f1": 0.8190224570673711, |
|
"eval_overall_precision": 0.7635467980295566, |
|
"eval_overall_recall": 0.8831908831908832, |
|
"eval_runtime": 0.3315, |
|
"eval_samples_per_second": 564.041, |
|
"eval_steps_per_second": 9.049, |
|
"step": 6254 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"grad_norm": 2.1011621952056885, |
|
"learning_rate": 2e-05, |
|
"loss": 0.0471, |
|
"step": 6360 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"eval_LOCATION_f1": 0.8311688311688312, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7901234567901234, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7092198581560285, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6578947368421053, |
|
"eval_ORGANIZATION_recall": 0.7692307692307693, |
|
"eval_PERSON_f1": 0.8846153846153846, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.746268656716418, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.8169014084507041, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7837837837837838, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.14900296926498413, |
|
"eval_overall_accuracy": 0.9613586020182131, |
|
"eval_overall_f1": 0.8214765100671142, |
|
"eval_overall_precision": 0.7766497461928934, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.3328, |
|
"eval_samples_per_second": 561.901, |
|
"eval_steps_per_second": 9.014, |
|
"step": 6360 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"grad_norm": 1.5730093717575073, |
|
"learning_rate": 1.9500000000000003e-05, |
|
"loss": 0.0457, |
|
"step": 6466 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"eval_LOCATION_f1": 0.8366013071895425, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.8, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.75, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6835443037974683, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7301587301587301, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6764705882352942, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8285714285714286, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.8055555555555556, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.14521339535713196, |
|
"eval_overall_accuracy": 0.9623430962343096, |
|
"eval_overall_f1": 0.82907133243607, |
|
"eval_overall_precision": 0.7857142857142857, |
|
"eval_overall_recall": 0.8774928774928775, |
|
"eval_runtime": 0.3329, |
|
"eval_samples_per_second": 561.784, |
|
"eval_steps_per_second": 9.013, |
|
"step": 6466 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"grad_norm": 0.7596818208694458, |
|
"learning_rate": 1.9e-05, |
|
"loss": 0.0453, |
|
"step": 6572 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"eval_LOCATION_f1": 0.8129032258064516, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7682926829268293, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.7234042553191491, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6710526315789473, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8846153846153846, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7575757575757576, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6756756756756757, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.1535465270280838, |
|
"eval_overall_accuracy": 0.9608663549101649, |
|
"eval_overall_f1": 0.8203753351206434, |
|
"eval_overall_precision": 0.7746835443037975, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.3263, |
|
"eval_samples_per_second": 573.007, |
|
"eval_steps_per_second": 9.193, |
|
"step": 6572 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"grad_norm": 3.6123743057250977, |
|
"learning_rate": 1.85e-05, |
|
"loss": 0.0439, |
|
"step": 6678 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"eval_LOCATION_f1": 0.8129032258064516, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7682926829268293, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.7297297297297298, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6506024096385542, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8846153846153846, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6944444444444444, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.15502122044563293, |
|
"eval_overall_accuracy": 0.9596357371400444, |
|
"eval_overall_f1": 0.8218085106382977, |
|
"eval_overall_precision": 0.770573566084788, |
|
"eval_overall_recall": 0.8803418803418803, |
|
"eval_runtime": 0.3317, |
|
"eval_samples_per_second": 563.702, |
|
"eval_steps_per_second": 9.043, |
|
"step": 6678 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"grad_norm": 0.6118897199630737, |
|
"learning_rate": 1.8e-05, |
|
"loss": 0.0467, |
|
"step": 6784 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"eval_LOCATION_f1": 0.8289473684210525, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7974683544303798, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6814814814814816, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6571428571428571, |
|
"eval_ORGANIZATION_recall": 0.7076923076923077, |
|
"eval_PERSON_f1": 0.8846153846153846, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7419354838709677, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.696969696969697, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8169014084507041, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7837837837837838, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.14392048120498657, |
|
"eval_overall_accuracy": 0.9613586020182131, |
|
"eval_overall_f1": 0.8169398907103825, |
|
"eval_overall_precision": 0.7847769028871391, |
|
"eval_overall_recall": 0.8518518518518519, |
|
"eval_runtime": 0.3318, |
|
"eval_samples_per_second": 563.555, |
|
"eval_steps_per_second": 9.041, |
|
"step": 6784 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"grad_norm": 1.4808624982833862, |
|
"learning_rate": 1.75e-05, |
|
"loss": 0.0422, |
|
"step": 6890 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"eval_LOCATION_f1": 0.8205128205128205, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7710843373493976, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7448275862068966, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.675, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6956521739130435, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.160318523645401, |
|
"eval_overall_accuracy": 0.9591434900319961, |
|
"eval_overall_f1": 0.8185430463576159, |
|
"eval_overall_precision": 0.7648514851485149, |
|
"eval_overall_recall": 0.8803418803418803, |
|
"eval_runtime": 0.332, |
|
"eval_samples_per_second": 563.291, |
|
"eval_steps_per_second": 9.037, |
|
"step": 6890 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"grad_norm": 1.028084397315979, |
|
"learning_rate": 1.7000000000000003e-05, |
|
"loss": 0.0423, |
|
"step": 6996 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"eval_LOCATION_f1": 0.8152866242038217, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7619047619047619, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.75, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6835443037974683, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7575757575757576, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6756756756756757, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.1588248461484909, |
|
"eval_overall_accuracy": 0.9593896135860202, |
|
"eval_overall_f1": 0.824468085106383, |
|
"eval_overall_precision": 0.773067331670823, |
|
"eval_overall_recall": 0.8831908831908832, |
|
"eval_runtime": 0.3263, |
|
"eval_samples_per_second": 573.167, |
|
"eval_steps_per_second": 9.195, |
|
"step": 6996 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"grad_norm": 1.2602914571762085, |
|
"learning_rate": 1.65e-05, |
|
"loss": 0.0422, |
|
"step": 7102 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"eval_LOCATION_f1": 0.8441558441558442, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.8024691358024691, |
|
"eval_LOCATION_recall": 0.8904109589041096, |
|
"eval_ORGANIZATION_f1": 0.7346938775510204, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6585365853658537, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8846153846153846, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.746268656716418, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.8169014084507041, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7837837837837838, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.15185856819152832, |
|
"eval_overall_accuracy": 0.9623430962343096, |
|
"eval_overall_f1": 0.8282290279627165, |
|
"eval_overall_precision": 0.7775, |
|
"eval_overall_recall": 0.886039886039886, |
|
"eval_runtime": 0.3269, |
|
"eval_samples_per_second": 572.038, |
|
"eval_steps_per_second": 9.177, |
|
"step": 7102 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"grad_norm": 0.7608669996261597, |
|
"learning_rate": 1.6000000000000003e-05, |
|
"loss": 0.0416, |
|
"step": 7208 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"eval_LOCATION_f1": 0.8258064516129032, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7804878048780488, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7448275862068966, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.675, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8846153846153846, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7352941176470588, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6410256410256411, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.15464389324188232, |
|
"eval_overall_accuracy": 0.9616047255722373, |
|
"eval_overall_f1": 0.824468085106383, |
|
"eval_overall_precision": 0.773067331670823, |
|
"eval_overall_recall": 0.8831908831908832, |
|
"eval_runtime": 0.332, |
|
"eval_samples_per_second": 563.246, |
|
"eval_steps_per_second": 9.036, |
|
"step": 7208 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"grad_norm": 1.0217771530151367, |
|
"learning_rate": 1.55e-05, |
|
"loss": 0.0403, |
|
"step": 7314 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"eval_LOCATION_f1": 0.8235294117647058, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7875, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.7448275862068966, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.675, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.75, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6857142857142857, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.1511322259902954, |
|
"eval_overall_accuracy": 0.9618508491262614, |
|
"eval_overall_f1": 0.824631860776439, |
|
"eval_overall_precision": 0.7777777777777778, |
|
"eval_overall_recall": 0.8774928774928775, |
|
"eval_runtime": 0.3329, |
|
"eval_samples_per_second": 561.81, |
|
"eval_steps_per_second": 9.013, |
|
"step": 7314 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"grad_norm": 1.7045354843139648, |
|
"learning_rate": 1.5e-05, |
|
"loss": 0.0411, |
|
"step": 7420 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"eval_LOCATION_f1": 0.8258064516129032, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7804878048780488, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7346938775510204, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6585365853658537, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.746268656716418, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.15936115384101868, |
|
"eval_overall_accuracy": 0.9598818606940684, |
|
"eval_overall_f1": 0.8222811671087533, |
|
"eval_overall_precision": 0.7692307692307693, |
|
"eval_overall_recall": 0.8831908831908832, |
|
"eval_runtime": 0.3338, |
|
"eval_samples_per_second": 560.176, |
|
"eval_steps_per_second": 8.987, |
|
"step": 7420 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"grad_norm": 1.8637417554855347, |
|
"learning_rate": 1.45e-05, |
|
"loss": 0.0391, |
|
"step": 7526 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"eval_LOCATION_f1": 0.8152866242038217, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7619047619047619, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7225806451612903, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6222222222222222, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7352941176470588, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6410256410256411, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.17168858647346497, |
|
"eval_overall_accuracy": 0.9561900073837066, |
|
"eval_overall_f1": 0.8156862745098039, |
|
"eval_overall_precision": 0.7536231884057971, |
|
"eval_overall_recall": 0.8888888888888888, |
|
"eval_runtime": 0.332, |
|
"eval_samples_per_second": 563.182, |
|
"eval_steps_per_second": 9.035, |
|
"step": 7526 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"grad_norm": 1.0552111864089966, |
|
"learning_rate": 1.4000000000000001e-05, |
|
"loss": 0.0393, |
|
"step": 7632 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"eval_LOCATION_f1": 0.8101265822784809, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7529411764705882, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7397260273972603, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8789808917197452, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8414634146341463, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.746268656716418, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.16536851227283478, |
|
"eval_overall_accuracy": 0.9584051193699237, |
|
"eval_overall_f1": 0.8190224570673711, |
|
"eval_overall_precision": 0.7635467980295566, |
|
"eval_overall_recall": 0.8831908831908832, |
|
"eval_runtime": 0.3264, |
|
"eval_samples_per_second": 572.834, |
|
"eval_steps_per_second": 9.19, |
|
"step": 7632 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"grad_norm": 0.6572228670120239, |
|
"learning_rate": 1.3500000000000001e-05, |
|
"loss": 0.0411, |
|
"step": 7738 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"eval_LOCATION_f1": 0.8258064516129032, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7804878048780488, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7323943661971831, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6753246753246753, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.746268656716418, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.15696407854557037, |
|
"eval_overall_accuracy": 0.9608663549101649, |
|
"eval_overall_f1": 0.822429906542056, |
|
"eval_overall_precision": 0.7738693467336684, |
|
"eval_overall_recall": 0.8774928774928775, |
|
"eval_runtime": 0.3332, |
|
"eval_samples_per_second": 561.214, |
|
"eval_steps_per_second": 9.003, |
|
"step": 7738 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"grad_norm": 0.9044064283370972, |
|
"learning_rate": 1.3000000000000001e-05, |
|
"loss": 0.0408, |
|
"step": 7844 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"eval_LOCATION_f1": 0.8205128205128205, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7710843373493976, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7323943661971831, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6753246753246753, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8853503184713376, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8475609756097561, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.746268656716418, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.8169014084507041, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7837837837837838, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.1582627296447754, |
|
"eval_overall_accuracy": 0.9613586020182131, |
|
"eval_overall_f1": 0.824, |
|
"eval_overall_precision": 0.7744360902255639, |
|
"eval_overall_recall": 0.8803418803418803, |
|
"eval_runtime": 0.3319, |
|
"eval_samples_per_second": 563.385, |
|
"eval_steps_per_second": 9.038, |
|
"step": 7844 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"grad_norm": 0.5799534916877747, |
|
"learning_rate": 1.25e-05, |
|
"loss": 0.0389, |
|
"step": 7950 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"eval_LOCATION_f1": 0.8258064516129032, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7804878048780488, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7310344827586207, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6625, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7058823529411765, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6153846153846154, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.16305667161941528, |
|
"eval_overall_accuracy": 0.9591434900319961, |
|
"eval_overall_f1": 0.8180610889774236, |
|
"eval_overall_precision": 0.7661691542288557, |
|
"eval_overall_recall": 0.8774928774928775, |
|
"eval_runtime": 0.3349, |
|
"eval_samples_per_second": 558.344, |
|
"eval_steps_per_second": 8.957, |
|
"step": 7950 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"grad_norm": 1.983021855354309, |
|
"learning_rate": 1.2e-05, |
|
"loss": 0.0377, |
|
"step": 8056 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"eval_LOCATION_f1": 0.8258064516129032, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7804878048780488, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7346938775510204, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6585365853658537, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8846153846153846, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.716417910447761, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.631578947368421, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.15857818722724915, |
|
"eval_overall_accuracy": 0.9613586020182131, |
|
"eval_overall_f1": 0.8207171314741036, |
|
"eval_overall_precision": 0.7686567164179104, |
|
"eval_overall_recall": 0.8803418803418803, |
|
"eval_runtime": 0.3261, |
|
"eval_samples_per_second": 573.446, |
|
"eval_steps_per_second": 9.2, |
|
"step": 8056 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"grad_norm": 1.1891909837722778, |
|
"learning_rate": 1.1500000000000002e-05, |
|
"loss": 0.0404, |
|
"step": 8162 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"eval_LOCATION_f1": 0.8258064516129032, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7804878048780488, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7346938775510204, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6585365853658537, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7272727272727273, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6486486486486487, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.16166049242019653, |
|
"eval_overall_accuracy": 0.9601279842480925, |
|
"eval_overall_f1": 0.8207171314741036, |
|
"eval_overall_precision": 0.7686567164179104, |
|
"eval_overall_recall": 0.8803418803418803, |
|
"eval_runtime": 0.3315, |
|
"eval_samples_per_second": 564.102, |
|
"eval_steps_per_second": 9.05, |
|
"step": 8162 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"grad_norm": 0.46722444891929626, |
|
"learning_rate": 1.1000000000000001e-05, |
|
"loss": 0.0388, |
|
"step": 8268 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"eval_LOCATION_f1": 0.8258064516129032, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7804878048780488, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7310344827586207, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6625, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8846153846153846, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7384615384615385, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8169014084507041, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7837837837837838, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.16035309433937073, |
|
"eval_overall_accuracy": 0.9618508491262614, |
|
"eval_overall_f1": 0.823529411764706, |
|
"eval_overall_precision": 0.7758186397984886, |
|
"eval_overall_recall": 0.8774928774928775, |
|
"eval_runtime": 0.3324, |
|
"eval_samples_per_second": 562.645, |
|
"eval_steps_per_second": 9.026, |
|
"step": 8268 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"grad_norm": 0.8686147332191467, |
|
"learning_rate": 1.05e-05, |
|
"loss": 0.0383, |
|
"step": 8374 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"eval_LOCATION_f1": 0.8258064516129032, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7804878048780488, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7183098591549296, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6623376623376623, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7384615384615385, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.16000543534755707, |
|
"eval_overall_accuracy": 0.961112478464189, |
|
"eval_overall_f1": 0.8192771084337349, |
|
"eval_overall_precision": 0.7727272727272727, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.3327, |
|
"eval_samples_per_second": 561.998, |
|
"eval_steps_per_second": 9.016, |
|
"step": 8374 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"grad_norm": 0.674788773059845, |
|
"learning_rate": 1e-05, |
|
"loss": 0.0382, |
|
"step": 8480 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"eval_LOCATION_f1": 0.8258064516129032, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7804878048780488, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7297297297297298, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6506024096385542, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.696969696969697, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6216216216216216, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.16522908210754395, |
|
"eval_overall_accuracy": 0.9596357371400444, |
|
"eval_overall_f1": 0.8169761273209548, |
|
"eval_overall_precision": 0.7642679900744417, |
|
"eval_overall_recall": 0.8774928774928775, |
|
"eval_runtime": 0.3342, |
|
"eval_samples_per_second": 559.61, |
|
"eval_steps_per_second": 8.978, |
|
"step": 8480 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"grad_norm": 1.6788341999053955, |
|
"learning_rate": 9.5e-06, |
|
"loss": 0.0378, |
|
"step": 8586 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"eval_LOCATION_f1": 0.8101265822784809, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7529411764705882, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7297297297297298, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6506024096385542, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8846153846153846, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7058823529411765, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6153846153846154, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.17060095071792603, |
|
"eval_overall_accuracy": 0.9591434900319961, |
|
"eval_overall_f1": 0.8153034300791556, |
|
"eval_overall_precision": 0.7592137592137592, |
|
"eval_overall_recall": 0.8803418803418803, |
|
"eval_runtime": 0.3359, |
|
"eval_samples_per_second": 556.794, |
|
"eval_steps_per_second": 8.933, |
|
"step": 8586 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"grad_norm": 0.7395833730697632, |
|
"learning_rate": 9e-06, |
|
"loss": 0.039, |
|
"step": 8692 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"eval_LOCATION_f1": 0.8101265822784809, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7529411764705882, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7448275862068966, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.675, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7272727272727273, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6486486486486487, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.16823621094226837, |
|
"eval_overall_accuracy": 0.9598818606940684, |
|
"eval_overall_f1": 0.8196286472148541, |
|
"eval_overall_precision": 0.7667493796526055, |
|
"eval_overall_recall": 0.8803418803418803, |
|
"eval_runtime": 0.3356, |
|
"eval_samples_per_second": 557.222, |
|
"eval_steps_per_second": 8.939, |
|
"step": 8692 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"grad_norm": 0.7045236229896545, |
|
"learning_rate": 8.500000000000002e-06, |
|
"loss": 0.0372, |
|
"step": 8798 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"eval_LOCATION_f1": 0.8258064516129032, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7804878048780488, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.6944444444444444, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6329113924050633, |
|
"eval_ORGANIZATION_recall": 0.7692307692307693, |
|
"eval_PERSON_f1": 0.8726114649681529, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8353658536585366, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7272727272727273, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6486486486486487, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.16675511002540588, |
|
"eval_overall_accuracy": 0.958897366477972, |
|
"eval_overall_f1": 0.8095872170439414, |
|
"eval_overall_precision": 0.76, |
|
"eval_overall_recall": 0.8660968660968661, |
|
"eval_runtime": 0.3326, |
|
"eval_samples_per_second": 562.306, |
|
"eval_steps_per_second": 9.021, |
|
"step": 8798 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"grad_norm": 2.7517426013946533, |
|
"learning_rate": 8.000000000000001e-06, |
|
"loss": 0.0368, |
|
"step": 8904 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"eval_LOCATION_f1": 0.8205128205128205, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7710843373493976, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7346938775510204, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6585365853658537, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.746268656716418, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.1667993813753128, |
|
"eval_overall_accuracy": 0.9598818606940684, |
|
"eval_overall_f1": 0.8211920529801325, |
|
"eval_overall_precision": 0.7673267326732673, |
|
"eval_overall_recall": 0.8831908831908832, |
|
"eval_runtime": 0.3328, |
|
"eval_samples_per_second": 561.958, |
|
"eval_steps_per_second": 9.015, |
|
"step": 8904 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"grad_norm": 2.215299606323242, |
|
"learning_rate": 7.5e-06, |
|
"loss": 0.0374, |
|
"step": 9010 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"eval_LOCATION_f1": 0.8258064516129032, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7804878048780488, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7194244604316546, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6756756756756757, |
|
"eval_ORGANIZATION_recall": 0.7692307692307693, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.716417910447761, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.631578947368421, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.16433657705783844, |
|
"eval_overall_accuracy": 0.9606202313561408, |
|
"eval_overall_f1": 0.8176943699731903, |
|
"eval_overall_precision": 0.7721518987341772, |
|
"eval_overall_recall": 0.8689458689458689, |
|
"eval_runtime": 0.3273, |
|
"eval_samples_per_second": 571.286, |
|
"eval_steps_per_second": 9.165, |
|
"step": 9010 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"grad_norm": 0.40606042742729187, |
|
"learning_rate": 7.000000000000001e-06, |
|
"loss": 0.0369, |
|
"step": 9116 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"eval_LOCATION_f1": 0.8205128205128205, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7710843373493976, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7083333333333334, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6455696202531646, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7352941176470588, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6410256410256411, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.1689991056919098, |
|
"eval_overall_accuracy": 0.9584051193699237, |
|
"eval_overall_f1": 0.8154050464807436, |
|
"eval_overall_precision": 0.763681592039801, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.3328, |
|
"eval_samples_per_second": 561.979, |
|
"eval_steps_per_second": 9.016, |
|
"step": 9116 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"grad_norm": 1.3081475496292114, |
|
"learning_rate": 6.5000000000000004e-06, |
|
"loss": 0.036, |
|
"step": 9222 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"eval_LOCATION_f1": 0.8258064516129032, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7804878048780488, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7132867132867133, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6538461538461539, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7272727272727273, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6486486486486487, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.16559894382953644, |
|
"eval_overall_accuracy": 0.9596357371400444, |
|
"eval_overall_f1": 0.8170894526034712, |
|
"eval_overall_precision": 0.7688442211055276, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.3315, |
|
"eval_samples_per_second": 564.057, |
|
"eval_steps_per_second": 9.049, |
|
"step": 9222 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"grad_norm": 0.7401718497276306, |
|
"learning_rate": 6e-06, |
|
"loss": 0.037, |
|
"step": 9328 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"eval_LOCATION_f1": 0.8258064516129032, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7804878048780488, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7132867132867133, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6538461538461539, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7272727272727273, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6486486486486487, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.16509054601192474, |
|
"eval_overall_accuracy": 0.9603741078021166, |
|
"eval_overall_f1": 0.8170894526034712, |
|
"eval_overall_precision": 0.7688442211055276, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.3322, |
|
"eval_samples_per_second": 562.977, |
|
"eval_steps_per_second": 9.032, |
|
"step": 9328 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"grad_norm": 0.570732057094574, |
|
"learning_rate": 5.500000000000001e-06, |
|
"loss": 0.0373, |
|
"step": 9434 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"eval_LOCATION_f1": 0.8258064516129032, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7804878048780488, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7172413793103448, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.65, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.716417910447761, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.631578947368421, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.16918015480041504, |
|
"eval_overall_accuracy": 0.9593896135860202, |
|
"eval_overall_f1": 0.8164893617021275, |
|
"eval_overall_precision": 0.7655860349127181, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.3273, |
|
"eval_samples_per_second": 571.287, |
|
"eval_steps_per_second": 9.165, |
|
"step": 9434 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"grad_norm": 1.0674538612365723, |
|
"learning_rate": 5e-06, |
|
"loss": 0.0357, |
|
"step": 9540 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"eval_LOCATION_f1": 0.8258064516129032, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7804878048780488, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7092198581560285, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6578947368421053, |
|
"eval_ORGANIZATION_recall": 0.7692307692307693, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.716417910447761, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.631578947368421, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.16437728703022003, |
|
"eval_overall_accuracy": 0.9603741078021166, |
|
"eval_overall_f1": 0.8155080213903743, |
|
"eval_overall_precision": 0.7682619647355163, |
|
"eval_overall_recall": 0.8689458689458689, |
|
"eval_runtime": 0.327, |
|
"eval_samples_per_second": 571.778, |
|
"eval_steps_per_second": 9.173, |
|
"step": 9540 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"grad_norm": 0.779975414276123, |
|
"learning_rate": 4.5e-06, |
|
"loss": 0.0365, |
|
"step": 9646 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"eval_LOCATION_f1": 0.8205128205128205, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7710843373493976, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7346938775510204, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6585365853658537, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.746268656716418, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.1706375926733017, |
|
"eval_overall_accuracy": 0.9596357371400444, |
|
"eval_overall_f1": 0.8211920529801325, |
|
"eval_overall_precision": 0.7673267326732673, |
|
"eval_overall_recall": 0.8831908831908832, |
|
"eval_runtime": 0.3328, |
|
"eval_samples_per_second": 561.858, |
|
"eval_steps_per_second": 9.014, |
|
"step": 9646 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"grad_norm": 1.6607707738876343, |
|
"learning_rate": 4.000000000000001e-06, |
|
"loss": 0.0358, |
|
"step": 9752 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"eval_LOCATION_f1": 0.8205128205128205, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7710843373493976, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7210884353741497, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6463414634146342, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.716417910447761, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.631578947368421, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.16552191972732544, |
|
"eval_overall_accuracy": 0.9606202313561408, |
|
"eval_overall_f1": 0.8158940397350993, |
|
"eval_overall_precision": 0.7623762376237624, |
|
"eval_overall_recall": 0.8774928774928775, |
|
"eval_runtime": 0.3345, |
|
"eval_samples_per_second": 559.095, |
|
"eval_steps_per_second": 8.969, |
|
"step": 9752 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"grad_norm": 0.364473819732666, |
|
"learning_rate": 3.5000000000000004e-06, |
|
"loss": 0.0367, |
|
"step": 9858 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"eval_LOCATION_f1": 0.8152866242038217, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7619047619047619, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7272727272727272, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.716417910447761, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.631578947368421, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.16641728579998016, |
|
"eval_overall_accuracy": 0.9593896135860202, |
|
"eval_overall_f1": 0.8164893617021275, |
|
"eval_overall_precision": 0.7655860349127181, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.3264, |
|
"eval_samples_per_second": 572.903, |
|
"eval_steps_per_second": 9.191, |
|
"step": 9858 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"grad_norm": 1.1335537433624268, |
|
"learning_rate": 3e-06, |
|
"loss": 0.0367, |
|
"step": 9964 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"eval_LOCATION_f1": 0.8076923076923077, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7590361445783133, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.7123287671232877, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6419753086419753, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.716417910447761, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.631578947368421, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.16745708882808685, |
|
"eval_overall_accuracy": 0.958897366477972, |
|
"eval_overall_f1": 0.8116710875331565, |
|
"eval_overall_precision": 0.7593052109181141, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.3331, |
|
"eval_samples_per_second": 561.459, |
|
"eval_steps_per_second": 9.007, |
|
"step": 9964 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"grad_norm": 2.660787582397461, |
|
"learning_rate": 2.5e-06, |
|
"loss": 0.0358, |
|
"step": 10070 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"eval_LOCATION_f1": 0.8076923076923077, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7590361445783133, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.7346938775510204, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6585365853658537, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7058823529411765, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6153846153846154, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.17253383994102478, |
|
"eval_overall_accuracy": 0.9591434900319961, |
|
"eval_overall_f1": 0.8148148148148149, |
|
"eval_overall_precision": 0.7604938271604939, |
|
"eval_overall_recall": 0.8774928774928775, |
|
"eval_runtime": 0.3324, |
|
"eval_samples_per_second": 562.55, |
|
"eval_steps_per_second": 9.025, |
|
"step": 10070 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"grad_norm": 1.2606465816497803, |
|
"learning_rate": 2.0000000000000003e-06, |
|
"loss": 0.0374, |
|
"step": 10176 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"eval_LOCATION_f1": 0.8152866242038217, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7619047619047619, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7123287671232877, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6419753086419753, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.746268656716418, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.1706884801387787, |
|
"eval_overall_accuracy": 0.9593896135860202, |
|
"eval_overall_f1": 0.8158940397350993, |
|
"eval_overall_precision": 0.7623762376237624, |
|
"eval_overall_recall": 0.8774928774928775, |
|
"eval_runtime": 0.3336, |
|
"eval_samples_per_second": 560.539, |
|
"eval_steps_per_second": 8.993, |
|
"step": 10176 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"grad_norm": 2.224013090133667, |
|
"learning_rate": 1.5e-06, |
|
"loss": 0.0342, |
|
"step": 10282 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"eval_LOCATION_f1": 0.8205128205128205, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7710843373493976, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7132867132867133, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6538461538461539, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.716417910447761, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.631578947368421, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.16819004714488983, |
|
"eval_overall_accuracy": 0.9593896135860202, |
|
"eval_overall_f1": 0.8149134487350199, |
|
"eval_overall_precision": 0.765, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.3327, |
|
"eval_samples_per_second": 562.071, |
|
"eval_steps_per_second": 9.017, |
|
"step": 10282 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"grad_norm": 1.7407749891281128, |
|
"learning_rate": 1.0000000000000002e-06, |
|
"loss": 0.0351, |
|
"step": 10388 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"eval_LOCATION_f1": 0.8205128205128205, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7710843373493976, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.7234042553191491, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6710526315789473, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.716417910447761, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.631578947368421, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.16785794496536255, |
|
"eval_overall_accuracy": 0.9593896135860202, |
|
"eval_overall_f1": 0.8170894526034712, |
|
"eval_overall_precision": 0.7688442211055276, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.333, |
|
"eval_samples_per_second": 561.612, |
|
"eval_steps_per_second": 9.01, |
|
"step": 10388 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"grad_norm": 0.9356883764266968, |
|
"learning_rate": 5.000000000000001e-07, |
|
"loss": 0.036, |
|
"step": 10494 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"eval_LOCATION_f1": 0.8152866242038217, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7619047619047619, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.6993006993006994, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6410256410256411, |
|
"eval_ORGANIZATION_recall": 0.7692307692307693, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.716417910447761, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.631578947368421, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.1689637303352356, |
|
"eval_overall_accuracy": 0.9586512429239479, |
|
"eval_overall_f1": 0.8111702127659575, |
|
"eval_overall_precision": 0.7605985037406484, |
|
"eval_overall_recall": 0.8689458689458689, |
|
"eval_runtime": 0.3253, |
|
"eval_samples_per_second": 574.83, |
|
"eval_steps_per_second": 9.222, |
|
"step": 10494 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"grad_norm": 0.6478390693664551, |
|
"learning_rate": 0.0, |
|
"loss": 0.0368, |
|
"step": 10600 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"eval_LOCATION_f1": 0.8152866242038217, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7619047619047619, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.6993006993006994, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6410256410256411, |
|
"eval_ORGANIZATION_recall": 0.7692307692307693, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.716417910447761, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.631578947368421, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8055555555555555, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7631578947368421, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.16865810751914978, |
|
"eval_overall_accuracy": 0.9586512429239479, |
|
"eval_overall_f1": 0.8111702127659575, |
|
"eval_overall_precision": 0.7605985037406484, |
|
"eval_overall_recall": 0.8689458689458689, |
|
"eval_runtime": 0.3331, |
|
"eval_samples_per_second": 561.343, |
|
"eval_steps_per_second": 9.006, |
|
"step": 10600 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"step": 10600, |
|
"total_flos": 4567780799240064.0, |
|
"train_loss": 0.08414012978661735, |
|
"train_runtime": 604.7606, |
|
"train_samples_per_second": 279.119, |
|
"train_steps_per_second": 17.528 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 10600, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 100, |
|
"save_steps": 500, |
|
"total_flos": 4567780799240064.0, |
|
"train_batch_size": 16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|