|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 100.0, |
|
"eval_steps": 500, |
|
"global_step": 9600, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"grad_norm": 7.524846076965332, |
|
"learning_rate": 4.9500000000000004e-05, |
|
"loss": 0.2442, |
|
"step": 96 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_LOCATION_f1": 0.8972972972972972, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8383838383838383, |
|
"eval_LOCATION_recall": 0.9651162790697675, |
|
"eval_ORGANIZATION_f1": 0.898936170212766, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.8535353535353535, |
|
"eval_ORGANIZATION_recall": 0.949438202247191, |
|
"eval_PERSON_f1": 0.9727626459143969, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9689922480620154, |
|
"eval_PERSON_recall": 0.9765625, |
|
"eval_loss": 0.05805998295545578, |
|
"eval_overall_accuracy": 0.9821862348178138, |
|
"eval_overall_f1": 0.9217603911980441, |
|
"eval_overall_precision": 0.8849765258215962, |
|
"eval_overall_recall": 0.9617346938775511, |
|
"eval_runtime": 0.2705, |
|
"eval_samples_per_second": 628.537, |
|
"eval_steps_per_second": 11.092, |
|
"step": 96 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"grad_norm": 2.2480790615081787, |
|
"learning_rate": 4.9e-05, |
|
"loss": 0.0581, |
|
"step": 192 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_LOCATION_f1": 0.8864864864864866, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8282828282828283, |
|
"eval_LOCATION_recall": 0.9534883720930233, |
|
"eval_ORGANIZATION_f1": 0.9190751445086704, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9464285714285714, |
|
"eval_ORGANIZATION_recall": 0.8932584269662921, |
|
"eval_PERSON_f1": 0.9727626459143969, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9689922480620154, |
|
"eval_PERSON_recall": 0.9765625, |
|
"eval_loss": 0.05479570850729942, |
|
"eval_overall_accuracy": 0.9851551956815114, |
|
"eval_overall_f1": 0.9289340101522842, |
|
"eval_overall_precision": 0.9242424242424242, |
|
"eval_overall_recall": 0.9336734693877551, |
|
"eval_runtime": 0.2786, |
|
"eval_samples_per_second": 610.099, |
|
"eval_steps_per_second": 10.766, |
|
"step": 192 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"grad_norm": 0.7553579807281494, |
|
"learning_rate": 4.85e-05, |
|
"loss": 0.0357, |
|
"step": 288 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_LOCATION_f1": 0.9010989010989011, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8541666666666666, |
|
"eval_LOCATION_recall": 0.9534883720930233, |
|
"eval_ORGANIZATION_f1": 0.9204545454545454, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9310344827586207, |
|
"eval_ORGANIZATION_recall": 0.9101123595505618, |
|
"eval_PERSON_f1": 0.9763779527559054, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9841269841269841, |
|
"eval_PERSON_recall": 0.96875, |
|
"eval_loss": 0.05141273885965347, |
|
"eval_overall_accuracy": 0.9856950067476383, |
|
"eval_overall_f1": 0.934010152284264, |
|
"eval_overall_precision": 0.9292929292929293, |
|
"eval_overall_recall": 0.9387755102040817, |
|
"eval_runtime": 0.2743, |
|
"eval_samples_per_second": 619.871, |
|
"eval_steps_per_second": 10.939, |
|
"step": 288 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"grad_norm": 2.5006167888641357, |
|
"learning_rate": 4.8e-05, |
|
"loss": 0.0251, |
|
"step": 384 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_LOCATION_f1": 0.9142857142857143, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.898876404494382, |
|
"eval_LOCATION_recall": 0.9302325581395349, |
|
"eval_ORGANIZATION_f1": 0.9209809264305177, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.8941798941798942, |
|
"eval_ORGANIZATION_recall": 0.949438202247191, |
|
"eval_PERSON_f1": 0.9641434262948206, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.983739837398374, |
|
"eval_PERSON_recall": 0.9453125, |
|
"eval_loss": 0.06069042533636093, |
|
"eval_overall_accuracy": 0.9851551956815114, |
|
"eval_overall_f1": 0.9331651954602775, |
|
"eval_overall_precision": 0.9226932668329177, |
|
"eval_overall_recall": 0.9438775510204082, |
|
"eval_runtime": 0.2776, |
|
"eval_samples_per_second": 612.329, |
|
"eval_steps_per_second": 10.806, |
|
"step": 384 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"grad_norm": 0.45395660400390625, |
|
"learning_rate": 4.75e-05, |
|
"loss": 0.0146, |
|
"step": 480 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_LOCATION_f1": 0.9101123595505618, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8804347826086957, |
|
"eval_LOCATION_recall": 0.9418604651162791, |
|
"eval_ORGANIZATION_f1": 0.9333333333333335, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9230769230769231, |
|
"eval_ORGANIZATION_recall": 0.9438202247191011, |
|
"eval_PERSON_f1": 0.9644268774703557, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.976, |
|
"eval_PERSON_recall": 0.953125, |
|
"eval_loss": 0.06169137358665466, |
|
"eval_overall_accuracy": 0.9865047233468286, |
|
"eval_overall_f1": 0.9380530973451328, |
|
"eval_overall_precision": 0.9298245614035088, |
|
"eval_overall_recall": 0.9464285714285714, |
|
"eval_runtime": 0.2738, |
|
"eval_samples_per_second": 620.856, |
|
"eval_steps_per_second": 10.956, |
|
"step": 480 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"grad_norm": 0.7863659262657166, |
|
"learning_rate": 4.7e-05, |
|
"loss": 0.0117, |
|
"step": 576 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_LOCATION_f1": 0.888888888888889, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.851063829787234, |
|
"eval_LOCATION_recall": 0.9302325581395349, |
|
"eval_ORGANIZATION_f1": 0.9166666666666666, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9065934065934066, |
|
"eval_ORGANIZATION_recall": 0.9269662921348315, |
|
"eval_PERSON_f1": 0.9603174603174603, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9758064516129032, |
|
"eval_PERSON_recall": 0.9453125, |
|
"eval_loss": 0.0706215351819992, |
|
"eval_overall_accuracy": 0.9856950067476383, |
|
"eval_overall_f1": 0.9242424242424242, |
|
"eval_overall_precision": 0.915, |
|
"eval_overall_recall": 0.9336734693877551, |
|
"eval_runtime": 0.28, |
|
"eval_samples_per_second": 607.104, |
|
"eval_steps_per_second": 10.714, |
|
"step": 576 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"grad_norm": 0.042494997382164, |
|
"learning_rate": 4.6500000000000005e-05, |
|
"loss": 0.0083, |
|
"step": 672 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_LOCATION_f1": 0.8526315789473684, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.7788461538461539, |
|
"eval_LOCATION_recall": 0.9418604651162791, |
|
"eval_ORGANIZATION_f1": 0.9187675070028011, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9162011173184358, |
|
"eval_ORGANIZATION_recall": 0.9213483146067416, |
|
"eval_PERSON_f1": 0.9534883720930233, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9461538461538461, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.0925956517457962, |
|
"eval_overall_accuracy": 0.9819163292847504, |
|
"eval_overall_f1": 0.9142857142857143, |
|
"eval_overall_precision": 0.8910411622276029, |
|
"eval_overall_recall": 0.9387755102040817, |
|
"eval_runtime": 0.2741, |
|
"eval_samples_per_second": 620.296, |
|
"eval_steps_per_second": 10.946, |
|
"step": 672 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"grad_norm": 0.1783752143383026, |
|
"learning_rate": 4.600000000000001e-05, |
|
"loss": 0.008, |
|
"step": 768 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_LOCATION_f1": 0.8999999999999999, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8617021276595744, |
|
"eval_LOCATION_recall": 0.9418604651162791, |
|
"eval_ORGANIZATION_f1": 0.9371428571428573, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9534883720930233, |
|
"eval_ORGANIZATION_recall": 0.9213483146067416, |
|
"eval_PERSON_f1": 0.9723320158102766, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.984, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.07805542647838593, |
|
"eval_overall_accuracy": 0.9856950067476383, |
|
"eval_overall_f1": 0.9399744572158366, |
|
"eval_overall_precision": 0.9411764705882353, |
|
"eval_overall_recall": 0.9387755102040817, |
|
"eval_runtime": 0.2886, |
|
"eval_samples_per_second": 589.03, |
|
"eval_steps_per_second": 10.395, |
|
"step": 768 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"grad_norm": 0.3219904899597168, |
|
"learning_rate": 4.55e-05, |
|
"loss": 0.0042, |
|
"step": 864 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_LOCATION_f1": 0.8914285714285715, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8764044943820225, |
|
"eval_LOCATION_recall": 0.9069767441860465, |
|
"eval_ORGANIZATION_f1": 0.9662921348314607, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9662921348314607, |
|
"eval_ORGANIZATION_recall": 0.9662921348314607, |
|
"eval_PERSON_f1": 0.9725490196078432, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9763779527559056, |
|
"eval_PERSON_recall": 0.96875, |
|
"eval_loss": 0.06586796045303345, |
|
"eval_overall_accuracy": 0.9889338731443995, |
|
"eval_overall_f1": 0.9516539440203563, |
|
"eval_overall_precision": 0.949238578680203, |
|
"eval_overall_recall": 0.9540816326530612, |
|
"eval_runtime": 0.2757, |
|
"eval_samples_per_second": 616.613, |
|
"eval_steps_per_second": 10.881, |
|
"step": 864 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"grad_norm": 0.016961606219410896, |
|
"learning_rate": 4.5e-05, |
|
"loss": 0.0044, |
|
"step": 960 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_LOCATION_f1": 0.8926553672316384, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8681318681318682, |
|
"eval_LOCATION_recall": 0.9186046511627907, |
|
"eval_ORGANIZATION_f1": 0.9441340782122906, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9388888888888889, |
|
"eval_ORGANIZATION_recall": 0.949438202247191, |
|
"eval_PERSON_f1": 0.9494163424124514, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9457364341085271, |
|
"eval_PERSON_recall": 0.953125, |
|
"eval_loss": 0.07118100672960281, |
|
"eval_overall_accuracy": 0.9873144399460189, |
|
"eval_overall_f1": 0.9343434343434343, |
|
"eval_overall_precision": 0.925, |
|
"eval_overall_recall": 0.9438775510204082, |
|
"eval_runtime": 0.2777, |
|
"eval_samples_per_second": 612.13, |
|
"eval_steps_per_second": 10.802, |
|
"step": 960 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"grad_norm": 0.9713481664657593, |
|
"learning_rate": 4.4500000000000004e-05, |
|
"loss": 0.005, |
|
"step": 1056 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_LOCATION_f1": 0.8972972972972972, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8383838383838383, |
|
"eval_LOCATION_recall": 0.9651162790697675, |
|
"eval_ORGANIZATION_f1": 0.9438202247191011, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9438202247191011, |
|
"eval_ORGANIZATION_recall": 0.9438202247191011, |
|
"eval_PERSON_f1": 0.968503937007874, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9761904761904762, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.08548479527235031, |
|
"eval_overall_accuracy": 0.9870445344129555, |
|
"eval_overall_f1": 0.9408805031446542, |
|
"eval_overall_precision": 0.9280397022332506, |
|
"eval_overall_recall": 0.9540816326530612, |
|
"eval_runtime": 0.2746, |
|
"eval_samples_per_second": 619.083, |
|
"eval_steps_per_second": 10.925, |
|
"step": 1056 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"grad_norm": 0.007533730939030647, |
|
"learning_rate": 4.4000000000000006e-05, |
|
"loss": 0.0036, |
|
"step": 1152 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_LOCATION_f1": 0.9050279329608939, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8709677419354839, |
|
"eval_LOCATION_recall": 0.9418604651162791, |
|
"eval_ORGANIZATION_f1": 0.9408450704225352, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.943502824858757, |
|
"eval_ORGANIZATION_recall": 0.9382022471910112, |
|
"eval_PERSON_f1": 0.9723320158102766, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.984, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.08587783575057983, |
|
"eval_overall_accuracy": 0.9873144399460189, |
|
"eval_overall_f1": 0.9428208386277002, |
|
"eval_overall_precision": 0.9392405063291139, |
|
"eval_overall_recall": 0.9464285714285714, |
|
"eval_runtime": 0.2742, |
|
"eval_samples_per_second": 619.889, |
|
"eval_steps_per_second": 10.939, |
|
"step": 1152 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"grad_norm": 0.012886933982372284, |
|
"learning_rate": 4.35e-05, |
|
"loss": 0.0042, |
|
"step": 1248 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_LOCATION_f1": 0.9152542372881357, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8901098901098901, |
|
"eval_LOCATION_recall": 0.9418604651162791, |
|
"eval_ORGANIZATION_f1": 0.9526462395543176, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9447513812154696, |
|
"eval_ORGANIZATION_recall": 0.9606741573033708, |
|
"eval_PERSON_f1": 0.9723320158102766, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.984, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.07611611485481262, |
|
"eval_overall_accuracy": 0.9889338731443995, |
|
"eval_overall_f1": 0.9505703422053231, |
|
"eval_overall_precision": 0.9445843828715366, |
|
"eval_overall_recall": 0.9566326530612245, |
|
"eval_runtime": 0.2752, |
|
"eval_samples_per_second": 617.726, |
|
"eval_steps_per_second": 10.901, |
|
"step": 1248 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"grad_norm": 0.020214928314089775, |
|
"learning_rate": 4.3e-05, |
|
"loss": 0.0036, |
|
"step": 1344 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_LOCATION_f1": 0.9028571428571427, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8876404494382022, |
|
"eval_LOCATION_recall": 0.9186046511627907, |
|
"eval_ORGANIZATION_f1": 0.9401709401709402, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.953757225433526, |
|
"eval_ORGANIZATION_recall": 0.9269662921348315, |
|
"eval_PERSON_f1": 0.9763779527559054, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9841269841269841, |
|
"eval_PERSON_recall": 0.96875, |
|
"eval_loss": 0.08433674275875092, |
|
"eval_overall_accuracy": 0.9862348178137652, |
|
"eval_overall_f1": 0.9435897435897437, |
|
"eval_overall_precision": 0.9484536082474226, |
|
"eval_overall_recall": 0.9387755102040817, |
|
"eval_runtime": 0.2767, |
|
"eval_samples_per_second": 614.444, |
|
"eval_steps_per_second": 10.843, |
|
"step": 1344 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"grad_norm": 0.005007833708077669, |
|
"learning_rate": 4.25e-05, |
|
"loss": 0.0028, |
|
"step": 1440 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_LOCATION_f1": 0.9111111111111112, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8723404255319149, |
|
"eval_LOCATION_recall": 0.9534883720930233, |
|
"eval_ORGANIZATION_f1": 0.934844192634561, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9428571428571428, |
|
"eval_ORGANIZATION_recall": 0.9269662921348315, |
|
"eval_PERSON_f1": 0.9723320158102766, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.984, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.09056564420461655, |
|
"eval_overall_accuracy": 0.9867746288798921, |
|
"eval_overall_f1": 0.94147582697201, |
|
"eval_overall_precision": 0.9390862944162437, |
|
"eval_overall_recall": 0.9438775510204082, |
|
"eval_runtime": 0.2739, |
|
"eval_samples_per_second": 620.731, |
|
"eval_steps_per_second": 10.954, |
|
"step": 1440 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"grad_norm": 0.002987402491271496, |
|
"learning_rate": 4.2e-05, |
|
"loss": 0.0017, |
|
"step": 1536 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_LOCATION_f1": 0.8950276243093923, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8526315789473684, |
|
"eval_LOCATION_recall": 0.9418604651162791, |
|
"eval_ORGANIZATION_f1": 0.9394812680115273, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9644970414201184, |
|
"eval_ORGANIZATION_recall": 0.9157303370786517, |
|
"eval_PERSON_f1": 0.9606299212598425, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9682539682539683, |
|
"eval_PERSON_recall": 0.953125, |
|
"eval_loss": 0.09138376265764236, |
|
"eval_overall_accuracy": 0.9862348178137652, |
|
"eval_overall_f1": 0.9360613810741688, |
|
"eval_overall_precision": 0.9384615384615385, |
|
"eval_overall_recall": 0.9336734693877551, |
|
"eval_runtime": 0.2746, |
|
"eval_samples_per_second": 619.018, |
|
"eval_steps_per_second": 10.924, |
|
"step": 1536 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"grad_norm": 0.003726888680830598, |
|
"learning_rate": 4.15e-05, |
|
"loss": 0.002, |
|
"step": 1632 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_LOCATION_f1": 0.8876404494382023, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8586956521739131, |
|
"eval_LOCATION_recall": 0.9186046511627907, |
|
"eval_ORGANIZATION_f1": 0.9491525423728814, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9545454545454546, |
|
"eval_ORGANIZATION_recall": 0.9438202247191011, |
|
"eval_PERSON_f1": 0.968503937007874, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9761904761904762, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.08281037956476212, |
|
"eval_overall_accuracy": 0.9883940620782726, |
|
"eval_overall_f1": 0.94147582697201, |
|
"eval_overall_precision": 0.9390862944162437, |
|
"eval_overall_recall": 0.9438775510204082, |
|
"eval_runtime": 0.2742, |
|
"eval_samples_per_second": 619.907, |
|
"eval_steps_per_second": 10.94, |
|
"step": 1632 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"grad_norm": 0.003566289786249399, |
|
"learning_rate": 4.1e-05, |
|
"loss": 0.0033, |
|
"step": 1728 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_LOCATION_f1": 0.9120879120879122, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8645833333333334, |
|
"eval_LOCATION_recall": 0.9651162790697675, |
|
"eval_ORGANIZATION_f1": 0.925207756232687, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.912568306010929, |
|
"eval_ORGANIZATION_recall": 0.9382022471910112, |
|
"eval_PERSON_f1": 0.9763779527559054, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9841269841269841, |
|
"eval_PERSON_recall": 0.96875, |
|
"eval_loss": 0.0640731155872345, |
|
"eval_overall_accuracy": 0.988663967611336, |
|
"eval_overall_f1": 0.9385194479297364, |
|
"eval_overall_precision": 0.9234567901234568, |
|
"eval_overall_recall": 0.9540816326530612, |
|
"eval_runtime": 0.2758, |
|
"eval_samples_per_second": 616.283, |
|
"eval_steps_per_second": 10.876, |
|
"step": 1728 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"grad_norm": 0.016631081700325012, |
|
"learning_rate": 4.05e-05, |
|
"loss": 0.0024, |
|
"step": 1824 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_LOCATION_f1": 0.8863636363636364, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8666666666666667, |
|
"eval_LOCATION_recall": 0.9069767441860465, |
|
"eval_ORGANIZATION_f1": 0.9476584022038568, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9297297297297298, |
|
"eval_ORGANIZATION_recall": 0.9662921348314607, |
|
"eval_PERSON_f1": 0.9606299212598425, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9682539682539683, |
|
"eval_PERSON_recall": 0.953125, |
|
"eval_loss": 0.09817531704902649, |
|
"eval_overall_accuracy": 0.9867746288798921, |
|
"eval_overall_f1": 0.9382093316519546, |
|
"eval_overall_precision": 0.9276807980049875, |
|
"eval_overall_recall": 0.9489795918367347, |
|
"eval_runtime": 0.2771, |
|
"eval_samples_per_second": 613.515, |
|
"eval_steps_per_second": 10.827, |
|
"step": 1824 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"grad_norm": 0.35814717411994934, |
|
"learning_rate": 4e-05, |
|
"loss": 0.0037, |
|
"step": 1920 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_LOCATION_f1": 0.8864864864864866, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8282828282828283, |
|
"eval_LOCATION_recall": 0.9534883720930233, |
|
"eval_ORGANIZATION_f1": 0.96045197740113, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9659090909090909, |
|
"eval_ORGANIZATION_recall": 0.9550561797752809, |
|
"eval_PERSON_f1": 0.9723320158102766, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.984, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.0904369205236435, |
|
"eval_overall_accuracy": 0.988663967611336, |
|
"eval_overall_f1": 0.9469696969696969, |
|
"eval_overall_precision": 0.9375, |
|
"eval_overall_recall": 0.9566326530612245, |
|
"eval_runtime": 0.2871, |
|
"eval_samples_per_second": 592.205, |
|
"eval_steps_per_second": 10.451, |
|
"step": 1920 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"grad_norm": 0.010785204358398914, |
|
"learning_rate": 3.9500000000000005e-05, |
|
"loss": 0.0038, |
|
"step": 2016 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"eval_LOCATION_f1": 0.9273743016759777, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8924731182795699, |
|
"eval_LOCATION_recall": 0.9651162790697675, |
|
"eval_ORGANIZATION_f1": 0.9411764705882353, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9385474860335196, |
|
"eval_ORGANIZATION_recall": 0.9438202247191011, |
|
"eval_PERSON_f1": 0.9609375, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9609375, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.0786675289273262, |
|
"eval_overall_accuracy": 0.9878542510121457, |
|
"eval_overall_f1": 0.9444444444444445, |
|
"eval_overall_precision": 0.935, |
|
"eval_overall_recall": 0.9540816326530612, |
|
"eval_runtime": 0.2796, |
|
"eval_samples_per_second": 607.994, |
|
"eval_steps_per_second": 10.729, |
|
"step": 2016 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"grad_norm": 0.02177988551557064, |
|
"learning_rate": 3.9000000000000006e-05, |
|
"loss": 0.0024, |
|
"step": 2112 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"eval_LOCATION_f1": 0.8950276243093923, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8526315789473684, |
|
"eval_LOCATION_recall": 0.9418604651162791, |
|
"eval_ORGANIZATION_f1": 0.9388888888888889, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9285714285714286, |
|
"eval_ORGANIZATION_recall": 0.949438202247191, |
|
"eval_PERSON_f1": 0.9523809523809523, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.967741935483871, |
|
"eval_PERSON_recall": 0.9375, |
|
"eval_loss": 0.06972306966781616, |
|
"eval_overall_accuracy": 0.9889338731443995, |
|
"eval_overall_f1": 0.9331651954602775, |
|
"eval_overall_precision": 0.9226932668329177, |
|
"eval_overall_recall": 0.9438775510204082, |
|
"eval_runtime": 0.2769, |
|
"eval_samples_per_second": 613.91, |
|
"eval_steps_per_second": 10.834, |
|
"step": 2112 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"grad_norm": 0.1288156807422638, |
|
"learning_rate": 3.85e-05, |
|
"loss": 0.0041, |
|
"step": 2208 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"eval_LOCATION_f1": 0.9265536723163842, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9010989010989011, |
|
"eval_LOCATION_recall": 0.9534883720930233, |
|
"eval_ORGANIZATION_f1": 0.9467787114845938, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9441340782122905, |
|
"eval_ORGANIZATION_recall": 0.949438202247191, |
|
"eval_PERSON_f1": 0.9647058823529412, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.968503937007874, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.0794149860739708, |
|
"eval_overall_accuracy": 0.9875843454790824, |
|
"eval_overall_f1": 0.9480354879594423, |
|
"eval_overall_precision": 0.9420654911838791, |
|
"eval_overall_recall": 0.9540816326530612, |
|
"eval_runtime": 0.2829, |
|
"eval_samples_per_second": 600.817, |
|
"eval_steps_per_second": 10.603, |
|
"step": 2208 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"grad_norm": 0.0011946976883336902, |
|
"learning_rate": 3.8e-05, |
|
"loss": 0.0033, |
|
"step": 2304 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_LOCATION_f1": 0.9204545454545455, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9, |
|
"eval_LOCATION_recall": 0.9418604651162791, |
|
"eval_ORGANIZATION_f1": 0.9333333333333335, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9230769230769231, |
|
"eval_ORGANIZATION_recall": 0.9438202247191011, |
|
"eval_PERSON_f1": 0.9603174603174603, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9758064516129032, |
|
"eval_PERSON_recall": 0.9453125, |
|
"eval_loss": 0.08298368752002716, |
|
"eval_overall_accuracy": 0.9881241565452091, |
|
"eval_overall_f1": 0.9390862944162437, |
|
"eval_overall_precision": 0.9343434343434344, |
|
"eval_overall_recall": 0.9438775510204082, |
|
"eval_runtime": 0.2768, |
|
"eval_samples_per_second": 614.247, |
|
"eval_steps_per_second": 10.84, |
|
"step": 2304 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"grad_norm": 0.008975312113761902, |
|
"learning_rate": 3.7500000000000003e-05, |
|
"loss": 0.0034, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_LOCATION_f1": 0.9060773480662985, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8631578947368421, |
|
"eval_LOCATION_recall": 0.9534883720930233, |
|
"eval_ORGANIZATION_f1": 0.9526462395543176, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9447513812154696, |
|
"eval_ORGANIZATION_recall": 0.9606741573033708, |
|
"eval_PERSON_f1": 0.9763779527559054, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9841269841269841, |
|
"eval_PERSON_recall": 0.96875, |
|
"eval_loss": 0.08038989454507828, |
|
"eval_overall_accuracy": 0.9881241565452091, |
|
"eval_overall_f1": 0.9496221662468515, |
|
"eval_overall_precision": 0.9378109452736318, |
|
"eval_overall_recall": 0.9617346938775511, |
|
"eval_runtime": 0.2782, |
|
"eval_samples_per_second": 611.154, |
|
"eval_steps_per_second": 10.785, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"grad_norm": 0.003603309392929077, |
|
"learning_rate": 3.7e-05, |
|
"loss": 0.0012, |
|
"step": 2496 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"eval_LOCATION_f1": 0.9265536723163842, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9010989010989011, |
|
"eval_LOCATION_recall": 0.9534883720930233, |
|
"eval_ORGANIZATION_f1": 0.9444444444444444, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9340659340659341, |
|
"eval_ORGANIZATION_recall": 0.9550561797752809, |
|
"eval_PERSON_f1": 0.9763779527559054, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9841269841269841, |
|
"eval_PERSON_recall": 0.96875, |
|
"eval_loss": 0.07283078134059906, |
|
"eval_overall_accuracy": 0.9902834008097166, |
|
"eval_overall_f1": 0.9506953223767383, |
|
"eval_overall_precision": 0.9423558897243107, |
|
"eval_overall_recall": 0.9591836734693877, |
|
"eval_runtime": 0.2753, |
|
"eval_samples_per_second": 617.432, |
|
"eval_steps_per_second": 10.896, |
|
"step": 2496 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"grad_norm": 0.0058512561954557896, |
|
"learning_rate": 3.65e-05, |
|
"loss": 0.0015, |
|
"step": 2592 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"eval_LOCATION_f1": 0.9257142857142857, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9101123595505618, |
|
"eval_LOCATION_recall": 0.9418604651162791, |
|
"eval_ORGANIZATION_f1": 0.9505494505494506, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9301075268817204, |
|
"eval_ORGANIZATION_recall": 0.9719101123595506, |
|
"eval_PERSON_f1": 0.968503937007874, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9761904761904762, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.09567292034626007, |
|
"eval_overall_accuracy": 0.9881241565452091, |
|
"eval_overall_f1": 0.9508196721311475, |
|
"eval_overall_precision": 0.940149625935162, |
|
"eval_overall_recall": 0.9617346938775511, |
|
"eval_runtime": 0.2824, |
|
"eval_samples_per_second": 601.88, |
|
"eval_steps_per_second": 10.621, |
|
"step": 2592 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"grad_norm": 1.171476125717163, |
|
"learning_rate": 3.6e-05, |
|
"loss": 0.0029, |
|
"step": 2688 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"eval_LOCATION_f1": 0.9222222222222223, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8829787234042553, |
|
"eval_LOCATION_recall": 0.9651162790697675, |
|
"eval_ORGANIZATION_f1": 0.9491525423728814, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9545454545454546, |
|
"eval_ORGANIZATION_recall": 0.9438202247191011, |
|
"eval_PERSON_f1": 0.9763779527559054, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9841269841269841, |
|
"eval_PERSON_recall": 0.96875, |
|
"eval_loss": 0.07663165777921677, |
|
"eval_overall_accuracy": 0.9881241565452091, |
|
"eval_overall_f1": 0.9517766497461929, |
|
"eval_overall_precision": 0.946969696969697, |
|
"eval_overall_recall": 0.9566326530612245, |
|
"eval_runtime": 0.2755, |
|
"eval_samples_per_second": 617.074, |
|
"eval_steps_per_second": 10.89, |
|
"step": 2688 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"grad_norm": 0.40970727801322937, |
|
"learning_rate": 3.55e-05, |
|
"loss": 0.0031, |
|
"step": 2784 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"eval_LOCATION_f1": 0.9130434782608695, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8571428571428571, |
|
"eval_LOCATION_recall": 0.9767441860465116, |
|
"eval_ORGANIZATION_f1": 0.9455587392550143, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9649122807017544, |
|
"eval_ORGANIZATION_recall": 0.9269662921348315, |
|
"eval_PERSON_f1": 0.9725490196078432, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9763779527559056, |
|
"eval_PERSON_recall": 0.96875, |
|
"eval_loss": 0.08022492378950119, |
|
"eval_overall_accuracy": 0.9878542510121457, |
|
"eval_overall_f1": 0.9467005076142132, |
|
"eval_overall_precision": 0.9419191919191919, |
|
"eval_overall_recall": 0.951530612244898, |
|
"eval_runtime": 0.2752, |
|
"eval_samples_per_second": 617.806, |
|
"eval_steps_per_second": 10.902, |
|
"step": 2784 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"grad_norm": 0.08574865758419037, |
|
"learning_rate": 3.5e-05, |
|
"loss": 0.0018, |
|
"step": 2880 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"eval_LOCATION_f1": 0.9050279329608939, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8709677419354839, |
|
"eval_LOCATION_recall": 0.9418604651162791, |
|
"eval_ORGANIZATION_f1": 0.9577464788732394, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.96045197740113, |
|
"eval_ORGANIZATION_recall": 0.9550561797752809, |
|
"eval_PERSON_f1": 0.9763779527559054, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9841269841269841, |
|
"eval_PERSON_recall": 0.96875, |
|
"eval_loss": 0.08365346491336823, |
|
"eval_overall_accuracy": 0.9892037786774629, |
|
"eval_overall_f1": 0.9517766497461929, |
|
"eval_overall_precision": 0.946969696969697, |
|
"eval_overall_recall": 0.9566326530612245, |
|
"eval_runtime": 0.2756, |
|
"eval_samples_per_second": 616.825, |
|
"eval_steps_per_second": 10.885, |
|
"step": 2880 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"grad_norm": 0.002840681467205286, |
|
"learning_rate": 3.45e-05, |
|
"loss": 0.0017, |
|
"step": 2976 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"eval_LOCATION_f1": 0.9431818181818181, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9222222222222223, |
|
"eval_LOCATION_recall": 0.9651162790697675, |
|
"eval_ORGANIZATION_f1": 0.961111111111111, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9505494505494505, |
|
"eval_ORGANIZATION_recall": 0.9719101123595506, |
|
"eval_PERSON_f1": 0.9606299212598425, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9682539682539683, |
|
"eval_PERSON_recall": 0.953125, |
|
"eval_loss": 0.07920122146606445, |
|
"eval_overall_accuracy": 0.9902834008097166, |
|
"eval_overall_f1": 0.9569620253164557, |
|
"eval_overall_precision": 0.949748743718593, |
|
"eval_overall_recall": 0.9642857142857143, |
|
"eval_runtime": 0.2801, |
|
"eval_samples_per_second": 606.828, |
|
"eval_steps_per_second": 10.709, |
|
"step": 2976 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"grad_norm": 0.001423178124241531, |
|
"learning_rate": 3.4000000000000007e-05, |
|
"loss": 0.0017, |
|
"step": 3072 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"eval_LOCATION_f1": 0.9171270718232045, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8736842105263158, |
|
"eval_LOCATION_recall": 0.9651162790697675, |
|
"eval_ORGANIZATION_f1": 0.9633802816901408, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9661016949152542, |
|
"eval_ORGANIZATION_recall": 0.9606741573033708, |
|
"eval_PERSON_f1": 0.9644268774703557, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.976, |
|
"eval_PERSON_recall": 0.953125, |
|
"eval_loss": 0.06753446161746979, |
|
"eval_overall_accuracy": 0.99055330634278, |
|
"eval_overall_f1": 0.9531051964512041, |
|
"eval_overall_precision": 0.947103274559194, |
|
"eval_overall_recall": 0.9591836734693877, |
|
"eval_runtime": 0.2741, |
|
"eval_samples_per_second": 620.297, |
|
"eval_steps_per_second": 10.946, |
|
"step": 3072 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"grad_norm": 0.001040176604874432, |
|
"learning_rate": 3.35e-05, |
|
"loss": 0.0012, |
|
"step": 3168 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"eval_LOCATION_f1": 0.9273743016759777, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8924731182795699, |
|
"eval_LOCATION_recall": 0.9651162790697675, |
|
"eval_ORGANIZATION_f1": 0.9542857142857143, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9709302325581395, |
|
"eval_ORGANIZATION_recall": 0.9382022471910112, |
|
"eval_PERSON_f1": 0.9723320158102766, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.984, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.09092291444540024, |
|
"eval_overall_accuracy": 0.9897435897435898, |
|
"eval_overall_f1": 0.9539641943734015, |
|
"eval_overall_precision": 0.9564102564102565, |
|
"eval_overall_recall": 0.951530612244898, |
|
"eval_runtime": 0.2779, |
|
"eval_samples_per_second": 611.82, |
|
"eval_steps_per_second": 10.797, |
|
"step": 3168 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"grad_norm": 0.21219216287136078, |
|
"learning_rate": 3.3e-05, |
|
"loss": 0.002, |
|
"step": 3264 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"eval_LOCATION_f1": 0.9257142857142857, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9101123595505618, |
|
"eval_LOCATION_recall": 0.9418604651162791, |
|
"eval_ORGANIZATION_f1": 0.9287749287749287, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9421965317919075, |
|
"eval_ORGANIZATION_recall": 0.9157303370786517, |
|
"eval_PERSON_f1": 0.9565217391304348, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.968, |
|
"eval_PERSON_recall": 0.9453125, |
|
"eval_loss": 0.10773035138845444, |
|
"eval_overall_accuracy": 0.9846153846153847, |
|
"eval_overall_f1": 0.9370988446726572, |
|
"eval_overall_precision": 0.9431524547803618, |
|
"eval_overall_recall": 0.9311224489795918, |
|
"eval_runtime": 0.2753, |
|
"eval_samples_per_second": 617.461, |
|
"eval_steps_per_second": 10.896, |
|
"step": 3264 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"grad_norm": 0.002467579208314419, |
|
"learning_rate": 3.2500000000000004e-05, |
|
"loss": 0.0023, |
|
"step": 3360 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"eval_LOCATION_f1": 0.9213483146067417, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8913043478260869, |
|
"eval_LOCATION_recall": 0.9534883720930233, |
|
"eval_ORGANIZATION_f1": 0.95, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9395604395604396, |
|
"eval_ORGANIZATION_recall": 0.9606741573033708, |
|
"eval_PERSON_f1": 0.968503937007874, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9761904761904762, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.091239333152771, |
|
"eval_overall_accuracy": 0.9881241565452091, |
|
"eval_overall_f1": 0.9494949494949495, |
|
"eval_overall_precision": 0.94, |
|
"eval_overall_recall": 0.9591836734693877, |
|
"eval_runtime": 0.2753, |
|
"eval_samples_per_second": 617.528, |
|
"eval_steps_per_second": 10.898, |
|
"step": 3360 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"grad_norm": 0.01504553947597742, |
|
"learning_rate": 3.2000000000000005e-05, |
|
"loss": 0.0016, |
|
"step": 3456 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"eval_LOCATION_f1": 0.9273743016759777, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8924731182795699, |
|
"eval_LOCATION_recall": 0.9651162790697675, |
|
"eval_ORGANIZATION_f1": 0.9545454545454545, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9655172413793104, |
|
"eval_ORGANIZATION_recall": 0.9438202247191011, |
|
"eval_PERSON_f1": 0.9723320158102766, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.984, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.08393337577581406, |
|
"eval_overall_accuracy": 0.9892037786774629, |
|
"eval_overall_f1": 0.9540816326530612, |
|
"eval_overall_precision": 0.9540816326530612, |
|
"eval_overall_recall": 0.9540816326530612, |
|
"eval_runtime": 0.275, |
|
"eval_samples_per_second": 618.195, |
|
"eval_steps_per_second": 10.909, |
|
"step": 3456 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"grad_norm": 0.003291564527899027, |
|
"learning_rate": 3.15e-05, |
|
"loss": 0.0012, |
|
"step": 3552 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"eval_LOCATION_f1": 0.9162011173184358, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8817204301075269, |
|
"eval_LOCATION_recall": 0.9534883720930233, |
|
"eval_ORGANIZATION_f1": 0.9344729344729344, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9479768786127167, |
|
"eval_ORGANIZATION_recall": 0.9213483146067416, |
|
"eval_PERSON_f1": 0.9644268774703557, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.976, |
|
"eval_PERSON_recall": 0.953125, |
|
"eval_loss": 0.10695616900920868, |
|
"eval_overall_accuracy": 0.9856950067476383, |
|
"eval_overall_f1": 0.9399744572158366, |
|
"eval_overall_precision": 0.9411764705882353, |
|
"eval_overall_recall": 0.9387755102040817, |
|
"eval_runtime": 0.2752, |
|
"eval_samples_per_second": 617.842, |
|
"eval_steps_per_second": 10.903, |
|
"step": 3552 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"grad_norm": 0.0029779509641230106, |
|
"learning_rate": 3.1e-05, |
|
"loss": 0.0009, |
|
"step": 3648 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"eval_LOCATION_f1": 0.9392265193370165, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8947368421052632, |
|
"eval_LOCATION_recall": 0.9883720930232558, |
|
"eval_ORGANIZATION_f1": 0.9431818181818182, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9540229885057471, |
|
"eval_ORGANIZATION_recall": 0.9325842696629213, |
|
"eval_PERSON_f1": 0.9723320158102766, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.984, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.08564214408397675, |
|
"eval_overall_accuracy": 0.9883940620782726, |
|
"eval_overall_f1": 0.9516539440203563, |
|
"eval_overall_precision": 0.949238578680203, |
|
"eval_overall_recall": 0.9540816326530612, |
|
"eval_runtime": 0.2745, |
|
"eval_samples_per_second": 619.218, |
|
"eval_steps_per_second": 10.927, |
|
"step": 3648 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"grad_norm": 0.0008915510843507946, |
|
"learning_rate": 3.05e-05, |
|
"loss": 0.0006, |
|
"step": 3744 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"eval_LOCATION_f1": 0.9333333333333332, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8936170212765957, |
|
"eval_LOCATION_recall": 0.9767441860465116, |
|
"eval_ORGANIZATION_f1": 0.9375000000000001, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9482758620689655, |
|
"eval_ORGANIZATION_recall": 0.9269662921348315, |
|
"eval_PERSON_f1": 0.9647058823529412, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.968503937007874, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.09636305272579193, |
|
"eval_overall_accuracy": 0.9862348178137652, |
|
"eval_overall_f1": 0.9453621346886911, |
|
"eval_overall_precision": 0.9417721518987342, |
|
"eval_overall_recall": 0.9489795918367347, |
|
"eval_runtime": 0.2929, |
|
"eval_samples_per_second": 580.423, |
|
"eval_steps_per_second": 10.243, |
|
"step": 3744 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"grad_norm": 0.0008046123548410833, |
|
"learning_rate": 3e-05, |
|
"loss": 0.0011, |
|
"step": 3840 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"eval_LOCATION_f1": 0.9265536723163842, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9010989010989011, |
|
"eval_LOCATION_recall": 0.9534883720930233, |
|
"eval_ORGANIZATION_f1": 0.9464788732394366, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9491525423728814, |
|
"eval_ORGANIZATION_recall": 0.9438202247191011, |
|
"eval_PERSON_f1": 0.968503937007874, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9761904761904762, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.09920275211334229, |
|
"eval_overall_accuracy": 0.9870445344129555, |
|
"eval_overall_f1": 0.9491094147582698, |
|
"eval_overall_precision": 0.9467005076142132, |
|
"eval_overall_recall": 0.951530612244898, |
|
"eval_runtime": 0.2781, |
|
"eval_samples_per_second": 611.234, |
|
"eval_steps_per_second": 10.786, |
|
"step": 3840 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"grad_norm": 0.000929164991248399, |
|
"learning_rate": 2.95e-05, |
|
"loss": 0.0009, |
|
"step": 3936 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"eval_LOCATION_f1": 0.9385474860335195, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9032258064516129, |
|
"eval_LOCATION_recall": 0.9767441860465116, |
|
"eval_ORGANIZATION_f1": 0.9435028248587571, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9488636363636364, |
|
"eval_ORGANIZATION_recall": 0.9382022471910112, |
|
"eval_PERSON_f1": 0.9644268774703557, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.976, |
|
"eval_PERSON_recall": 0.953125, |
|
"eval_loss": 0.1071603074669838, |
|
"eval_overall_accuracy": 0.9859649122807017, |
|
"eval_overall_f1": 0.9491094147582698, |
|
"eval_overall_precision": 0.9467005076142132, |
|
"eval_overall_recall": 0.951530612244898, |
|
"eval_runtime": 0.2831, |
|
"eval_samples_per_second": 600.488, |
|
"eval_steps_per_second": 10.597, |
|
"step": 3936 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"grad_norm": 0.00026114823413081467, |
|
"learning_rate": 2.9e-05, |
|
"loss": 0.0007, |
|
"step": 4032 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"eval_LOCATION_f1": 0.9333333333333332, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8936170212765957, |
|
"eval_LOCATION_recall": 0.9767441860465116, |
|
"eval_ORGANIZATION_f1": 0.9458689458689458, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9595375722543352, |
|
"eval_ORGANIZATION_recall": 0.9325842696629213, |
|
"eval_PERSON_f1": 0.9682539682539683, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9838709677419355, |
|
"eval_PERSON_recall": 0.953125, |
|
"eval_loss": 0.1193474680185318, |
|
"eval_overall_accuracy": 0.9865047233468286, |
|
"eval_overall_f1": 0.9501915708812262, |
|
"eval_overall_precision": 0.9514066496163683, |
|
"eval_overall_recall": 0.9489795918367347, |
|
"eval_runtime": 0.2756, |
|
"eval_samples_per_second": 616.891, |
|
"eval_steps_per_second": 10.886, |
|
"step": 4032 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"grad_norm": 0.0013629100285470486, |
|
"learning_rate": 2.8499999999999998e-05, |
|
"loss": 0.0014, |
|
"step": 4128 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"eval_LOCATION_f1": 0.9385474860335195, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9032258064516129, |
|
"eval_LOCATION_recall": 0.9767441860465116, |
|
"eval_ORGANIZATION_f1": 0.9435028248587571, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9488636363636364, |
|
"eval_ORGANIZATION_recall": 0.9382022471910112, |
|
"eval_PERSON_f1": 0.9606299212598425, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9682539682539683, |
|
"eval_PERSON_recall": 0.953125, |
|
"eval_loss": 0.11290433257818222, |
|
"eval_overall_accuracy": 0.9867746288798921, |
|
"eval_overall_f1": 0.9479034307496824, |
|
"eval_overall_precision": 0.9443037974683545, |
|
"eval_overall_recall": 0.951530612244898, |
|
"eval_runtime": 0.2779, |
|
"eval_samples_per_second": 611.663, |
|
"eval_steps_per_second": 10.794, |
|
"step": 4128 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"grad_norm": 0.0006920368759892881, |
|
"learning_rate": 2.8000000000000003e-05, |
|
"loss": 0.0007, |
|
"step": 4224 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"eval_LOCATION_f1": 0.9438202247191011, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9130434782608695, |
|
"eval_LOCATION_recall": 0.9767441860465116, |
|
"eval_ORGANIZATION_f1": 0.9464788732394366, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9491525423728814, |
|
"eval_ORGANIZATION_recall": 0.9438202247191011, |
|
"eval_PERSON_f1": 0.9609375, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9609375, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.12893009185791016, |
|
"eval_overall_accuracy": 0.9848852901484481, |
|
"eval_overall_f1": 0.9505703422053231, |
|
"eval_overall_precision": 0.9445843828715366, |
|
"eval_overall_recall": 0.9566326530612245, |
|
"eval_runtime": 0.2752, |
|
"eval_samples_per_second": 617.77, |
|
"eval_steps_per_second": 10.902, |
|
"step": 4224 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"grad_norm": 0.0005794434691779315, |
|
"learning_rate": 2.7500000000000004e-05, |
|
"loss": 0.0006, |
|
"step": 4320 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"eval_LOCATION_f1": 0.9281767955801105, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8842105263157894, |
|
"eval_LOCATION_recall": 0.9767441860465116, |
|
"eval_ORGANIZATION_f1": 0.9470752089136492, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9392265193370166, |
|
"eval_ORGANIZATION_recall": 0.9550561797752809, |
|
"eval_PERSON_f1": 0.96875, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.96875, |
|
"eval_PERSON_recall": 0.96875, |
|
"eval_loss": 0.11674495786428452, |
|
"eval_overall_accuracy": 0.9867746288798921, |
|
"eval_overall_f1": 0.949748743718593, |
|
"eval_overall_precision": 0.9356435643564357, |
|
"eval_overall_recall": 0.9642857142857143, |
|
"eval_runtime": 0.2809, |
|
"eval_samples_per_second": 605.289, |
|
"eval_steps_per_second": 10.682, |
|
"step": 4320 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"grad_norm": 0.004815615713596344, |
|
"learning_rate": 2.7000000000000002e-05, |
|
"loss": 0.0014, |
|
"step": 4416 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"eval_LOCATION_f1": 0.9120879120879122, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8645833333333334, |
|
"eval_LOCATION_recall": 0.9651162790697675, |
|
"eval_ORGANIZATION_f1": 0.9461756373937678, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9542857142857143, |
|
"eval_ORGANIZATION_recall": 0.9382022471910112, |
|
"eval_PERSON_f1": 0.9682539682539683, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9838709677419355, |
|
"eval_PERSON_recall": 0.953125, |
|
"eval_loss": 0.11675991863012314, |
|
"eval_overall_accuracy": 0.9873144399460189, |
|
"eval_overall_f1": 0.9453621346886911, |
|
"eval_overall_precision": 0.9417721518987342, |
|
"eval_overall_recall": 0.9489795918367347, |
|
"eval_runtime": 0.2778, |
|
"eval_samples_per_second": 612.001, |
|
"eval_steps_per_second": 10.8, |
|
"step": 4416 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"grad_norm": 0.0005003380356356502, |
|
"learning_rate": 2.6500000000000004e-05, |
|
"loss": 0.0022, |
|
"step": 4512 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"eval_LOCATION_f1": 0.9171270718232045, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8736842105263158, |
|
"eval_LOCATION_recall": 0.9651162790697675, |
|
"eval_ORGANIZATION_f1": 0.9421965317919075, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9702380952380952, |
|
"eval_ORGANIZATION_recall": 0.9157303370786517, |
|
"eval_PERSON_f1": 0.9763779527559054, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9841269841269841, |
|
"eval_PERSON_recall": 0.96875, |
|
"eval_loss": 0.10903999209403992, |
|
"eval_overall_accuracy": 0.9867746288798921, |
|
"eval_overall_f1": 0.9475032010243277, |
|
"eval_overall_precision": 0.9511568123393316, |
|
"eval_overall_recall": 0.9438775510204082, |
|
"eval_runtime": 0.2786, |
|
"eval_samples_per_second": 610.178, |
|
"eval_steps_per_second": 10.768, |
|
"step": 4512 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"grad_norm": 34.43635559082031, |
|
"learning_rate": 2.6000000000000002e-05, |
|
"loss": 0.0033, |
|
"step": 4608 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"eval_LOCATION_f1": 0.9431818181818181, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9222222222222223, |
|
"eval_LOCATION_recall": 0.9651162790697675, |
|
"eval_ORGANIZATION_f1": 0.9385474860335196, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9333333333333333, |
|
"eval_ORGANIZATION_recall": 0.9438202247191011, |
|
"eval_PERSON_f1": 0.9603174603174603, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9758064516129032, |
|
"eval_PERSON_recall": 0.9453125, |
|
"eval_loss": 0.08986053615808487, |
|
"eval_overall_accuracy": 0.9889338731443995, |
|
"eval_overall_f1": 0.9465648854961832, |
|
"eval_overall_precision": 0.9441624365482234, |
|
"eval_overall_recall": 0.9489795918367347, |
|
"eval_runtime": 0.2751, |
|
"eval_samples_per_second": 617.952, |
|
"eval_steps_per_second": 10.905, |
|
"step": 4608 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"grad_norm": 0.011161034926772118, |
|
"learning_rate": 2.5500000000000003e-05, |
|
"loss": 0.001, |
|
"step": 4704 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"eval_LOCATION_f1": 0.9222222222222223, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8829787234042553, |
|
"eval_LOCATION_recall": 0.9651162790697675, |
|
"eval_ORGANIZATION_f1": 0.9452449567723343, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9704142011834319, |
|
"eval_ORGANIZATION_recall": 0.9213483146067416, |
|
"eval_PERSON_f1": 0.9682539682539683, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9838709677419355, |
|
"eval_PERSON_recall": 0.953125, |
|
"eval_loss": 0.11230127513408661, |
|
"eval_overall_accuracy": 0.9870445344129555, |
|
"eval_overall_f1": 0.9473684210526317, |
|
"eval_overall_precision": 0.9534883720930233, |
|
"eval_overall_recall": 0.9413265306122449, |
|
"eval_runtime": 0.2762, |
|
"eval_samples_per_second": 615.553, |
|
"eval_steps_per_second": 10.863, |
|
"step": 4704 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"grad_norm": 0.007018107455223799, |
|
"learning_rate": 2.5e-05, |
|
"loss": 0.0007, |
|
"step": 4800 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"eval_LOCATION_f1": 0.9265536723163842, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9010989010989011, |
|
"eval_LOCATION_recall": 0.9534883720930233, |
|
"eval_ORGANIZATION_f1": 0.9405099150141643, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9485714285714286, |
|
"eval_ORGANIZATION_recall": 0.9325842696629213, |
|
"eval_PERSON_f1": 0.9723320158102766, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.984, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.09373489022254944, |
|
"eval_overall_accuracy": 0.988663967611336, |
|
"eval_overall_f1": 0.9476372924648786, |
|
"eval_overall_precision": 0.948849104859335, |
|
"eval_overall_recall": 0.9464285714285714, |
|
"eval_runtime": 0.2788, |
|
"eval_samples_per_second": 609.778, |
|
"eval_steps_per_second": 10.761, |
|
"step": 4800 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"grad_norm": 0.0013735599350184202, |
|
"learning_rate": 2.45e-05, |
|
"loss": 0.0011, |
|
"step": 4896 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"eval_LOCATION_f1": 0.9385474860335195, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9032258064516129, |
|
"eval_LOCATION_recall": 0.9767441860465116, |
|
"eval_ORGANIZATION_f1": 0.9329608938547486, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9277777777777778, |
|
"eval_ORGANIZATION_recall": 0.9382022471910112, |
|
"eval_PERSON_f1": 0.9763779527559054, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9841269841269841, |
|
"eval_PERSON_recall": 0.96875, |
|
"eval_loss": 0.10816428065299988, |
|
"eval_overall_accuracy": 0.9865047233468286, |
|
"eval_overall_f1": 0.9481668773704172, |
|
"eval_overall_precision": 0.9398496240601504, |
|
"eval_overall_recall": 0.9566326530612245, |
|
"eval_runtime": 0.2867, |
|
"eval_samples_per_second": 593.04, |
|
"eval_steps_per_second": 10.465, |
|
"step": 4896 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"grad_norm": 2.9921071529388428, |
|
"learning_rate": 2.4e-05, |
|
"loss": 0.0015, |
|
"step": 4992 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"eval_LOCATION_f1": 0.9265536723163842, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9010989010989011, |
|
"eval_LOCATION_recall": 0.9534883720930233, |
|
"eval_ORGANIZATION_f1": 0.9394812680115273, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9644970414201184, |
|
"eval_ORGANIZATION_recall": 0.9157303370786517, |
|
"eval_PERSON_f1": 0.968503937007874, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9761904761904762, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.11124741286039352, |
|
"eval_overall_accuracy": 0.9878542510121457, |
|
"eval_overall_f1": 0.9460154241645244, |
|
"eval_overall_precision": 0.9533678756476683, |
|
"eval_overall_recall": 0.9387755102040817, |
|
"eval_runtime": 0.2821, |
|
"eval_samples_per_second": 602.698, |
|
"eval_steps_per_second": 10.636, |
|
"step": 4992 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"grad_norm": 0.00152446492575109, |
|
"learning_rate": 2.35e-05, |
|
"loss": 0.0009, |
|
"step": 5088 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"eval_LOCATION_f1": 0.9273743016759777, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8924731182795699, |
|
"eval_LOCATION_recall": 0.9651162790697675, |
|
"eval_ORGANIZATION_f1": 0.9444444444444444, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9340659340659341, |
|
"eval_ORGANIZATION_recall": 0.9550561797752809, |
|
"eval_PERSON_f1": 0.9723320158102766, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.984, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.10318152606487274, |
|
"eval_overall_accuracy": 0.9881241565452091, |
|
"eval_overall_f1": 0.9494949494949495, |
|
"eval_overall_precision": 0.94, |
|
"eval_overall_recall": 0.9591836734693877, |
|
"eval_runtime": 0.2786, |
|
"eval_samples_per_second": 610.124, |
|
"eval_steps_per_second": 10.767, |
|
"step": 5088 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"grad_norm": 1.4761940240859985, |
|
"learning_rate": 2.3000000000000003e-05, |
|
"loss": 0.0033, |
|
"step": 5184 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"eval_LOCATION_f1": 0.9273743016759777, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8924731182795699, |
|
"eval_LOCATION_recall": 0.9651162790697675, |
|
"eval_ORGANIZATION_f1": 0.942857142857143, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9593023255813954, |
|
"eval_ORGANIZATION_recall": 0.9269662921348315, |
|
"eval_PERSON_f1": 0.9723320158102766, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.984, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.11812768876552582, |
|
"eval_overall_accuracy": 0.9870445344129555, |
|
"eval_overall_f1": 0.9488491048593349, |
|
"eval_overall_precision": 0.9512820512820512, |
|
"eval_overall_recall": 0.9464285714285714, |
|
"eval_runtime": 0.2746, |
|
"eval_samples_per_second": 619.118, |
|
"eval_steps_per_second": 10.926, |
|
"step": 5184 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"grad_norm": 0.4280019700527191, |
|
"learning_rate": 2.25e-05, |
|
"loss": 0.0008, |
|
"step": 5280 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"eval_LOCATION_f1": 0.9325842696629213, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9021739130434783, |
|
"eval_LOCATION_recall": 0.9651162790697675, |
|
"eval_ORGANIZATION_f1": 0.9485714285714285, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9651162790697675, |
|
"eval_ORGANIZATION_recall": 0.9325842696629213, |
|
"eval_PERSON_f1": 0.96875, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.96875, |
|
"eval_PERSON_recall": 0.96875, |
|
"eval_loss": 0.12067463994026184, |
|
"eval_overall_accuracy": 0.9865047233468286, |
|
"eval_overall_f1": 0.951530612244898, |
|
"eval_overall_precision": 0.951530612244898, |
|
"eval_overall_recall": 0.951530612244898, |
|
"eval_runtime": 0.2807, |
|
"eval_samples_per_second": 605.66, |
|
"eval_steps_per_second": 10.688, |
|
"step": 5280 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"grad_norm": 0.0007758406572975218, |
|
"learning_rate": 2.2000000000000003e-05, |
|
"loss": 0.0009, |
|
"step": 5376 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"eval_LOCATION_f1": 0.9060773480662985, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8631578947368421, |
|
"eval_LOCATION_recall": 0.9534883720930233, |
|
"eval_ORGANIZATION_f1": 0.9421965317919075, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9702380952380952, |
|
"eval_ORGANIZATION_recall": 0.9157303370786517, |
|
"eval_PERSON_f1": 0.9723320158102766, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.984, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.13788987696170807, |
|
"eval_overall_accuracy": 0.9856950067476383, |
|
"eval_overall_f1": 0.9435897435897437, |
|
"eval_overall_precision": 0.9484536082474226, |
|
"eval_overall_recall": 0.9387755102040817, |
|
"eval_runtime": 0.2774, |
|
"eval_samples_per_second": 612.89, |
|
"eval_steps_per_second": 10.816, |
|
"step": 5376 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"grad_norm": 0.0007105050608515739, |
|
"learning_rate": 2.15e-05, |
|
"loss": 0.001, |
|
"step": 5472 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"eval_LOCATION_f1": 0.9273743016759777, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8924731182795699, |
|
"eval_LOCATION_recall": 0.9651162790697675, |
|
"eval_ORGANIZATION_f1": 0.9512893982808023, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9707602339181286, |
|
"eval_ORGANIZATION_recall": 0.9325842696629213, |
|
"eval_PERSON_f1": 0.9723320158102766, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.984, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.11200056970119476, |
|
"eval_overall_accuracy": 0.9881241565452091, |
|
"eval_overall_f1": 0.9526248399487837, |
|
"eval_overall_precision": 0.9562982005141388, |
|
"eval_overall_recall": 0.9489795918367347, |
|
"eval_runtime": 0.2759, |
|
"eval_samples_per_second": 616.121, |
|
"eval_steps_per_second": 10.873, |
|
"step": 5472 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"grad_norm": 0.0010843342170119286, |
|
"learning_rate": 2.1e-05, |
|
"loss": 0.0013, |
|
"step": 5568 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"eval_LOCATION_f1": 0.9222222222222223, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8829787234042553, |
|
"eval_LOCATION_recall": 0.9651162790697675, |
|
"eval_ORGANIZATION_f1": 0.9375000000000001, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9482758620689655, |
|
"eval_ORGANIZATION_recall": 0.9269662921348315, |
|
"eval_PERSON_f1": 0.9763779527559054, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9841269841269841, |
|
"eval_PERSON_recall": 0.96875, |
|
"eval_loss": 0.1086345985531807, |
|
"eval_overall_accuracy": 0.9862348178137652, |
|
"eval_overall_f1": 0.9465648854961832, |
|
"eval_overall_precision": 0.9441624365482234, |
|
"eval_overall_recall": 0.9489795918367347, |
|
"eval_runtime": 0.2775, |
|
"eval_samples_per_second": 612.711, |
|
"eval_steps_per_second": 10.813, |
|
"step": 5568 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"grad_norm": 0.0003581370983738452, |
|
"learning_rate": 2.05e-05, |
|
"loss": 0.0005, |
|
"step": 5664 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"eval_LOCATION_f1": 0.9180327868852459, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.865979381443299, |
|
"eval_LOCATION_recall": 0.9767441860465116, |
|
"eval_ORGANIZATION_f1": 0.9333333333333333, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9640718562874252, |
|
"eval_ORGANIZATION_recall": 0.9044943820224719, |
|
"eval_PERSON_f1": 0.9612403100775193, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9538461538461539, |
|
"eval_PERSON_recall": 0.96875, |
|
"eval_loss": 0.12184558063745499, |
|
"eval_overall_accuracy": 0.9854251012145749, |
|
"eval_overall_f1": 0.9389312977099236, |
|
"eval_overall_precision": 0.9365482233502538, |
|
"eval_overall_recall": 0.9413265306122449, |
|
"eval_runtime": 0.2757, |
|
"eval_samples_per_second": 616.564, |
|
"eval_steps_per_second": 10.881, |
|
"step": 5664 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"grad_norm": 0.0011471403995528817, |
|
"learning_rate": 2e-05, |
|
"loss": 0.0007, |
|
"step": 5760 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"eval_LOCATION_f1": 0.9213483146067417, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8913043478260869, |
|
"eval_LOCATION_recall": 0.9534883720930233, |
|
"eval_ORGANIZATION_f1": 0.9392265193370166, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9239130434782609, |
|
"eval_ORGANIZATION_recall": 0.9550561797752809, |
|
"eval_PERSON_f1": 0.9682539682539683, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9838709677419355, |
|
"eval_PERSON_recall": 0.953125, |
|
"eval_loss": 0.09577618539333344, |
|
"eval_overall_accuracy": 0.9881241565452091, |
|
"eval_overall_f1": 0.9444444444444445, |
|
"eval_overall_precision": 0.935, |
|
"eval_overall_recall": 0.9540816326530612, |
|
"eval_runtime": 0.2772, |
|
"eval_samples_per_second": 613.208, |
|
"eval_steps_per_second": 10.821, |
|
"step": 5760 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"grad_norm": 0.1609802097082138, |
|
"learning_rate": 1.9500000000000003e-05, |
|
"loss": 0.0002, |
|
"step": 5856 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"eval_LOCATION_f1": 0.9162011173184358, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8817204301075269, |
|
"eval_LOCATION_recall": 0.9534883720930233, |
|
"eval_ORGANIZATION_f1": 0.942857142857143, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9593023255813954, |
|
"eval_ORGANIZATION_recall": 0.9269662921348315, |
|
"eval_PERSON_f1": 0.9644268774703557, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.976, |
|
"eval_PERSON_recall": 0.953125, |
|
"eval_loss": 0.10759799927473068, |
|
"eval_overall_accuracy": 0.9878542510121457, |
|
"eval_overall_f1": 0.9437340153452686, |
|
"eval_overall_precision": 0.9461538461538461, |
|
"eval_overall_recall": 0.9413265306122449, |
|
"eval_runtime": 0.278, |
|
"eval_samples_per_second": 611.566, |
|
"eval_steps_per_second": 10.792, |
|
"step": 5856 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"grad_norm": 12.48816204071045, |
|
"learning_rate": 1.9e-05, |
|
"loss": 0.0023, |
|
"step": 5952 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"eval_LOCATION_f1": 0.9497206703910613, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9139784946236559, |
|
"eval_LOCATION_recall": 0.9883720930232558, |
|
"eval_ORGANIZATION_f1": 0.949438202247191, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.949438202247191, |
|
"eval_ORGANIZATION_recall": 0.949438202247191, |
|
"eval_PERSON_f1": 0.9725490196078432, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9763779527559056, |
|
"eval_PERSON_recall": 0.96875, |
|
"eval_loss": 0.08770798146724701, |
|
"eval_overall_accuracy": 0.9894736842105263, |
|
"eval_overall_f1": 0.9569620253164557, |
|
"eval_overall_precision": 0.949748743718593, |
|
"eval_overall_recall": 0.9642857142857143, |
|
"eval_runtime": 0.2765, |
|
"eval_samples_per_second": 614.816, |
|
"eval_steps_per_second": 10.85, |
|
"step": 5952 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"grad_norm": 0.0009683805401436985, |
|
"learning_rate": 1.85e-05, |
|
"loss": 0.0013, |
|
"step": 6048 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"eval_LOCATION_f1": 0.9385474860335195, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9032258064516129, |
|
"eval_LOCATION_recall": 0.9767441860465116, |
|
"eval_ORGANIZATION_f1": 0.9526462395543176, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9447513812154696, |
|
"eval_ORGANIZATION_recall": 0.9606741573033708, |
|
"eval_PERSON_f1": 0.9763779527559054, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9841269841269841, |
|
"eval_PERSON_recall": 0.96875, |
|
"eval_loss": 0.08852725476026535, |
|
"eval_overall_accuracy": 0.9894736842105263, |
|
"eval_overall_f1": 0.9570707070707071, |
|
"eval_overall_precision": 0.9475, |
|
"eval_overall_recall": 0.9668367346938775, |
|
"eval_runtime": 0.2742, |
|
"eval_samples_per_second": 620.036, |
|
"eval_steps_per_second": 10.942, |
|
"step": 6048 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"grad_norm": 0.0008049598545767367, |
|
"learning_rate": 1.8e-05, |
|
"loss": 0.0009, |
|
"step": 6144 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"eval_LOCATION_f1": 0.9385474860335195, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9032258064516129, |
|
"eval_LOCATION_recall": 0.9767441860465116, |
|
"eval_ORGANIZATION_f1": 0.9577464788732394, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.96045197740113, |
|
"eval_ORGANIZATION_recall": 0.9550561797752809, |
|
"eval_PERSON_f1": 0.9763779527559054, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9841269841269841, |
|
"eval_PERSON_recall": 0.96875, |
|
"eval_loss": 0.08247757703065872, |
|
"eval_overall_accuracy": 0.9900134952766532, |
|
"eval_overall_f1": 0.9593908629441624, |
|
"eval_overall_precision": 0.9545454545454546, |
|
"eval_overall_recall": 0.9642857142857143, |
|
"eval_runtime": 0.2795, |
|
"eval_samples_per_second": 608.296, |
|
"eval_steps_per_second": 10.735, |
|
"step": 6144 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"grad_norm": 0.0007374592823907733, |
|
"learning_rate": 1.75e-05, |
|
"loss": 0.0003, |
|
"step": 6240 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"eval_LOCATION_f1": 0.9431818181818181, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9222222222222223, |
|
"eval_LOCATION_recall": 0.9651162790697675, |
|
"eval_ORGANIZATION_f1": 0.951841359773371, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.96, |
|
"eval_ORGANIZATION_recall": 0.9438202247191011, |
|
"eval_PERSON_f1": 0.9763779527559054, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9841269841269841, |
|
"eval_PERSON_recall": 0.96875, |
|
"eval_loss": 0.0837675929069519, |
|
"eval_overall_accuracy": 0.9883940620782726, |
|
"eval_overall_f1": 0.9578544061302682, |
|
"eval_overall_precision": 0.959079283887468, |
|
"eval_overall_recall": 0.9566326530612245, |
|
"eval_runtime": 0.2762, |
|
"eval_samples_per_second": 615.537, |
|
"eval_steps_per_second": 10.862, |
|
"step": 6240 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"grad_norm": 0.0010951802833005786, |
|
"learning_rate": 1.7000000000000003e-05, |
|
"loss": 0.0006, |
|
"step": 6336 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"eval_LOCATION_f1": 0.9385474860335195, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9032258064516129, |
|
"eval_LOCATION_recall": 0.9767441860465116, |
|
"eval_ORGANIZATION_f1": 0.951841359773371, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.96, |
|
"eval_ORGANIZATION_recall": 0.9438202247191011, |
|
"eval_PERSON_f1": 0.9763779527559054, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9841269841269841, |
|
"eval_PERSON_recall": 0.96875, |
|
"eval_loss": 0.09569484740495682, |
|
"eval_overall_accuracy": 0.988663967611336, |
|
"eval_overall_f1": 0.9567430025445292, |
|
"eval_overall_precision": 0.9543147208121827, |
|
"eval_overall_recall": 0.9591836734693877, |
|
"eval_runtime": 0.2788, |
|
"eval_samples_per_second": 609.729, |
|
"eval_steps_per_second": 10.76, |
|
"step": 6336 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"grad_norm": 0.005136103834956884, |
|
"learning_rate": 1.65e-05, |
|
"loss": 0.0004, |
|
"step": 6432 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"eval_LOCATION_f1": 0.9273743016759777, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8924731182795699, |
|
"eval_LOCATION_recall": 0.9651162790697675, |
|
"eval_ORGANIZATION_f1": 0.9455587392550143, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9649122807017544, |
|
"eval_ORGANIZATION_recall": 0.9269662921348315, |
|
"eval_PERSON_f1": 0.9763779527559054, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9841269841269841, |
|
"eval_PERSON_recall": 0.96875, |
|
"eval_loss": 0.11290714144706726, |
|
"eval_overall_accuracy": 0.9878542510121457, |
|
"eval_overall_f1": 0.9514066496163682, |
|
"eval_overall_precision": 0.9538461538461539, |
|
"eval_overall_recall": 0.9489795918367347, |
|
"eval_runtime": 0.2755, |
|
"eval_samples_per_second": 617.088, |
|
"eval_steps_per_second": 10.89, |
|
"step": 6432 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"grad_norm": 0.0017895177006721497, |
|
"learning_rate": 1.6000000000000003e-05, |
|
"loss": 0.0003, |
|
"step": 6528 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"eval_LOCATION_f1": 0.9333333333333332, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8936170212765957, |
|
"eval_LOCATION_recall": 0.9767441860465116, |
|
"eval_ORGANIZATION_f1": 0.9401709401709402, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.953757225433526, |
|
"eval_ORGANIZATION_recall": 0.9269662921348315, |
|
"eval_PERSON_f1": 0.9725490196078432, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9763779527559056, |
|
"eval_PERSON_recall": 0.96875, |
|
"eval_loss": 0.1161164864897728, |
|
"eval_overall_accuracy": 0.9870445344129555, |
|
"eval_overall_f1": 0.9491094147582698, |
|
"eval_overall_precision": 0.9467005076142132, |
|
"eval_overall_recall": 0.951530612244898, |
|
"eval_runtime": 0.2777, |
|
"eval_samples_per_second": 612.091, |
|
"eval_steps_per_second": 10.802, |
|
"step": 6528 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"grad_norm": 0.00024917226983234286, |
|
"learning_rate": 1.55e-05, |
|
"loss": 0.0002, |
|
"step": 6624 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"eval_LOCATION_f1": 0.9333333333333332, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8936170212765957, |
|
"eval_LOCATION_recall": 0.9767441860465116, |
|
"eval_ORGANIZATION_f1": 0.9394812680115273, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9644970414201184, |
|
"eval_ORGANIZATION_recall": 0.9157303370786517, |
|
"eval_PERSON_f1": 0.96875, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.96875, |
|
"eval_PERSON_recall": 0.96875, |
|
"eval_loss": 0.12338589131832123, |
|
"eval_overall_accuracy": 0.9862348178137652, |
|
"eval_overall_f1": 0.9476372924648786, |
|
"eval_overall_precision": 0.948849104859335, |
|
"eval_overall_recall": 0.9464285714285714, |
|
"eval_runtime": 0.2765, |
|
"eval_samples_per_second": 614.72, |
|
"eval_steps_per_second": 10.848, |
|
"step": 6624 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"grad_norm": 0.002585263457149267, |
|
"learning_rate": 1.5e-05, |
|
"loss": 0.0006, |
|
"step": 6720 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"eval_LOCATION_f1": 0.9491525423728814, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9230769230769231, |
|
"eval_LOCATION_recall": 0.9767441860465116, |
|
"eval_ORGANIZATION_f1": 0.9485714285714285, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9651162790697675, |
|
"eval_ORGANIZATION_recall": 0.9325842696629213, |
|
"eval_PERSON_f1": 0.9763779527559054, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9841269841269841, |
|
"eval_PERSON_recall": 0.96875, |
|
"eval_loss": 0.11618266254663467, |
|
"eval_overall_accuracy": 0.9883940620782726, |
|
"eval_overall_f1": 0.9577464788732394, |
|
"eval_overall_precision": 0.961439588688946, |
|
"eval_overall_recall": 0.9540816326530612, |
|
"eval_runtime": 0.2791, |
|
"eval_samples_per_second": 609.103, |
|
"eval_steps_per_second": 10.749, |
|
"step": 6720 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"grad_norm": 0.11092416942119598, |
|
"learning_rate": 1.45e-05, |
|
"loss": 0.0002, |
|
"step": 6816 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"eval_LOCATION_f1": 0.9545454545454545, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9333333333333333, |
|
"eval_LOCATION_recall": 0.9767441860465116, |
|
"eval_ORGANIZATION_f1": 0.951841359773371, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.96, |
|
"eval_ORGANIZATION_recall": 0.9438202247191011, |
|
"eval_PERSON_f1": 0.9763779527559054, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9841269841269841, |
|
"eval_PERSON_recall": 0.96875, |
|
"eval_loss": 0.11071506142616272, |
|
"eval_overall_accuracy": 0.9878542510121457, |
|
"eval_overall_f1": 0.9604086845466155, |
|
"eval_overall_precision": 0.9616368286445013, |
|
"eval_overall_recall": 0.9591836734693877, |
|
"eval_runtime": 0.2755, |
|
"eval_samples_per_second": 617.089, |
|
"eval_steps_per_second": 10.89, |
|
"step": 6816 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"grad_norm": 0.000154004359501414, |
|
"learning_rate": 1.4000000000000001e-05, |
|
"loss": 0.0002, |
|
"step": 6912 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"eval_LOCATION_f1": 0.9491525423728814, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9230769230769231, |
|
"eval_LOCATION_recall": 0.9767441860465116, |
|
"eval_ORGANIZATION_f1": 0.9488636363636365, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9597701149425287, |
|
"eval_ORGANIZATION_recall": 0.9382022471910112, |
|
"eval_PERSON_f1": 0.9763779527559054, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9841269841269841, |
|
"eval_PERSON_recall": 0.96875, |
|
"eval_loss": 0.1120668277144432, |
|
"eval_overall_accuracy": 0.9878542510121457, |
|
"eval_overall_f1": 0.9578544061302682, |
|
"eval_overall_precision": 0.959079283887468, |
|
"eval_overall_recall": 0.9566326530612245, |
|
"eval_runtime": 0.2766, |
|
"eval_samples_per_second": 614.651, |
|
"eval_steps_per_second": 10.847, |
|
"step": 6912 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"grad_norm": 0.00016238982789218426, |
|
"learning_rate": 1.3500000000000001e-05, |
|
"loss": 0.0002, |
|
"step": 7008 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"eval_LOCATION_f1": 0.9491525423728814, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9230769230769231, |
|
"eval_LOCATION_recall": 0.9767441860465116, |
|
"eval_ORGANIZATION_f1": 0.9461756373937678, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9542857142857143, |
|
"eval_ORGANIZATION_recall": 0.9382022471910112, |
|
"eval_PERSON_f1": 0.9763779527559054, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9841269841269841, |
|
"eval_PERSON_recall": 0.96875, |
|
"eval_loss": 0.11216197162866592, |
|
"eval_overall_accuracy": 0.9881241565452091, |
|
"eval_overall_f1": 0.9566326530612245, |
|
"eval_overall_precision": 0.9566326530612245, |
|
"eval_overall_recall": 0.9566326530612245, |
|
"eval_runtime": 0.285, |
|
"eval_samples_per_second": 596.506, |
|
"eval_steps_per_second": 10.527, |
|
"step": 7008 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"grad_norm": 0.00033696964965201914, |
|
"learning_rate": 1.3000000000000001e-05, |
|
"loss": 0.0005, |
|
"step": 7104 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"eval_LOCATION_f1": 0.9491525423728814, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9230769230769231, |
|
"eval_LOCATION_recall": 0.9767441860465116, |
|
"eval_ORGANIZATION_f1": 0.9461756373937678, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9542857142857143, |
|
"eval_ORGANIZATION_recall": 0.9382022471910112, |
|
"eval_PERSON_f1": 0.9763779527559054, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9841269841269841, |
|
"eval_PERSON_recall": 0.96875, |
|
"eval_loss": 0.1126818060874939, |
|
"eval_overall_accuracy": 0.9873144399460189, |
|
"eval_overall_f1": 0.9566326530612245, |
|
"eval_overall_precision": 0.9566326530612245, |
|
"eval_overall_recall": 0.9566326530612245, |
|
"eval_runtime": 0.2829, |
|
"eval_samples_per_second": 600.942, |
|
"eval_steps_per_second": 10.605, |
|
"step": 7104 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"grad_norm": 0.0003657756024040282, |
|
"learning_rate": 1.25e-05, |
|
"loss": 0.0004, |
|
"step": 7200 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"eval_LOCATION_f1": 0.9438202247191011, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9130434782608695, |
|
"eval_LOCATION_recall": 0.9767441860465116, |
|
"eval_ORGANIZATION_f1": 0.9431818181818182, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9540229885057471, |
|
"eval_ORGANIZATION_recall": 0.9325842696629213, |
|
"eval_PERSON_f1": 0.96875, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.96875, |
|
"eval_PERSON_recall": 0.96875, |
|
"eval_loss": 0.11697709560394287, |
|
"eval_overall_accuracy": 0.9862348178137652, |
|
"eval_overall_f1": 0.9516539440203563, |
|
"eval_overall_precision": 0.949238578680203, |
|
"eval_overall_recall": 0.9540816326530612, |
|
"eval_runtime": 0.2786, |
|
"eval_samples_per_second": 610.145, |
|
"eval_steps_per_second": 10.767, |
|
"step": 7200 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"grad_norm": 0.00010258240217808634, |
|
"learning_rate": 1.2e-05, |
|
"loss": 0.0003, |
|
"step": 7296 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"eval_LOCATION_f1": 0.9545454545454545, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9333333333333333, |
|
"eval_LOCATION_recall": 0.9767441860465116, |
|
"eval_ORGANIZATION_f1": 0.9497206703910613, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9444444444444444, |
|
"eval_ORGANIZATION_recall": 0.9550561797752809, |
|
"eval_PERSON_f1": 0.968503937007874, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9761904761904762, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.10894415527582169, |
|
"eval_overall_accuracy": 0.9892037786774629, |
|
"eval_overall_f1": 0.9568527918781725, |
|
"eval_overall_precision": 0.952020202020202, |
|
"eval_overall_recall": 0.9617346938775511, |
|
"eval_runtime": 0.2762, |
|
"eval_samples_per_second": 615.53, |
|
"eval_steps_per_second": 10.862, |
|
"step": 7296 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"grad_norm": 0.0007157445070333779, |
|
"learning_rate": 1.1500000000000002e-05, |
|
"loss": 0.001, |
|
"step": 7392 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"eval_LOCATION_f1": 0.9491525423728814, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9230769230769231, |
|
"eval_LOCATION_recall": 0.9767441860465116, |
|
"eval_ORGANIZATION_f1": 0.9582172701949861, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9502762430939227, |
|
"eval_ORGANIZATION_recall": 0.9662921348314607, |
|
"eval_PERSON_f1": 0.9725490196078432, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9763779527559056, |
|
"eval_PERSON_recall": 0.96875, |
|
"eval_loss": 0.10824745148420334, |
|
"eval_overall_accuracy": 0.9894736842105263, |
|
"eval_overall_f1": 0.9608091024020227, |
|
"eval_overall_precision": 0.9523809523809523, |
|
"eval_overall_recall": 0.9693877551020408, |
|
"eval_runtime": 0.2772, |
|
"eval_samples_per_second": 613.187, |
|
"eval_steps_per_second": 10.821, |
|
"step": 7392 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"grad_norm": 0.013988692313432693, |
|
"learning_rate": 1.1000000000000001e-05, |
|
"loss": 0.0012, |
|
"step": 7488 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"eval_LOCATION_f1": 0.9325842696629213, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9021739130434783, |
|
"eval_LOCATION_recall": 0.9651162790697675, |
|
"eval_ORGANIZATION_f1": 0.9355742296918768, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9329608938547486, |
|
"eval_ORGANIZATION_recall": 0.9382022471910112, |
|
"eval_PERSON_f1": 0.96875, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.96875, |
|
"eval_PERSON_recall": 0.96875, |
|
"eval_loss": 0.10093524307012558, |
|
"eval_overall_accuracy": 0.9862348178137652, |
|
"eval_overall_f1": 0.9456384323640962, |
|
"eval_overall_precision": 0.9373433583959899, |
|
"eval_overall_recall": 0.9540816326530612, |
|
"eval_runtime": 0.278, |
|
"eval_samples_per_second": 611.532, |
|
"eval_steps_per_second": 10.792, |
|
"step": 7488 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"grad_norm": 0.0004660775884985924, |
|
"learning_rate": 1.05e-05, |
|
"loss": 0.0002, |
|
"step": 7584 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"eval_LOCATION_f1": 0.9060773480662985, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8631578947368421, |
|
"eval_LOCATION_recall": 0.9534883720930233, |
|
"eval_ORGANIZATION_f1": 0.9435028248587571, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9488636363636364, |
|
"eval_ORGANIZATION_recall": 0.9382022471910112, |
|
"eval_PERSON_f1": 0.9644268774703557, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.976, |
|
"eval_PERSON_recall": 0.953125, |
|
"eval_loss": 0.10507776588201523, |
|
"eval_overall_accuracy": 0.9865047233468286, |
|
"eval_overall_f1": 0.9416243654822335, |
|
"eval_overall_precision": 0.9368686868686869, |
|
"eval_overall_recall": 0.9464285714285714, |
|
"eval_runtime": 0.2738, |
|
"eval_samples_per_second": 620.982, |
|
"eval_steps_per_second": 10.959, |
|
"step": 7584 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"grad_norm": 0.0003681587695609778, |
|
"learning_rate": 1e-05, |
|
"loss": 0.0002, |
|
"step": 7680 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"eval_LOCATION_f1": 0.9111111111111112, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8723404255319149, |
|
"eval_LOCATION_recall": 0.9534883720930233, |
|
"eval_ORGANIZATION_f1": 0.9431818181818182, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9540229885057471, |
|
"eval_ORGANIZATION_recall": 0.9325842696629213, |
|
"eval_PERSON_f1": 0.9644268774703557, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.976, |
|
"eval_PERSON_recall": 0.953125, |
|
"eval_loss": 0.11081729084253311, |
|
"eval_overall_accuracy": 0.9865047233468286, |
|
"eval_overall_f1": 0.9426751592356687, |
|
"eval_overall_precision": 0.9414758269720102, |
|
"eval_overall_recall": 0.9438775510204082, |
|
"eval_runtime": 0.2753, |
|
"eval_samples_per_second": 617.505, |
|
"eval_steps_per_second": 10.897, |
|
"step": 7680 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"grad_norm": 0.0002929773472715169, |
|
"learning_rate": 9.5e-06, |
|
"loss": 0.0005, |
|
"step": 7776 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"eval_LOCATION_f1": 0.9213483146067417, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8913043478260869, |
|
"eval_LOCATION_recall": 0.9534883720930233, |
|
"eval_ORGANIZATION_f1": 0.9461756373937678, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9542857142857143, |
|
"eval_ORGANIZATION_recall": 0.9382022471910112, |
|
"eval_PERSON_f1": 0.968503937007874, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9761904761904762, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.10365120321512222, |
|
"eval_overall_accuracy": 0.9870445344129555, |
|
"eval_overall_f1": 0.9477707006369427, |
|
"eval_overall_precision": 0.9465648854961832, |
|
"eval_overall_recall": 0.9489795918367347, |
|
"eval_runtime": 0.2735, |
|
"eval_samples_per_second": 621.671, |
|
"eval_steps_per_second": 10.971, |
|
"step": 7776 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"grad_norm": 0.00024136666615959257, |
|
"learning_rate": 9e-06, |
|
"loss": 0.0003, |
|
"step": 7872 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"eval_LOCATION_f1": 0.9050279329608939, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8709677419354839, |
|
"eval_LOCATION_recall": 0.9418604651162791, |
|
"eval_ORGANIZATION_f1": 0.9431818181818182, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9540229885057471, |
|
"eval_ORGANIZATION_recall": 0.9325842696629213, |
|
"eval_PERSON_f1": 0.9644268774703557, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.976, |
|
"eval_PERSON_recall": 0.953125, |
|
"eval_loss": 0.1031210720539093, |
|
"eval_overall_accuracy": 0.9867746288798921, |
|
"eval_overall_f1": 0.9413265306122449, |
|
"eval_overall_precision": 0.9413265306122449, |
|
"eval_overall_recall": 0.9413265306122449, |
|
"eval_runtime": 0.2763, |
|
"eval_samples_per_second": 615.215, |
|
"eval_steps_per_second": 10.857, |
|
"step": 7872 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"grad_norm": 0.00017047034634742886, |
|
"learning_rate": 8.500000000000002e-06, |
|
"loss": 0.0003, |
|
"step": 7968 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"eval_LOCATION_f1": 0.9378531073446328, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9120879120879121, |
|
"eval_LOCATION_recall": 0.9651162790697675, |
|
"eval_ORGANIZATION_f1": 0.9548022598870057, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9602272727272727, |
|
"eval_ORGANIZATION_recall": 0.949438202247191, |
|
"eval_PERSON_f1": 0.9647058823529412, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.968503937007874, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.09963062405586243, |
|
"eval_overall_accuracy": 0.988663967611336, |
|
"eval_overall_f1": 0.9541984732824428, |
|
"eval_overall_precision": 0.9517766497461929, |
|
"eval_overall_recall": 0.9566326530612245, |
|
"eval_runtime": 0.2758, |
|
"eval_samples_per_second": 616.456, |
|
"eval_steps_per_second": 10.879, |
|
"step": 7968 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"grad_norm": 0.0007244854350574315, |
|
"learning_rate": 8.000000000000001e-06, |
|
"loss": 0.0002, |
|
"step": 8064 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"eval_LOCATION_f1": 0.9431818181818181, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9222222222222223, |
|
"eval_LOCATION_recall": 0.9651162790697675, |
|
"eval_ORGANIZATION_f1": 0.9548022598870057, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9602272727272727, |
|
"eval_ORGANIZATION_recall": 0.949438202247191, |
|
"eval_PERSON_f1": 0.9647058823529412, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.968503937007874, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.09869366884231567, |
|
"eval_overall_accuracy": 0.988663967611336, |
|
"eval_overall_f1": 0.9554140127388535, |
|
"eval_overall_precision": 0.9541984732824428, |
|
"eval_overall_recall": 0.9566326530612245, |
|
"eval_runtime": 0.2758, |
|
"eval_samples_per_second": 616.49, |
|
"eval_steps_per_second": 10.879, |
|
"step": 8064 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"grad_norm": 0.00027018680702894926, |
|
"learning_rate": 7.5e-06, |
|
"loss": 0.0004, |
|
"step": 8160 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"eval_LOCATION_f1": 0.9431818181818181, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9222222222222223, |
|
"eval_LOCATION_recall": 0.9651162790697675, |
|
"eval_ORGANIZATION_f1": 0.9548022598870057, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9602272727272727, |
|
"eval_ORGANIZATION_recall": 0.949438202247191, |
|
"eval_PERSON_f1": 0.9647058823529412, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.968503937007874, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.10174024105072021, |
|
"eval_overall_accuracy": 0.988663967611336, |
|
"eval_overall_f1": 0.9554140127388535, |
|
"eval_overall_precision": 0.9541984732824428, |
|
"eval_overall_recall": 0.9566326530612245, |
|
"eval_runtime": 0.2746, |
|
"eval_samples_per_second": 618.994, |
|
"eval_steps_per_second": 10.923, |
|
"step": 8160 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"grad_norm": 0.00015681206423323601, |
|
"learning_rate": 7.000000000000001e-06, |
|
"loss": 0.0002, |
|
"step": 8256 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"eval_LOCATION_f1": 0.9431818181818181, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9222222222222223, |
|
"eval_LOCATION_recall": 0.9651162790697675, |
|
"eval_ORGANIZATION_f1": 0.9548022598870057, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9602272727272727, |
|
"eval_ORGANIZATION_recall": 0.949438202247191, |
|
"eval_PERSON_f1": 0.9647058823529412, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.968503937007874, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.10175755620002747, |
|
"eval_overall_accuracy": 0.988663967611336, |
|
"eval_overall_f1": 0.9554140127388535, |
|
"eval_overall_precision": 0.9541984732824428, |
|
"eval_overall_recall": 0.9566326530612245, |
|
"eval_runtime": 0.2831, |
|
"eval_samples_per_second": 600.454, |
|
"eval_steps_per_second": 10.596, |
|
"step": 8256 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"grad_norm": 0.00022313217050395906, |
|
"learning_rate": 6.5000000000000004e-06, |
|
"loss": 0.0001, |
|
"step": 8352 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"eval_LOCATION_f1": 0.9431818181818181, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9222222222222223, |
|
"eval_LOCATION_recall": 0.9651162790697675, |
|
"eval_ORGANIZATION_f1": 0.957983193277311, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9553072625698324, |
|
"eval_ORGANIZATION_recall": 0.9606741573033708, |
|
"eval_PERSON_f1": 0.9647058823529412, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.968503937007874, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.10168375074863434, |
|
"eval_overall_accuracy": 0.9889338731443995, |
|
"eval_overall_f1": 0.9568527918781725, |
|
"eval_overall_precision": 0.952020202020202, |
|
"eval_overall_recall": 0.9617346938775511, |
|
"eval_runtime": 0.2755, |
|
"eval_samples_per_second": 617.136, |
|
"eval_steps_per_second": 10.891, |
|
"step": 8352 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"grad_norm": 0.0003491460520308465, |
|
"learning_rate": 6e-06, |
|
"loss": 0.0002, |
|
"step": 8448 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"eval_LOCATION_f1": 0.9431818181818181, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9222222222222223, |
|
"eval_LOCATION_recall": 0.9651162790697675, |
|
"eval_ORGANIZATION_f1": 0.9548022598870057, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9602272727272727, |
|
"eval_ORGANIZATION_recall": 0.949438202247191, |
|
"eval_PERSON_f1": 0.9647058823529412, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.968503937007874, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.10284104943275452, |
|
"eval_overall_accuracy": 0.988663967611336, |
|
"eval_overall_f1": 0.9554140127388535, |
|
"eval_overall_precision": 0.9541984732824428, |
|
"eval_overall_recall": 0.9566326530612245, |
|
"eval_runtime": 0.2864, |
|
"eval_samples_per_second": 593.603, |
|
"eval_steps_per_second": 10.475, |
|
"step": 8448 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"grad_norm": 0.00023058451188262552, |
|
"learning_rate": 5.500000000000001e-06, |
|
"loss": 0.0001, |
|
"step": 8544 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"eval_LOCATION_f1": 0.9431818181818181, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9222222222222223, |
|
"eval_LOCATION_recall": 0.9651162790697675, |
|
"eval_ORGANIZATION_f1": 0.9548022598870057, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9602272727272727, |
|
"eval_ORGANIZATION_recall": 0.949438202247191, |
|
"eval_PERSON_f1": 0.9647058823529412, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.968503937007874, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.10325466841459274, |
|
"eval_overall_accuracy": 0.988663967611336, |
|
"eval_overall_f1": 0.9554140127388535, |
|
"eval_overall_precision": 0.9541984732824428, |
|
"eval_overall_recall": 0.9566326530612245, |
|
"eval_runtime": 0.2769, |
|
"eval_samples_per_second": 613.882, |
|
"eval_steps_per_second": 10.833, |
|
"step": 8544 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"grad_norm": 0.00042677970486693084, |
|
"learning_rate": 5e-06, |
|
"loss": 0.0002, |
|
"step": 8640 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"eval_LOCATION_f1": 0.9371428571428573, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9213483146067416, |
|
"eval_LOCATION_recall": 0.9534883720930233, |
|
"eval_ORGANIZATION_f1": 0.9491525423728814, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9545454545454546, |
|
"eval_ORGANIZATION_recall": 0.9438202247191011, |
|
"eval_PERSON_f1": 0.968503937007874, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9761904761904762, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.1025572419166565, |
|
"eval_overall_accuracy": 0.9878542510121457, |
|
"eval_overall_f1": 0.9527458492975734, |
|
"eval_overall_precision": 0.9539641943734015, |
|
"eval_overall_recall": 0.951530612244898, |
|
"eval_runtime": 0.2749, |
|
"eval_samples_per_second": 618.381, |
|
"eval_steps_per_second": 10.913, |
|
"step": 8640 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"grad_norm": 0.00043625899706967175, |
|
"learning_rate": 4.5e-06, |
|
"loss": 0.0002, |
|
"step": 8736 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"eval_LOCATION_f1": 0.9371428571428573, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9213483146067416, |
|
"eval_LOCATION_recall": 0.9534883720930233, |
|
"eval_ORGANIZATION_f1": 0.9491525423728814, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9545454545454546, |
|
"eval_ORGANIZATION_recall": 0.9438202247191011, |
|
"eval_PERSON_f1": 0.968503937007874, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9761904761904762, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.10244476050138474, |
|
"eval_overall_accuracy": 0.9878542510121457, |
|
"eval_overall_f1": 0.9527458492975734, |
|
"eval_overall_precision": 0.9539641943734015, |
|
"eval_overall_recall": 0.951530612244898, |
|
"eval_runtime": 0.2764, |
|
"eval_samples_per_second": 615.112, |
|
"eval_steps_per_second": 10.855, |
|
"step": 8736 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"grad_norm": 0.0001665508607402444, |
|
"learning_rate": 4.000000000000001e-06, |
|
"loss": 0.0002, |
|
"step": 8832 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"eval_LOCATION_f1": 0.9371428571428573, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9213483146067416, |
|
"eval_LOCATION_recall": 0.9534883720930233, |
|
"eval_ORGANIZATION_f1": 0.9491525423728814, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9545454545454546, |
|
"eval_ORGANIZATION_recall": 0.9438202247191011, |
|
"eval_PERSON_f1": 0.968503937007874, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9761904761904762, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.10252244770526886, |
|
"eval_overall_accuracy": 0.9878542510121457, |
|
"eval_overall_f1": 0.9527458492975734, |
|
"eval_overall_precision": 0.9539641943734015, |
|
"eval_overall_recall": 0.951530612244898, |
|
"eval_runtime": 0.2809, |
|
"eval_samples_per_second": 605.297, |
|
"eval_steps_per_second": 10.682, |
|
"step": 8832 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"grad_norm": 0.0002152398374164477, |
|
"learning_rate": 3.5000000000000004e-06, |
|
"loss": 0.0002, |
|
"step": 8928 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"eval_LOCATION_f1": 0.9371428571428573, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9213483146067416, |
|
"eval_LOCATION_recall": 0.9534883720930233, |
|
"eval_ORGANIZATION_f1": 0.9491525423728814, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9545454545454546, |
|
"eval_ORGANIZATION_recall": 0.9438202247191011, |
|
"eval_PERSON_f1": 0.968503937007874, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9761904761904762, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.10386810451745987, |
|
"eval_overall_accuracy": 0.9878542510121457, |
|
"eval_overall_f1": 0.9527458492975734, |
|
"eval_overall_precision": 0.9539641943734015, |
|
"eval_overall_recall": 0.951530612244898, |
|
"eval_runtime": 0.2851, |
|
"eval_samples_per_second": 596.31, |
|
"eval_steps_per_second": 10.523, |
|
"step": 8928 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"grad_norm": 0.00013109896099194884, |
|
"learning_rate": 3e-06, |
|
"loss": 0.0001, |
|
"step": 9024 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"eval_LOCATION_f1": 0.9371428571428573, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9213483146067416, |
|
"eval_LOCATION_recall": 0.9534883720930233, |
|
"eval_ORGANIZATION_f1": 0.9491525423728814, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9545454545454546, |
|
"eval_ORGANIZATION_recall": 0.9438202247191011, |
|
"eval_PERSON_f1": 0.968503937007874, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9761904761904762, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.10342691838741302, |
|
"eval_overall_accuracy": 0.9878542510121457, |
|
"eval_overall_f1": 0.9527458492975734, |
|
"eval_overall_precision": 0.9539641943734015, |
|
"eval_overall_recall": 0.951530612244898, |
|
"eval_runtime": 0.2864, |
|
"eval_samples_per_second": 593.558, |
|
"eval_steps_per_second": 10.475, |
|
"step": 9024 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"grad_norm": 8.776304457569495e-05, |
|
"learning_rate": 2.5e-06, |
|
"loss": 0.0001, |
|
"step": 9120 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"eval_LOCATION_f1": 0.9371428571428573, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.9213483146067416, |
|
"eval_LOCATION_recall": 0.9534883720930233, |
|
"eval_ORGANIZATION_f1": 0.9491525423728814, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.9545454545454546, |
|
"eval_ORGANIZATION_recall": 0.9438202247191011, |
|
"eval_PERSON_f1": 0.968503937007874, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9761904761904762, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.1035594493150711, |
|
"eval_overall_accuracy": 0.9878542510121457, |
|
"eval_overall_f1": 0.9527458492975734, |
|
"eval_overall_precision": 0.9539641943734015, |
|
"eval_overall_recall": 0.951530612244898, |
|
"eval_runtime": 0.2771, |
|
"eval_samples_per_second": 613.457, |
|
"eval_steps_per_second": 10.826, |
|
"step": 9120 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"grad_norm": 0.00011784955131588504, |
|
"learning_rate": 2.0000000000000003e-06, |
|
"loss": 0.0001, |
|
"step": 9216 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"eval_LOCATION_f1": 0.9273743016759777, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8924731182795699, |
|
"eval_LOCATION_recall": 0.9651162790697675, |
|
"eval_ORGANIZATION_f1": 0.9401709401709402, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.953757225433526, |
|
"eval_ORGANIZATION_recall": 0.9269662921348315, |
|
"eval_PERSON_f1": 0.968503937007874, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.9761904761904762, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.10866863280534744, |
|
"eval_overall_accuracy": 0.9873144399460189, |
|
"eval_overall_f1": 0.9464285714285714, |
|
"eval_overall_precision": 0.9464285714285714, |
|
"eval_overall_recall": 0.9464285714285714, |
|
"eval_runtime": 0.2796, |
|
"eval_samples_per_second": 608.08, |
|
"eval_steps_per_second": 10.731, |
|
"step": 9216 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"grad_norm": 0.0001753137621562928, |
|
"learning_rate": 1.5e-06, |
|
"loss": 0.0005, |
|
"step": 9312 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"eval_LOCATION_f1": 0.9273743016759777, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8924731182795699, |
|
"eval_LOCATION_recall": 0.9651162790697675, |
|
"eval_ORGANIZATION_f1": 0.9401709401709402, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.953757225433526, |
|
"eval_ORGANIZATION_recall": 0.9269662921348315, |
|
"eval_PERSON_f1": 0.9647058823529412, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.968503937007874, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.10562655329704285, |
|
"eval_overall_accuracy": 0.9875843454790824, |
|
"eval_overall_f1": 0.9452229299363057, |
|
"eval_overall_precision": 0.9440203562340967, |
|
"eval_overall_recall": 0.9464285714285714, |
|
"eval_runtime": 0.2763, |
|
"eval_samples_per_second": 615.195, |
|
"eval_steps_per_second": 10.856, |
|
"step": 9312 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"grad_norm": 0.000347200024407357, |
|
"learning_rate": 1.0000000000000002e-06, |
|
"loss": 0.0003, |
|
"step": 9408 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"eval_LOCATION_f1": 0.9273743016759777, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8924731182795699, |
|
"eval_LOCATION_recall": 0.9651162790697675, |
|
"eval_ORGANIZATION_f1": 0.9401709401709402, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.953757225433526, |
|
"eval_ORGANIZATION_recall": 0.9269662921348315, |
|
"eval_PERSON_f1": 0.9647058823529412, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.968503937007874, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.10447113960981369, |
|
"eval_overall_accuracy": 0.9875843454790824, |
|
"eval_overall_f1": 0.9452229299363057, |
|
"eval_overall_precision": 0.9440203562340967, |
|
"eval_overall_recall": 0.9464285714285714, |
|
"eval_runtime": 0.2767, |
|
"eval_samples_per_second": 614.345, |
|
"eval_steps_per_second": 10.841, |
|
"step": 9408 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"grad_norm": 0.0003261720994487405, |
|
"learning_rate": 5.000000000000001e-07, |
|
"loss": 0.0001, |
|
"step": 9504 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"eval_LOCATION_f1": 0.9273743016759777, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8924731182795699, |
|
"eval_LOCATION_recall": 0.9651162790697675, |
|
"eval_ORGANIZATION_f1": 0.9401709401709402, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.953757225433526, |
|
"eval_ORGANIZATION_recall": 0.9269662921348315, |
|
"eval_PERSON_f1": 0.9647058823529412, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.968503937007874, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.10466174781322479, |
|
"eval_overall_accuracy": 0.9875843454790824, |
|
"eval_overall_f1": 0.9452229299363057, |
|
"eval_overall_precision": 0.9440203562340967, |
|
"eval_overall_recall": 0.9464285714285714, |
|
"eval_runtime": 0.2746, |
|
"eval_samples_per_second": 619.061, |
|
"eval_steps_per_second": 10.925, |
|
"step": 9504 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"grad_norm": 9.912410314427689e-05, |
|
"learning_rate": 0.0, |
|
"loss": 0.0002, |
|
"step": 9600 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"eval_LOCATION_f1": 0.9273743016759777, |
|
"eval_LOCATION_number": 86, |
|
"eval_LOCATION_precision": 0.8924731182795699, |
|
"eval_LOCATION_recall": 0.9651162790697675, |
|
"eval_ORGANIZATION_f1": 0.9401709401709402, |
|
"eval_ORGANIZATION_number": 178, |
|
"eval_ORGANIZATION_precision": 0.953757225433526, |
|
"eval_ORGANIZATION_recall": 0.9269662921348315, |
|
"eval_PERSON_f1": 0.9647058823529412, |
|
"eval_PERSON_number": 128, |
|
"eval_PERSON_precision": 0.968503937007874, |
|
"eval_PERSON_recall": 0.9609375, |
|
"eval_loss": 0.10467950254678726, |
|
"eval_overall_accuracy": 0.9875843454790824, |
|
"eval_overall_f1": 0.9452229299363057, |
|
"eval_overall_precision": 0.9440203562340967, |
|
"eval_overall_recall": 0.9464285714285714, |
|
"eval_runtime": 0.2862, |
|
"eval_samples_per_second": 593.895, |
|
"eval_steps_per_second": 10.48, |
|
"step": 9600 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"step": 9600, |
|
"total_flos": 3867927199316004.0, |
|
"train_loss": 0.005292673466804748, |
|
"train_runtime": 863.5274, |
|
"train_samples_per_second": 177.296, |
|
"train_steps_per_second": 11.117 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 9600, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 100, |
|
"save_steps": 500, |
|
"total_flos": 3867927199316004.0, |
|
"train_batch_size": 16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|