m0_flat_ner_ocr_cmbert_io / trainer_state.json
nlpso's picture
Load model and tokenizer
f2a84c8
{
"best_metric": 0.9642591213700671,
"best_model_checkpoint": "/work/stual/res_ICDAR/method_0/tmp/41-flat-ner-pero-ocr-camembert_ner/checkpoint-900",
"epoch": 2.362204724409449,
"global_step": 900,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.26,
"eval_ACT": {
"f1": 0.8502242152466369,
"number": 519,
"precision": 0.7953020134228188,
"recall": 0.9132947976878613
},
"eval_CARDINAL": {
"f1": 0.9723032069970846,
"number": 678,
"precision": 0.9610951008645533,
"recall": 0.9837758112094396
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9184993531694695,
"number": 761,
"precision": 0.9044585987261147,
"recall": 0.9329829172141918
},
"eval_PER": {
"f1": 0.9062957540263543,
"number": 679,
"precision": 0.901018922852984,
"recall": 0.9116347569955817
},
"eval_TITRE": {
"f1": 0.0,
"number": 41,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.9454568463680081,
"eval_f1": 0.9069212410501192,
"eval_loss": 0.2516954839229584,
"eval_precision": 0.8942795076031861,
"eval_recall": 0.9199255121042831,
"eval_runtime": 2.036,
"eval_samples_per_second": 332.026,
"eval_steps_per_second": 21.12,
"step": 100
},
{
"epoch": 0.52,
"eval_ACT": {
"f1": 0.8866359447004608,
"number": 519,
"precision": 0.8498233215547704,
"recall": 0.9267822736030829
},
"eval_CARDINAL": {
"f1": 0.9786607799852833,
"number": 678,
"precision": 0.9765051395007343,
"recall": 0.9808259587020649
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9327296248382924,
"number": 761,
"precision": 0.9184713375796179,
"recall": 0.9474375821287779
},
"eval_PER": {
"f1": 0.9166666666666666,
"number": 679,
"precision": 0.9100145137880987,
"recall": 0.9234167893961709
},
"eval_TITRE": {
"f1": 0.0,
"number": 41,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.9538091622374083,
"eval_f1": 0.9226785053644099,
"eval_loss": 0.18263815343379974,
"eval_precision": 0.9165747886806321,
"eval_recall": 0.9288640595903166,
"eval_runtime": 2.0314,
"eval_samples_per_second": 332.78,
"eval_steps_per_second": 21.168,
"step": 200
},
{
"epoch": 0.79,
"eval_ACT": {
"f1": 0.9261744966442953,
"number": 519,
"precision": 0.9217557251908397,
"recall": 0.930635838150289
},
"eval_CARDINAL": {
"f1": 0.9816581071166545,
"number": 678,
"precision": 0.9766423357664233,
"recall": 0.9867256637168141
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.947780678851175,
"number": 761,
"precision": 0.9416342412451362,
"recall": 0.9540078843626807
},
"eval_PER": {
"f1": 0.94620486366986,
"number": 679,
"precision": 0.9469026548672567,
"recall": 0.9455081001472754
},
"eval_TITRE": {
"f1": 0.4675324675324676,
"number": 41,
"precision": 0.5,
"recall": 0.43902439024390244
},
"eval_accuracy": 0.9639331814730449,
"eval_f1": 0.9436698271054099,
"eval_loss": 0.13531556725502014,
"eval_precision": 0.9420935412026726,
"eval_recall": 0.9452513966480447,
"eval_runtime": 2.0117,
"eval_samples_per_second": 336.027,
"eval_steps_per_second": 21.375,
"step": 300
},
{
"epoch": 1.05,
"eval_ACT": {
"f1": 0.9381541389153186,
"number": 519,
"precision": 0.9266917293233082,
"recall": 0.9499036608863198
},
"eval_CARDINAL": {
"f1": 0.9852724594992636,
"number": 678,
"precision": 0.9838235294117647,
"recall": 0.9867256637168141
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9483322432962721,
"number": 761,
"precision": 0.9440104166666666,
"recall": 0.9526938239159002
},
"eval_PER": {
"f1": 0.9553113553113554,
"number": 679,
"precision": 0.9504373177842566,
"recall": 0.9602356406480118
},
"eval_TITRE": {
"f1": 0.5813953488372093,
"number": 41,
"precision": 0.5555555555555556,
"recall": 0.6097560975609756
},
"eval_accuracy": 0.9646924829157175,
"eval_f1": 0.9503335804299481,
"eval_loss": 0.11591742187738419,
"eval_precision": 0.9457764662486168,
"eval_recall": 0.9549348230912477,
"eval_runtime": 2.0409,
"eval_samples_per_second": 331.23,
"eval_steps_per_second": 21.069,
"step": 400
},
{
"epoch": 1.31,
"learning_rate": 9e-05,
"loss": 0.2356,
"step": 500
},
{
"epoch": 1.31,
"eval_ACT": {
"f1": 0.9393939393939394,
"number": 519,
"precision": 0.9236499068901304,
"recall": 0.9556840077071291
},
"eval_CARDINAL": {
"f1": 0.9830258302583026,
"number": 678,
"precision": 0.983751846381093,
"recall": 0.9823008849557522
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.944769330734243,
"number": 761,
"precision": 0.9344473007712082,
"recall": 0.9553219448094612
},
"eval_PER": {
"f1": 0.9618208516886931,
"number": 679,
"precision": 0.95900439238653,
"recall": 0.9646539027982327
},
"eval_TITRE": {
"f1": 0.684931506849315,
"number": 41,
"precision": 0.78125,
"recall": 0.6097560975609756
},
"eval_accuracy": 0.9710199949379904,
"eval_f1": 0.952893175074184,
"eval_loss": 0.10950864851474762,
"eval_precision": 0.949021056520133,
"eval_recall": 0.9567970204841714,
"eval_runtime": 2.1232,
"eval_samples_per_second": 318.382,
"eval_steps_per_second": 20.252,
"step": 500
},
{
"epoch": 1.57,
"eval_ACT": {
"f1": 0.9485714285714286,
"number": 519,
"precision": 0.9378531073446328,
"recall": 0.9595375722543352
},
"eval_CARDINAL": {
"f1": 0.9801907556859869,
"number": 678,
"precision": 0.9751824817518249,
"recall": 0.9852507374631269
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9492187500000001,
"number": 761,
"precision": 0.9406451612903226,
"recall": 0.9579500657030223
},
"eval_PER": {
"f1": 0.96759941089838,
"number": 679,
"precision": 0.96759941089838,
"recall": 0.96759941089838
},
"eval_TITRE": {
"f1": 0.7160493827160495,
"number": 41,
"precision": 0.725,
"recall": 0.7073170731707317
},
"eval_accuracy": 0.9716527461402177,
"eval_f1": 0.9568118628359593,
"eval_loss": 0.09932182729244232,
"eval_precision": 0.9523985239852398,
"eval_recall": 0.9612662942271881,
"eval_runtime": 2.1374,
"eval_samples_per_second": 316.273,
"eval_steps_per_second": 20.118,
"step": 600
},
{
"epoch": 1.84,
"eval_ACT": {
"f1": 0.9541984732824428,
"number": 519,
"precision": 0.945179584120983,
"recall": 0.9633911368015414
},
"eval_CARDINAL": {
"f1": 0.9852507374631269,
"number": 678,
"precision": 0.9852507374631269,
"recall": 0.9852507374631269
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9510124101894187,
"number": 761,
"precision": 0.9454545454545454,
"recall": 0.9566360052562418
},
"eval_PER": {
"f1": 0.9771891096394407,
"number": 679,
"precision": 0.9764705882352941,
"recall": 0.9779086892488954
},
"eval_TITRE": {
"f1": 0.7848101265822786,
"number": 41,
"precision": 0.8157894736842105,
"recall": 0.7560975609756098
},
"eval_accuracy": 0.9779802581624905,
"eval_f1": 0.9631970260223048,
"eval_loss": 0.08475597947835922,
"eval_precision": 0.9614100185528757,
"eval_recall": 0.9649906890130354,
"eval_runtime": 2.0431,
"eval_samples_per_second": 330.877,
"eval_steps_per_second": 21.047,
"step": 700
},
{
"epoch": 2.1,
"eval_ACT": {
"f1": 0.9468690702087287,
"number": 519,
"precision": 0.9327102803738317,
"recall": 0.9614643545279383
},
"eval_CARDINAL": {
"f1": 0.9852507374631269,
"number": 678,
"precision": 0.9852507374631269,
"recall": 0.9852507374631269
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9432485322896281,
"number": 761,
"precision": 0.9365284974093264,
"recall": 0.9500657030223391
},
"eval_PER": {
"f1": 0.9705882352941176,
"number": 679,
"precision": 0.9691629955947136,
"recall": 0.9720176730486009
},
"eval_TITRE": {
"f1": 0.7594936708860759,
"number": 41,
"precision": 0.7894736842105263,
"recall": 0.7317073170731707
},
"eval_accuracy": 0.9746899519109087,
"eval_f1": 0.9575060308034886,
"eval_loss": 0.08957625180482864,
"eval_precision": 0.9541420118343196,
"eval_recall": 0.9608938547486033,
"eval_runtime": 2.0502,
"eval_samples_per_second": 329.727,
"eval_steps_per_second": 20.974,
"step": 800
},
{
"epoch": 2.36,
"eval_ACT": {
"f1": 0.9570200573065903,
"number": 519,
"precision": 0.9488636363636364,
"recall": 0.9653179190751445
},
"eval_CARDINAL": {
"f1": 0.9866666666666667,
"number": 678,
"precision": 0.9910714285714286,
"recall": 0.9823008849557522
},
"eval_FT": {
"f1": 0.22222222222222224,
"number": 7,
"precision": 0.5,
"recall": 0.14285714285714285
},
"eval_LOC": {
"f1": 0.9542483660130721,
"number": 761,
"precision": 0.9492847854356307,
"recall": 0.9592641261498029
},
"eval_PER": {
"f1": 0.9779086892488954,
"number": 679,
"precision": 0.9779086892488954,
"recall": 0.9779086892488954
},
"eval_TITRE": {
"f1": 0.7179487179487181,
"number": 41,
"precision": 0.7567567567567568,
"recall": 0.6829268292682927
},
"eval_accuracy": 0.9743103011895723,
"eval_f1": 0.9642591213700671,
"eval_loss": 0.08395500481128693,
"eval_precision": 0.9639002605135839,
"eval_recall": 0.9646182495344506,
"eval_runtime": 2.07,
"eval_samples_per_second": 326.576,
"eval_steps_per_second": 20.773,
"step": 900
}
],
"max_steps": 5000,
"num_train_epochs": 14,
"total_flos": 365778917703408.0,
"trial_name": null,
"trial_params": null
}