{ "best_metric": 0.9642591213700671, "best_model_checkpoint": "/work/stual/res_ICDAR/method_0/tmp/41-flat-ner-pero-ocr-camembert_ner/checkpoint-900", "epoch": 2.362204724409449, "global_step": 900, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.26, "eval_ACT": { "f1": 0.8502242152466369, "number": 519, "precision": 0.7953020134228188, "recall": 0.9132947976878613 }, "eval_CARDINAL": { "f1": 0.9723032069970846, "number": 678, "precision": 0.9610951008645533, "recall": 0.9837758112094396 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.9184993531694695, "number": 761, "precision": 0.9044585987261147, "recall": 0.9329829172141918 }, "eval_PER": { "f1": 0.9062957540263543, "number": 679, "precision": 0.901018922852984, "recall": 0.9116347569955817 }, "eval_TITRE": { "f1": 0.0, "number": 41, "precision": 0.0, "recall": 0.0 }, "eval_accuracy": 0.9454568463680081, "eval_f1": 0.9069212410501192, "eval_loss": 0.2516954839229584, "eval_precision": 0.8942795076031861, "eval_recall": 0.9199255121042831, "eval_runtime": 2.036, "eval_samples_per_second": 332.026, "eval_steps_per_second": 21.12, "step": 100 }, { "epoch": 0.52, "eval_ACT": { "f1": 0.8866359447004608, "number": 519, "precision": 0.8498233215547704, "recall": 0.9267822736030829 }, "eval_CARDINAL": { "f1": 0.9786607799852833, "number": 678, "precision": 0.9765051395007343, "recall": 0.9808259587020649 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.9327296248382924, "number": 761, "precision": 0.9184713375796179, "recall": 0.9474375821287779 }, "eval_PER": { "f1": 0.9166666666666666, "number": 679, "precision": 0.9100145137880987, "recall": 0.9234167893961709 }, "eval_TITRE": { "f1": 0.0, "number": 41, "precision": 0.0, "recall": 0.0 }, "eval_accuracy": 0.9538091622374083, "eval_f1": 0.9226785053644099, "eval_loss": 0.18263815343379974, "eval_precision": 0.9165747886806321, "eval_recall": 0.9288640595903166, "eval_runtime": 2.0314, "eval_samples_per_second": 332.78, "eval_steps_per_second": 21.168, "step": 200 }, { "epoch": 0.79, "eval_ACT": { "f1": 0.9261744966442953, "number": 519, "precision": 0.9217557251908397, "recall": 0.930635838150289 }, "eval_CARDINAL": { "f1": 0.9816581071166545, "number": 678, "precision": 0.9766423357664233, "recall": 0.9867256637168141 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.947780678851175, "number": 761, "precision": 0.9416342412451362, "recall": 0.9540078843626807 }, "eval_PER": { "f1": 0.94620486366986, "number": 679, "precision": 0.9469026548672567, "recall": 0.9455081001472754 }, "eval_TITRE": { "f1": 0.4675324675324676, "number": 41, "precision": 0.5, "recall": 0.43902439024390244 }, "eval_accuracy": 0.9639331814730449, "eval_f1": 0.9436698271054099, "eval_loss": 0.13531556725502014, "eval_precision": 0.9420935412026726, "eval_recall": 0.9452513966480447, "eval_runtime": 2.0117, "eval_samples_per_second": 336.027, "eval_steps_per_second": 21.375, "step": 300 }, { "epoch": 1.05, "eval_ACT": { "f1": 0.9381541389153186, "number": 519, "precision": 0.9266917293233082, "recall": 0.9499036608863198 }, "eval_CARDINAL": { "f1": 0.9852724594992636, "number": 678, "precision": 0.9838235294117647, "recall": 0.9867256637168141 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.9483322432962721, "number": 761, "precision": 0.9440104166666666, "recall": 0.9526938239159002 }, "eval_PER": { "f1": 0.9553113553113554, "number": 679, "precision": 0.9504373177842566, "recall": 0.9602356406480118 }, "eval_TITRE": { "f1": 0.5813953488372093, "number": 41, "precision": 0.5555555555555556, "recall": 0.6097560975609756 }, "eval_accuracy": 0.9646924829157175, "eval_f1": 0.9503335804299481, "eval_loss": 0.11591742187738419, "eval_precision": 0.9457764662486168, "eval_recall": 0.9549348230912477, "eval_runtime": 2.0409, "eval_samples_per_second": 331.23, "eval_steps_per_second": 21.069, "step": 400 }, { "epoch": 1.31, "learning_rate": 9e-05, "loss": 0.2356, "step": 500 }, { "epoch": 1.31, "eval_ACT": { "f1": 0.9393939393939394, "number": 519, "precision": 0.9236499068901304, "recall": 0.9556840077071291 }, "eval_CARDINAL": { "f1": 0.9830258302583026, "number": 678, "precision": 0.983751846381093, "recall": 0.9823008849557522 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.944769330734243, "number": 761, "precision": 0.9344473007712082, "recall": 0.9553219448094612 }, "eval_PER": { "f1": 0.9618208516886931, "number": 679, "precision": 0.95900439238653, "recall": 0.9646539027982327 }, "eval_TITRE": { "f1": 0.684931506849315, "number": 41, "precision": 0.78125, "recall": 0.6097560975609756 }, "eval_accuracy": 0.9710199949379904, "eval_f1": 0.952893175074184, "eval_loss": 0.10950864851474762, "eval_precision": 0.949021056520133, "eval_recall": 0.9567970204841714, "eval_runtime": 2.1232, "eval_samples_per_second": 318.382, "eval_steps_per_second": 20.252, "step": 500 }, { "epoch": 1.57, "eval_ACT": { "f1": 0.9485714285714286, "number": 519, "precision": 0.9378531073446328, "recall": 0.9595375722543352 }, "eval_CARDINAL": { "f1": 0.9801907556859869, "number": 678, "precision": 0.9751824817518249, "recall": 0.9852507374631269 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.9492187500000001, "number": 761, "precision": 0.9406451612903226, "recall": 0.9579500657030223 }, "eval_PER": { "f1": 0.96759941089838, "number": 679, "precision": 0.96759941089838, "recall": 0.96759941089838 }, "eval_TITRE": { "f1": 0.7160493827160495, "number": 41, "precision": 0.725, "recall": 0.7073170731707317 }, "eval_accuracy": 0.9716527461402177, "eval_f1": 0.9568118628359593, "eval_loss": 0.09932182729244232, "eval_precision": 0.9523985239852398, "eval_recall": 0.9612662942271881, "eval_runtime": 2.1374, "eval_samples_per_second": 316.273, "eval_steps_per_second": 20.118, "step": 600 }, { "epoch": 1.84, "eval_ACT": { "f1": 0.9541984732824428, "number": 519, "precision": 0.945179584120983, "recall": 0.9633911368015414 }, "eval_CARDINAL": { "f1": 0.9852507374631269, "number": 678, "precision": 0.9852507374631269, "recall": 0.9852507374631269 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.9510124101894187, "number": 761, "precision": 0.9454545454545454, "recall": 0.9566360052562418 }, "eval_PER": { "f1": 0.9771891096394407, "number": 679, "precision": 0.9764705882352941, "recall": 0.9779086892488954 }, "eval_TITRE": { "f1": 0.7848101265822786, "number": 41, "precision": 0.8157894736842105, "recall": 0.7560975609756098 }, "eval_accuracy": 0.9779802581624905, "eval_f1": 0.9631970260223048, "eval_loss": 0.08475597947835922, "eval_precision": 0.9614100185528757, "eval_recall": 0.9649906890130354, "eval_runtime": 2.0431, "eval_samples_per_second": 330.877, "eval_steps_per_second": 21.047, "step": 700 }, { "epoch": 2.1, "eval_ACT": { "f1": 0.9468690702087287, "number": 519, "precision": 0.9327102803738317, "recall": 0.9614643545279383 }, "eval_CARDINAL": { "f1": 0.9852507374631269, "number": 678, "precision": 0.9852507374631269, "recall": 0.9852507374631269 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.9432485322896281, "number": 761, "precision": 0.9365284974093264, "recall": 0.9500657030223391 }, "eval_PER": { "f1": 0.9705882352941176, "number": 679, "precision": 0.9691629955947136, "recall": 0.9720176730486009 }, "eval_TITRE": { "f1": 0.7594936708860759, "number": 41, "precision": 0.7894736842105263, "recall": 0.7317073170731707 }, "eval_accuracy": 0.9746899519109087, "eval_f1": 0.9575060308034886, "eval_loss": 0.08957625180482864, "eval_precision": 0.9541420118343196, "eval_recall": 0.9608938547486033, "eval_runtime": 2.0502, "eval_samples_per_second": 329.727, "eval_steps_per_second": 20.974, "step": 800 }, { "epoch": 2.36, "eval_ACT": { "f1": 0.9570200573065903, "number": 519, "precision": 0.9488636363636364, "recall": 0.9653179190751445 }, "eval_CARDINAL": { "f1": 0.9866666666666667, "number": 678, "precision": 0.9910714285714286, "recall": 0.9823008849557522 }, "eval_FT": { "f1": 0.22222222222222224, "number": 7, "precision": 0.5, "recall": 0.14285714285714285 }, "eval_LOC": { "f1": 0.9542483660130721, "number": 761, "precision": 0.9492847854356307, "recall": 0.9592641261498029 }, "eval_PER": { "f1": 0.9779086892488954, "number": 679, "precision": 0.9779086892488954, "recall": 0.9779086892488954 }, "eval_TITRE": { "f1": 0.7179487179487181, "number": 41, "precision": 0.7567567567567568, "recall": 0.6829268292682927 }, "eval_accuracy": 0.9743103011895723, "eval_f1": 0.9642591213700671, "eval_loss": 0.08395500481128693, "eval_precision": 0.9639002605135839, "eval_recall": 0.9646182495344506, "eval_runtime": 2.07, "eval_samples_per_second": 326.576, "eval_steps_per_second": 20.773, "step": 900 } ], "max_steps": 5000, "num_train_epochs": 14, "total_flos": 365778917703408.0, "trial_name": null, "trial_params": null }