{ "best_metric": 0.24886493384838104, "best_model_checkpoint": "address_detection_model/checkpoint-480", "epoch": 13.0, "global_step": 1248, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_accuracy": 0.90849413168888, "eval_f1": 0.59986366734833, "eval_loss": 0.4046468734741211, "eval_precision": 0.561941251596424, "eval_recall": 0.6432748538011696, "eval_runtime": 0.333, "eval_samples_per_second": 576.556, "eval_steps_per_second": 36.035, "step": 96 }, { "epoch": 2.0, "eval_accuracy": 0.9192361249254029, "eval_f1": 0.693135935397039, "eval_loss": 0.305729478597641, "eval_precision": 0.64214463840399, "eval_recall": 0.7529239766081871, "eval_runtime": 0.3645, "eval_samples_per_second": 526.796, "eval_steps_per_second": 32.925, "step": 192 }, { "epoch": 3.0, "eval_accuracy": 0.9305748955639547, "eval_f1": 0.7226428079834825, "eval_loss": 0.25665250420570374, "eval_precision": 0.682704811443433, "eval_recall": 0.7675438596491229, "eval_runtime": 0.3364, "eval_samples_per_second": 570.696, "eval_steps_per_second": 35.669, "step": 288 }, { "epoch": 4.0, "eval_accuracy": 0.9289834891585439, "eval_f1": 0.7248787248787248, "eval_loss": 0.2604641616344452, "eval_precision": 0.689064558629776, "eval_recall": 0.7646198830409356, "eval_runtime": 0.3089, "eval_samples_per_second": 621.464, "eval_steps_per_second": 38.842, "step": 384 }, { "epoch": 5.0, "eval_accuracy": 0.9327630793713945, "eval_f1": 0.7221067221067221, "eval_loss": 0.24886493384838104, "eval_precision": 0.686429512516469, "eval_recall": 0.7616959064327485, "eval_runtime": 0.3123, "eval_samples_per_second": 614.738, "eval_steps_per_second": 38.421, "step": 480 }, { "epoch": 5.21, "learning_rate": 1.9583333333333333e-05, "loss": 0.3477, "step": 500 }, { "epoch": 6.0, "eval_accuracy": 0.9341555599761289, "eval_f1": 0.7311679336558397, "eval_loss": 0.2547823190689087, "eval_precision": 0.6933158584534731, "eval_recall": 0.7733918128654971, "eval_runtime": 0.3117, "eval_samples_per_second": 615.908, "eval_steps_per_second": 38.494, "step": 576 }, { "epoch": 7.0, "eval_accuracy": 0.9307738213646309, "eval_f1": 0.7350069735006974, "eval_loss": 0.26613351702690125, "eval_precision": 0.7026666666666667, "eval_recall": 0.77046783625731, "eval_runtime": 0.3453, "eval_samples_per_second": 555.983, "eval_steps_per_second": 34.749, "step": 672 }, { "epoch": 8.0, "eval_accuracy": 0.9345534115774816, "eval_f1": 0.7416201117318436, "eval_loss": 0.25599348545074463, "eval_precision": 0.7098930481283422, "eval_recall": 0.7763157894736842, "eval_runtime": 0.313, "eval_samples_per_second": 613.472, "eval_steps_per_second": 38.342, "step": 768 }, { "epoch": 9.0, "eval_accuracy": 0.9321663019693655, "eval_f1": 0.7372764786795049, "eval_loss": 0.27552878856658936, "eval_precision": 0.6961038961038961, "eval_recall": 0.783625730994152, "eval_runtime": 0.3343, "eval_samples_per_second": 574.283, "eval_steps_per_second": 35.893, "step": 864 }, { "epoch": 10.0, "eval_accuracy": 0.9299781181619255, "eval_f1": 0.7323549965059398, "eval_loss": 0.2917962074279785, "eval_precision": 0.7014725568942436, "eval_recall": 0.7660818713450293, "eval_runtime": 0.329, "eval_samples_per_second": 583.528, "eval_steps_per_second": 36.47, "step": 960 }, { "epoch": 10.42, "learning_rate": 9.166666666666668e-06, "loss": 0.1205, "step": 1000 }, { "epoch": 11.0, "eval_accuracy": 0.9315695245673364, "eval_f1": 0.7329624478442281, "eval_loss": 0.28479865193367004, "eval_precision": 0.6989389920424404, "eval_recall": 0.77046783625731, "eval_runtime": 0.3325, "eval_samples_per_second": 577.484, "eval_steps_per_second": 36.093, "step": 1056 }, { "epoch": 12.0, "eval_accuracy": 0.9299781181619255, "eval_f1": 0.7342995169082126, "eval_loss": 0.3070613443851471, "eval_precision": 0.6954248366013072, "eval_recall": 0.7777777777777778, "eval_runtime": 0.3292, "eval_samples_per_second": 583.292, "eval_steps_per_second": 36.456, "step": 1152 }, { "epoch": 13.0, "eval_accuracy": 0.9333598567734235, "eval_f1": 0.745998608211552, "eval_loss": 0.2998543679714203, "eval_precision": 0.7118193891102258, "eval_recall": 0.783625730994152, "eval_runtime": 0.3372, "eval_samples_per_second": 569.432, "eval_steps_per_second": 35.589, "step": 1248 } ], "max_steps": 1440, "num_train_epochs": 15, "total_flos": 487199638963260.0, "trial_name": null, "trial_params": null }