{ "best_metric": 0.032893065363168716, "best_model_checkpoint": "/home/jcanete/ft-data/all_results/pos/roberta_base_bne/epochs_2_bs_16_lr_5e-5/checkpoint-1600", "epoch": 2.0, "global_step": 1790, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.22, "eval_accuracy": 0.984541433111356, "eval_f1": 0.9812364013813204, "eval_loss": 0.06434043496847153, "eval_precision": 0.9803362383582953, "eval_recall": 0.982138219016603, "eval_runtime": 2.9618, "eval_samples_per_second": 558.44, "eval_steps_per_second": 35.114, "step": 200 }, { "epoch": 0.45, "eval_accuracy": 0.9877832606716811, "eval_f1": 0.9851088887558137, "eval_loss": 0.04959944263100624, "eval_precision": 0.9842051732046347, "eval_recall": 0.9860142654492418, "eval_runtime": 2.9534, "eval_samples_per_second": 560.023, "eval_steps_per_second": 35.213, "step": 400 }, { "epoch": 0.56, "learning_rate": 3.603351955307263e-05, "loss": 0.1416, "step": 500 }, { "epoch": 0.67, "eval_accuracy": 0.9888212842747409, "eval_f1": 0.9869598210719706, "eval_loss": 0.0426110178232193, "eval_precision": 0.9864673359813178, "eval_recall": 0.9874527981458912, "eval_runtime": 2.954, "eval_samples_per_second": 559.912, "eval_steps_per_second": 35.206, "step": 600 }, { "epoch": 0.89, "eval_accuracy": 0.9898912470655872, "eval_f1": 0.9885165361878895, "eval_loss": 0.03891567513346672, "eval_precision": 0.9881021300381291, "eval_recall": 0.9889312900841142, "eval_runtime": 2.9458, "eval_samples_per_second": 561.485, "eval_steps_per_second": 35.305, "step": 800 }, { "epoch": 1.12, "learning_rate": 2.206703910614525e-05, "loss": 0.0348, "step": 1000 }, { "epoch": 1.12, "eval_accuracy": 0.9904182436640636, "eval_f1": 0.9885959656480927, "eval_loss": 0.03714817017316818, "eval_precision": 0.9882209666793108, "eval_recall": 0.9889712493256878, "eval_runtime": 2.9497, "eval_samples_per_second": 560.735, "eval_steps_per_second": 35.258, "step": 1000 }, { "epoch": 1.34, "eval_accuracy": 0.990514061227423, "eval_f1": 0.9887465425824039, "eval_loss": 0.03583846241235733, "eval_precision": 0.9883024592781858, "eval_recall": 0.9891910251543425, "eval_runtime": 2.9981, "eval_samples_per_second": 551.674, "eval_steps_per_second": 34.688, "step": 1200 }, { "epoch": 1.56, "eval_accuracy": 0.9909133010747536, "eval_f1": 0.9891582142001439, "eval_loss": 0.03380614146590233, "eval_precision": 0.9885068938683481, "eval_recall": 0.9898103933987333, "eval_runtime": 2.9525, "eval_samples_per_second": 560.202, "eval_steps_per_second": 35.224, "step": 1400 }, { "epoch": 1.68, "learning_rate": 8.100558659217877e-06, "loss": 0.0202, "step": 1500 }, { "epoch": 1.79, "eval_accuracy": 0.9914882064549099, "eval_f1": 0.9899645514004692, "eval_loss": 0.032893065363168716, "eval_precision": 0.9895396654289935, "eval_recall": 0.9903898024015504, "eval_runtime": 2.9564, "eval_samples_per_second": 559.471, "eval_steps_per_second": 35.178, "step": 1600 }, { "epoch": 2.0, "step": 1790, "total_flos": 1190583063933120.0, "train_loss": 0.05748698165296842, "train_runtime": 136.7323, "train_samples_per_second": 209.241, "train_steps_per_second": 13.091 } ], "max_steps": 1790, "num_train_epochs": 2, "total_flos": 1190583063933120.0, "trial_name": null, "trial_params": null }