{ "best_metric": 0.08214916288852692, "best_model_checkpoint": "/home/jcanete/ft-data/all_results/ner/roberta_base_bne/epochs_4_bs_32_lr_3e-5/checkpoint-500", "epoch": 4.0, "global_step": 1044, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.38, "eval_accuracy": 0.9629454334483496, "eval_f1": 0.7416711342574863, "eval_loss": 0.1347309798002243, "eval_precision": 0.7229023589131084, "eval_recall": 0.7614404780625884, "eval_runtime": 2.0941, "eval_samples_per_second": 914.935, "eval_steps_per_second": 28.651, "step": 100 }, { "epoch": 0.77, "eval_accuracy": 0.9751748144981526, "eval_f1": 0.846393519239757, "eval_loss": 0.09219810366630554, "eval_precision": 0.8385553326130576, "eval_recall": 0.8543796194370183, "eval_runtime": 2.0125, "eval_samples_per_second": 952.045, "eval_steps_per_second": 29.814, "step": 200 }, { "epoch": 1.15, "eval_accuracy": 0.9743656294848698, "eval_f1": 0.8412611054328171, "eval_loss": 0.09414725750684738, "eval_precision": 0.8411949685534591, "eval_recall": 0.8413272527126907, "eval_runtime": 2.0091, "eval_samples_per_second": 953.677, "eval_steps_per_second": 29.865, "step": 300 }, { "epoch": 1.53, "eval_accuracy": 0.9758313230938349, "eval_f1": 0.854766575127501, "eval_loss": 0.08752118051052094, "eval_precision": 0.8529595991230817, "eval_recall": 0.8565812234628086, "eval_runtime": 2.0067, "eval_samples_per_second": 954.82, "eval_steps_per_second": 29.9, "step": 400 }, { "epoch": 1.92, "learning_rate": 1.5689655172413794e-05, "loss": 0.1335, "step": 500 }, { "epoch": 1.92, "eval_accuracy": 0.9778161165226419, "eval_f1": 0.8677048922447697, "eval_loss": 0.08214916288852692, "eval_precision": 0.8679779701022816, "eval_recall": 0.8674319861613461, "eval_runtime": 2.0137, "eval_samples_per_second": 951.47, "eval_steps_per_second": 29.796, "step": 500 }, { "epoch": 2.3, "eval_accuracy": 0.9771443402851996, "eval_f1": 0.859778020947319, "eval_loss": 0.0927521213889122, "eval_precision": 0.8547008547008547, "eval_recall": 0.8649158672747287, "eval_runtime": 2.07, "eval_samples_per_second": 925.61, "eval_steps_per_second": 28.986, "step": 600 }, { "epoch": 2.68, "eval_accuracy": 0.9763504229136768, "eval_f1": 0.8577878103837472, "eval_loss": 0.092233806848526, "eval_precision": 0.8492601726263872, "eval_recall": 0.8664884415788646, "eval_runtime": 2.0104, "eval_samples_per_second": 953.047, "eval_steps_per_second": 29.845, "step": 700 }, { "epoch": 3.07, "eval_accuracy": 0.9773428196280802, "eval_f1": 0.8647045046451715, "eval_loss": 0.09490890055894852, "eval_precision": 0.8586046511627907, "eval_recall": 0.8708916496304451, "eval_runtime": 1.9928, "eval_samples_per_second": 961.47, "eval_steps_per_second": 30.109, "step": 800 }, { "epoch": 3.45, "eval_accuracy": 0.9767321139576781, "eval_f1": 0.859104384459354, "eval_loss": 0.09667886048555374, "eval_precision": 0.852453940238427, "eval_recall": 0.8658594118572103, "eval_runtime": 2.002, "eval_samples_per_second": 957.043, "eval_steps_per_second": 29.97, "step": 900 }, { "epoch": 3.83, "learning_rate": 1.32183908045977e-06, "loss": 0.0189, "step": 1000 }, { "epoch": 3.83, "eval_accuracy": 0.977556566612721, "eval_f1": 0.8655850772004076, "eval_loss": 0.09368374198675156, "eval_precision": 0.8628125, "eval_recall": 0.8683755307438277, "eval_runtime": 2.004, "eval_samples_per_second": 956.073, "eval_steps_per_second": 29.94, "step": 1000 }, { "epoch": 4.0, "step": 1044, "total_flos": 1723769471413440.0, "train_loss": 0.07351639238810631, "train_runtime": 113.4173, "train_samples_per_second": 293.571, "train_steps_per_second": 9.205 } ], "max_steps": 1044, "num_train_epochs": 4, "total_flos": 1723769471413440.0, "trial_name": null, "trial_params": null }