{ "best_metric": 0.12875927984714508, "best_model_checkpoint": "/home/jcanete/ft-data/all_results/ner/albeto_base_10/epochs_4_bs_32_lr_5e-5/checkpoint-700", "epoch": 4.0, "global_step": 1044, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.38, "eval_accuracy": 0.9292493244579186, "eval_f1": 0.6192774836499534, "eval_loss": 0.2619832754135132, "eval_precision": 0.6041318547774571, "eval_recall": 0.6352020444018528, "eval_runtime": 1.8554, "eval_samples_per_second": 1032.641, "eval_steps_per_second": 32.337, "step": 100 }, { "epoch": 0.77, "eval_accuracy": 0.9522177552230936, "eval_f1": 0.7341891045710708, "eval_loss": 0.1654893010854721, "eval_precision": 0.7198772064466615, "eval_recall": 0.7490816163552149, "eval_runtime": 1.7972, "eval_samples_per_second": 1066.105, "eval_steps_per_second": 33.385, "step": 200 }, { "epoch": 1.15, "eval_accuracy": 0.9579516245963224, "eval_f1": 0.7919559492458702, "eval_loss": 0.149013951420784, "eval_precision": 0.7913875598086124, "eval_recall": 0.7925251557259224, "eval_runtime": 1.8699, "eval_samples_per_second": 1024.659, "eval_steps_per_second": 32.087, "step": 300 }, { "epoch": 1.53, "eval_accuracy": 0.9607032228300271, "eval_f1": 0.7946535126103907, "eval_loss": 0.13737879693508148, "eval_precision": 0.7916930881420419, "eval_recall": 0.7976361603577703, "eval_runtime": 1.8043, "eval_samples_per_second": 1061.881, "eval_steps_per_second": 33.253, "step": 400 }, { "epoch": 1.92, "learning_rate": 2.6149425287356323e-05, "loss": 0.2123, "step": 500 }, { "epoch": 1.92, "eval_accuracy": 0.9636525406972912, "eval_f1": 0.8209348781462246, "eval_loss": 0.12951940298080444, "eval_precision": 0.8213943076431084, "eval_recall": 0.8204759623063408, "eval_runtime": 1.7875, "eval_samples_per_second": 1071.873, "eval_steps_per_second": 33.566, "step": 500 }, { "epoch": 2.3, "eval_accuracy": 0.9627463257101431, "eval_f1": 0.8149384187524832, "eval_loss": 0.13606947660446167, "eval_precision": 0.8108791903858318, "eval_recall": 0.8190384922536336, "eval_runtime": 1.798, "eval_samples_per_second": 1065.622, "eval_steps_per_second": 33.37, "step": 600 }, { "epoch": 2.68, "eval_accuracy": 0.962762802346273, "eval_f1": 0.8076046822216985, "eval_loss": 0.12875927984714508, "eval_precision": 0.7946815089672232, "eval_recall": 0.8209551189905766, "eval_runtime": 1.8023, "eval_samples_per_second": 1063.059, "eval_steps_per_second": 33.29, "step": 700 }, { "epoch": 3.07, "eval_accuracy": 0.9635866341527713, "eval_f1": 0.8158271094867312, "eval_loss": 0.1313953548669815, "eval_precision": 0.811699604743083, "eval_recall": 0.8199968056221051, "eval_runtime": 1.7921, "eval_samples_per_second": 1069.118, "eval_steps_per_second": 33.48, "step": 800 }, { "epoch": 3.45, "eval_accuracy": 0.9627957556185329, "eval_f1": 0.8106307021023402, "eval_loss": 0.13798536360263824, "eval_precision": 0.805327868852459, "eval_recall": 0.8160038332534739, "eval_runtime": 1.8024, "eval_samples_per_second": 1063.055, "eval_steps_per_second": 33.29, "step": 900 }, { "epoch": 3.83, "learning_rate": 2.2030651340996167e-06, "loss": 0.0591, "step": 1000 }, { "epoch": 3.83, "eval_accuracy": 0.9642292229618401, "eval_f1": 0.818637194879542, "eval_loss": 0.13375717401504517, "eval_precision": 0.8150728309056364, "eval_recall": 0.8222328701485385, "eval_runtime": 1.8609, "eval_samples_per_second": 1029.628, "eval_steps_per_second": 32.243, "step": 1000 }, { "epoch": 4.0, "step": 1044, "total_flos": 139056718739136.0, "train_loss": 0.13201307291272044, "train_runtime": 54.4964, "train_samples_per_second": 610.976, "train_steps_per_second": 19.157 } ], "max_steps": 1044, "num_train_epochs": 4, "total_flos": 139056718739136.0, "trial_name": null, "trial_params": null }