|
{ |
|
"best_metric": 77.32269615784104, |
|
"best_model_checkpoint": "/home/jcanete/ft-data/all_results/tar/roberta_large_bne/epochs_2_bs_32_lr_2e-5/checkpoint-4500", |
|
"epoch": 2.0, |
|
"global_step": 5486, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.11, |
|
"eval_exact_match": 52.72469252601703, |
|
"eval_f1": 70.31979377504159, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 0.18, |
|
"learning_rate": 1.8177178271965002e-05, |
|
"loss": 2.0124, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 0.22, |
|
"eval_exact_match": 55.37369914853358, |
|
"eval_f1": 72.79425345069818, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 0.33, |
|
"eval_exact_match": 57.142857142857146, |
|
"eval_f1": 74.00444934296571, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 0.36, |
|
"learning_rate": 1.6354356543930007e-05, |
|
"loss": 1.6158, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 0.44, |
|
"eval_exact_match": 57.899716177861876, |
|
"eval_f1": 75.07716154126113, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 0.55, |
|
"learning_rate": 1.4531534815895008e-05, |
|
"loss": 1.5421, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 0.55, |
|
"eval_exact_match": 59.08230842005676, |
|
"eval_f1": 75.72655876274406, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 0.66, |
|
"eval_exact_match": 58.77010406811731, |
|
"eval_f1": 75.5986676698771, |
|
"step": 1800 |
|
}, |
|
{ |
|
"epoch": 0.73, |
|
"learning_rate": 1.2712358731316079e-05, |
|
"loss": 1.4971, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 0.77, |
|
"eval_exact_match": 59.40397350993378, |
|
"eval_f1": 76.56550651885689, |
|
"step": 2100 |
|
}, |
|
{ |
|
"epoch": 0.87, |
|
"eval_exact_match": 60.33112582781457, |
|
"eval_f1": 77.04475615318619, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 0.91, |
|
"learning_rate": 1.0889537003281081e-05, |
|
"loss": 1.4532, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 0.98, |
|
"eval_exact_match": 60.179754020813625, |
|
"eval_f1": 76.98820150102628, |
|
"step": 2700 |
|
}, |
|
{ |
|
"epoch": 1.09, |
|
"learning_rate": 9.066715275246082e-06, |
|
"loss": 1.1553, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 1.09, |
|
"eval_exact_match": 59.735099337748345, |
|
"eval_f1": 76.60782983695076, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 1.2, |
|
"eval_exact_match": 59.7918637653737, |
|
"eval_f1": 76.76732218063003, |
|
"step": 3300 |
|
}, |
|
{ |
|
"epoch": 1.28, |
|
"learning_rate": 7.243893547211084e-06, |
|
"loss": 0.9124, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 1.31, |
|
"eval_exact_match": 59.83916745506149, |
|
"eval_f1": 76.96753684496848, |
|
"step": 3600 |
|
}, |
|
{ |
|
"epoch": 1.42, |
|
"eval_exact_match": 59.99053926206244, |
|
"eval_f1": 76.84857447005851, |
|
"step": 3900 |
|
}, |
|
{ |
|
"epoch": 1.46, |
|
"learning_rate": 5.421071819176085e-06, |
|
"loss": 0.8835, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 1.53, |
|
"eval_exact_match": 59.422894985808895, |
|
"eval_f1": 76.94657837246879, |
|
"step": 4200 |
|
}, |
|
{ |
|
"epoch": 1.64, |
|
"learning_rate": 3.6018957345971567e-06, |
|
"loss": 0.8727, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 1.64, |
|
"eval_exact_match": 60.416272469252604, |
|
"eval_f1": 77.32269615784104, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 1.75, |
|
"eval_exact_match": 60.2081362346263, |
|
"eval_f1": 77.1919063305815, |
|
"step": 4800 |
|
}, |
|
{ |
|
"epoch": 1.82, |
|
"learning_rate": 1.7827196500182284e-06, |
|
"loss": 0.8503, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 1.86, |
|
"eval_exact_match": 60.06622516556291, |
|
"eval_f1": 77.17743863949298, |
|
"step": 5100 |
|
}, |
|
{ |
|
"epoch": 1.97, |
|
"eval_exact_match": 60.31220435193945, |
|
"eval_f1": 77.30000861688039, |
|
"step": 5400 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"step": 5486, |
|
"total_flos": 1.1863529489772403e+17, |
|
"train_loss": 1.2413271612987178, |
|
"train_runtime": 3098.796, |
|
"train_samples_per_second": 56.634, |
|
"train_steps_per_second": 1.77 |
|
} |
|
], |
|
"max_steps": 5486, |
|
"num_train_epochs": 2, |
|
"total_flos": 1.1863529489772403e+17, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|