josecannete's picture
adding model finetuned on sqac
39afa5e
{
"best_metric": 80.94744810096695,
"best_model_checkpoint": "/home/jcanete/ft-data/all_results/sqac/roberta_base_bne/epochs_3_bs_16_lr_3e-5/checkpoint-2000",
"epoch": 3.0,
"global_step": 3105,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.19,
"eval_exact_match": 47.532188841201716,
"eval_f1": 69.33897723912453,
"step": 200
},
{
"epoch": 0.39,
"eval_exact_match": 53.862660944206006,
"eval_f1": 73.09612890375904,
"step": 400
},
{
"epoch": 0.48,
"learning_rate": 2.518840579710145e-05,
"loss": 1.7311,
"step": 500
},
{
"epoch": 0.58,
"eval_exact_match": 56.33047210300429,
"eval_f1": 76.36054486750021,
"step": 600
},
{
"epoch": 0.77,
"eval_exact_match": 59.17381974248927,
"eval_f1": 78.2471790298137,
"step": 800
},
{
"epoch": 0.97,
"learning_rate": 2.0357487922705316e-05,
"loss": 1.0008,
"step": 1000
},
{
"epoch": 0.97,
"eval_exact_match": 62.82188841201717,
"eval_f1": 79.9716859895811,
"step": 1000
},
{
"epoch": 1.16,
"eval_exact_match": 62.1244635193133,
"eval_f1": 79.20024477578876,
"step": 1200
},
{
"epoch": 1.35,
"eval_exact_match": 63.09012875536481,
"eval_f1": 80.33927406223063,
"step": 1400
},
{
"epoch": 1.45,
"learning_rate": 1.552657004830918e-05,
"loss": 0.5026,
"step": 1500
},
{
"epoch": 1.55,
"eval_exact_match": 62.28540772532189,
"eval_f1": 79.52570777544153,
"step": 1600
},
{
"epoch": 1.74,
"eval_exact_match": 62.607296137339056,
"eval_f1": 80.02469983579446,
"step": 1800
},
{
"epoch": 1.93,
"learning_rate": 1.0695652173913044e-05,
"loss": 0.4535,
"step": 2000
},
{
"epoch": 1.93,
"eval_exact_match": 63.62660944206009,
"eval_f1": 80.94744810096695,
"step": 2000
},
{
"epoch": 2.13,
"eval_exact_match": 63.09012875536481,
"eval_f1": 80.42628565826091,
"step": 2200
},
{
"epoch": 2.32,
"eval_exact_match": 63.358369098712444,
"eval_f1": 80.76418115011096,
"step": 2400
},
{
"epoch": 2.42,
"learning_rate": 5.864734299516909e-06,
"loss": 0.1763,
"step": 2500
},
{
"epoch": 2.51,
"eval_exact_match": 62.92918454935622,
"eval_f1": 80.63880344911603,
"step": 2600
},
{
"epoch": 2.71,
"eval_exact_match": 62.98283261802575,
"eval_f1": 80.47469561336324,
"step": 2800
},
{
"epoch": 2.9,
"learning_rate": 1.033816425120773e-06,
"loss": 0.1245,
"step": 3000
},
{
"epoch": 2.9,
"eval_exact_match": 64.05579399141631,
"eval_f1": 80.84469008915202,
"step": 3000
},
{
"epoch": 3.0,
"step": 3105,
"total_flos": 1.2663698322068352e+16,
"train_loss": 0.6470010164663219,
"train_runtime": 876.8981,
"train_samples_per_second": 56.613,
"train_steps_per_second": 3.541
}
],
"max_steps": 3105,
"num_train_epochs": 3,
"total_flos": 1.2663698322068352e+16,
"trial_name": null,
"trial_params": null
}