josecannete's picture
adding model finetuned on sqac
ecb4914
{
"best_metric": 80.15398176853643,
"best_model_checkpoint": "/home/jcanete/ft-data/all_results/sqac/bertin_roberta_base/epochs_2_bs_16_lr_3e-5/checkpoint-2000",
"epoch": 2.0,
"global_step": 2070,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.19,
"eval_exact_match": 44.527896995708154,
"eval_f1": 65.6105308029204,
"step": 200
},
{
"epoch": 0.39,
"eval_exact_match": 53.487124463519315,
"eval_f1": 72.463429226185,
"step": 400
},
{
"epoch": 0.48,
"learning_rate": 2.279710144927536e-05,
"loss": 2.0283,
"step": 500
},
{
"epoch": 0.58,
"eval_exact_match": 55.472103004291846,
"eval_f1": 73.77270325735508,
"step": 600
},
{
"epoch": 0.77,
"eval_exact_match": 59.38841201716738,
"eval_f1": 76.95926171469165,
"step": 800
},
{
"epoch": 0.97,
"learning_rate": 1.555072463768116e-05,
"loss": 1.0347,
"step": 1000
},
{
"epoch": 0.97,
"eval_exact_match": 59.97854077253219,
"eval_f1": 78.2749680853618,
"step": 1000
},
{
"epoch": 1.16,
"eval_exact_match": 59.44206008583691,
"eval_f1": 78.2209721909282,
"step": 1200
},
{
"epoch": 1.35,
"eval_exact_match": 61.48068669527897,
"eval_f1": 78.9917873380796,
"step": 1400
},
{
"epoch": 1.45,
"learning_rate": 8.304347826086955e-06,
"loss": 0.4519,
"step": 1500
},
{
"epoch": 1.55,
"eval_exact_match": 60.997854077253216,
"eval_f1": 79.01542543724356,
"step": 1600
},
{
"epoch": 1.74,
"eval_exact_match": 62.17811158798283,
"eval_f1": 79.82176827691146,
"step": 1800
},
{
"epoch": 1.93,
"learning_rate": 1.0579710144927535e-06,
"loss": 0.3936,
"step": 2000
},
{
"epoch": 1.93,
"eval_exact_match": 62.5,
"eval_f1": 80.15398176853643,
"step": 2000
},
{
"epoch": 2.0,
"step": 2070,
"total_flos": 8445258157133184.0,
"train_loss": 0.9571071643184349,
"train_runtime": 543.2284,
"train_samples_per_second": 60.925,
"train_steps_per_second": 3.811
}
],
"max_steps": 2070,
"num_train_epochs": 2,
"total_flos": 8445258157133184.0,
"trial_name": null,
"trial_params": null
}