Harish Tayyar Madabushi
added model
50d1635
{
"best_metric": 0.7565779291131405,
"best_model_checkpoint": "output-no-git/EN-OUTPUT/distilbert-base-cased/FalseTrue-0/2/checkpoint-520",
"epoch": 5.0,
"global_step": 520,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_accuracy": 0.7446351647377014,
"eval_f1": 0.7378445712448767,
"eval_f1_binary": 0.7800369685767097,
"eval_f1_weighted": 0.7470798170127886,
"eval_loss": 0.7295559048652649,
"eval_runtime": 0.9453,
"eval_samples_per_second": 492.97,
"eval_steps_per_second": 62.415,
"step": 104
},
{
"epoch": 2.0,
"eval_accuracy": 0.7424892783164978,
"eval_f1": 0.7401728463897408,
"eval_f1_binary": 0.7647058823529411,
"eval_f1_weighted": 0.7455427383816858,
"eval_loss": 0.9534124732017517,
"eval_runtime": 0.7364,
"eval_samples_per_second": 632.823,
"eval_steps_per_second": 80.121,
"step": 208
},
{
"epoch": 3.0,
"eval_accuracy": 0.7618025541305542,
"eval_f1": 0.7543816329922364,
"eval_f1_binary": 0.7970749542961609,
"eval_f1_weighted": 0.7637265230630523,
"eval_loss": 1.0867007970809937,
"eval_runtime": 0.736,
"eval_samples_per_second": 633.169,
"eval_steps_per_second": 80.165,
"step": 312
},
{
"epoch": 4.0,
"eval_accuracy": 0.7532188892364502,
"eval_f1": 0.7470105321795617,
"eval_f1_binary": 0.7866419294990724,
"eval_f1_weighted": 0.7556852157130167,
"eval_loss": 1.2413438558578491,
"eval_runtime": 0.7367,
"eval_samples_per_second": 632.508,
"eval_steps_per_second": 80.082,
"step": 416
},
{
"epoch": 4.81,
"learning_rate": 9.316239316239318e-06,
"loss": 0.1347,
"step": 500
},
{
"epoch": 5.0,
"eval_accuracy": 0.7682403326034546,
"eval_f1": 0.7565779291131405,
"eval_f1_binary": 0.8098591549295775,
"eval_f1_weighted": 0.7682403433476395,
"eval_loss": 1.2424249649047852,
"eval_runtime": 0.7359,
"eval_samples_per_second": 633.202,
"eval_steps_per_second": 80.169,
"step": 520
}
],
"max_steps": 936,
"num_train_epochs": 9,
"total_flos": 550898794160640.0,
"trial_name": null,
"trial_params": null
}