Ubuntu
updated model
1fd6c85
{
"best_metric": 0.7736625514403291,
"best_model_checkpoint": "OS_OUT/harish/PT-UP-xlmR-FalseFalse-0_0_BEST/FalseFalse-0/2/checkpoint-40",
"epoch": 8.0,
"global_step": 40,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_accuracy": 0.6300366520881653,
"eval_f1": 0.597609561752988,
"eval_loss": 0.6447749137878418,
"eval_runtime": 0.7675,
"eval_samples_per_second": 355.702,
"eval_steps_per_second": 45.603,
"step": 5
},
{
"epoch": 2.0,
"eval_accuracy": 0.6813187003135681,
"eval_f1": 0.6200873362445415,
"eval_loss": 0.5641180872917175,
"eval_runtime": 0.7675,
"eval_samples_per_second": 355.721,
"eval_steps_per_second": 45.605,
"step": 10
},
{
"epoch": 3.0,
"eval_accuracy": 0.7289377450942993,
"eval_f1": 0.6372549019607843,
"eval_loss": 0.5698391795158386,
"eval_runtime": 0.7673,
"eval_samples_per_second": 355.789,
"eval_steps_per_second": 45.614,
"step": 15
},
{
"epoch": 4.0,
"eval_accuracy": 0.7289377450942993,
"eval_f1": 0.7153846153846154,
"eval_loss": 0.5229743719100952,
"eval_runtime": 0.7688,
"eval_samples_per_second": 355.082,
"eval_steps_per_second": 45.523,
"step": 20
},
{
"epoch": 5.0,
"eval_accuracy": 0.7582417726516724,
"eval_f1": 0.7421875,
"eval_loss": 0.5236229300498962,
"eval_runtime": 0.7675,
"eval_samples_per_second": 355.716,
"eval_steps_per_second": 45.605,
"step": 25
},
{
"epoch": 6.0,
"eval_accuracy": 0.7655677795410156,
"eval_f1": 0.719298245614035,
"eval_loss": 0.5164700150489807,
"eval_runtime": 0.7779,
"eval_samples_per_second": 350.939,
"eval_steps_per_second": 44.992,
"step": 30
},
{
"epoch": 7.0,
"eval_accuracy": 0.791208803653717,
"eval_f1": 0.7673469387755103,
"eval_loss": 0.5138589143753052,
"eval_runtime": 0.7778,
"eval_samples_per_second": 350.983,
"eval_steps_per_second": 44.998,
"step": 35
},
{
"epoch": 8.0,
"eval_accuracy": 0.7985348105430603,
"eval_f1": 0.7736625514403291,
"eval_loss": 0.5282412767410278,
"eval_runtime": 0.7588,
"eval_samples_per_second": 359.786,
"eval_steps_per_second": 46.126,
"step": 40
}
],
"max_steps": 45,
"num_train_epochs": 9,
"total_flos": 82090649272320.0,
"trial_name": null,
"trial_params": null
}