File size: 2,655 Bytes
e30176f 1fd6c85 b7433e3 e30176f 1fd6c85 e30176f 1fd6c85 e30176f 1fd6c85 e30176f 1fd6c85 e30176f 1fd6c85 e30176f 1fd6c85 e30176f 1fd6c85 e30176f 1fd6c85 e30176f 1fd6c85 e30176f 1fd6c85 e30176f 1fd6c85 e30176f 1fd6c85 e30176f 1fd6c85 e30176f 1fd6c85 e30176f 1fd6c85 e30176f 1fd6c85 e30176f |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 |
{
"best_metric": 0.7736625514403291,
"best_model_checkpoint": "OS_OUT/harish/PT-UP-xlmR-FalseFalse-0_0_BEST/FalseFalse-0/2/checkpoint-40",
"epoch": 8.0,
"global_step": 40,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_accuracy": 0.6300366520881653,
"eval_f1": 0.597609561752988,
"eval_loss": 0.6447749137878418,
"eval_runtime": 0.7675,
"eval_samples_per_second": 355.702,
"eval_steps_per_second": 45.603,
"step": 5
},
{
"epoch": 2.0,
"eval_accuracy": 0.6813187003135681,
"eval_f1": 0.6200873362445415,
"eval_loss": 0.5641180872917175,
"eval_runtime": 0.7675,
"eval_samples_per_second": 355.721,
"eval_steps_per_second": 45.605,
"step": 10
},
{
"epoch": 3.0,
"eval_accuracy": 0.7289377450942993,
"eval_f1": 0.6372549019607843,
"eval_loss": 0.5698391795158386,
"eval_runtime": 0.7673,
"eval_samples_per_second": 355.789,
"eval_steps_per_second": 45.614,
"step": 15
},
{
"epoch": 4.0,
"eval_accuracy": 0.7289377450942993,
"eval_f1": 0.7153846153846154,
"eval_loss": 0.5229743719100952,
"eval_runtime": 0.7688,
"eval_samples_per_second": 355.082,
"eval_steps_per_second": 45.523,
"step": 20
},
{
"epoch": 5.0,
"eval_accuracy": 0.7582417726516724,
"eval_f1": 0.7421875,
"eval_loss": 0.5236229300498962,
"eval_runtime": 0.7675,
"eval_samples_per_second": 355.716,
"eval_steps_per_second": 45.605,
"step": 25
},
{
"epoch": 6.0,
"eval_accuracy": 0.7655677795410156,
"eval_f1": 0.719298245614035,
"eval_loss": 0.5164700150489807,
"eval_runtime": 0.7779,
"eval_samples_per_second": 350.939,
"eval_steps_per_second": 44.992,
"step": 30
},
{
"epoch": 7.0,
"eval_accuracy": 0.791208803653717,
"eval_f1": 0.7673469387755103,
"eval_loss": 0.5138589143753052,
"eval_runtime": 0.7778,
"eval_samples_per_second": 350.983,
"eval_steps_per_second": 44.998,
"step": 35
},
{
"epoch": 8.0,
"eval_accuracy": 0.7985348105430603,
"eval_f1": 0.7736625514403291,
"eval_loss": 0.5282412767410278,
"eval_runtime": 0.7588,
"eval_samples_per_second": 359.786,
"eval_steps_per_second": 46.126,
"step": 40
}
],
"max_steps": 45,
"num_train_epochs": 9,
"total_flos": 82090649272320.0,
"trial_name": null,
"trial_params": null
}
|