|
{ |
|
"best_metric": 0.7736625514403291, |
|
"best_model_checkpoint": "OS_OUT/harish/PT-UP-xlmR-FalseFalse-0_0_BEST/FalseFalse-0/2/checkpoint-40", |
|
"epoch": 8.0, |
|
"global_step": 40, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.6300366520881653, |
|
"eval_f1": 0.597609561752988, |
|
"eval_loss": 0.6447749137878418, |
|
"eval_runtime": 0.7675, |
|
"eval_samples_per_second": 355.702, |
|
"eval_steps_per_second": 45.603, |
|
"step": 5 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.6813187003135681, |
|
"eval_f1": 0.6200873362445415, |
|
"eval_loss": 0.5641180872917175, |
|
"eval_runtime": 0.7675, |
|
"eval_samples_per_second": 355.721, |
|
"eval_steps_per_second": 45.605, |
|
"step": 10 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.7289377450942993, |
|
"eval_f1": 0.6372549019607843, |
|
"eval_loss": 0.5698391795158386, |
|
"eval_runtime": 0.7673, |
|
"eval_samples_per_second": 355.789, |
|
"eval_steps_per_second": 45.614, |
|
"step": 15 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.7289377450942993, |
|
"eval_f1": 0.7153846153846154, |
|
"eval_loss": 0.5229743719100952, |
|
"eval_runtime": 0.7688, |
|
"eval_samples_per_second": 355.082, |
|
"eval_steps_per_second": 45.523, |
|
"step": 20 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.7582417726516724, |
|
"eval_f1": 0.7421875, |
|
"eval_loss": 0.5236229300498962, |
|
"eval_runtime": 0.7675, |
|
"eval_samples_per_second": 355.716, |
|
"eval_steps_per_second": 45.605, |
|
"step": 25 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.7655677795410156, |
|
"eval_f1": 0.719298245614035, |
|
"eval_loss": 0.5164700150489807, |
|
"eval_runtime": 0.7779, |
|
"eval_samples_per_second": 350.939, |
|
"eval_steps_per_second": 44.992, |
|
"step": 30 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_accuracy": 0.791208803653717, |
|
"eval_f1": 0.7673469387755103, |
|
"eval_loss": 0.5138589143753052, |
|
"eval_runtime": 0.7778, |
|
"eval_samples_per_second": 350.983, |
|
"eval_steps_per_second": 44.998, |
|
"step": 35 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.7985348105430603, |
|
"eval_f1": 0.7736625514403291, |
|
"eval_loss": 0.5282412767410278, |
|
"eval_runtime": 0.7588, |
|
"eval_samples_per_second": 359.786, |
|
"eval_steps_per_second": 46.126, |
|
"step": 40 |
|
} |
|
], |
|
"max_steps": 45, |
|
"num_train_epochs": 9, |
|
"total_flos": 82090649272320.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|