|
{ |
|
"best_metric": 1.0, |
|
"best_model_checkpoint": "./saved-model-all-data/checkpoint-882", |
|
"epoch": 25.0, |
|
"global_step": 1575, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.8670662363608421, |
|
"eval_f1": 0.5017103762827823, |
|
"eval_loss": 0.42577993869781494, |
|
"eval_precision": 0.4592901878914405, |
|
"eval_recall": 0.5527638190954773, |
|
"eval_runtime": 0.6534, |
|
"eval_samples_per_second": 76.527, |
|
"eval_steps_per_second": 10.714, |
|
"step": 63 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.9293069002612571, |
|
"eval_f1": 0.7072289156626506, |
|
"eval_loss": 0.22081975638866425, |
|
"eval_precision": 0.6793981481481481, |
|
"eval_recall": 0.7374371859296482, |
|
"eval_runtime": 0.5804, |
|
"eval_samples_per_second": 86.142, |
|
"eval_steps_per_second": 12.06, |
|
"step": 126 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.9549715690794529, |
|
"eval_f1": 0.8209500609013398, |
|
"eval_loss": 0.13680364191532135, |
|
"eval_precision": 0.7966903073286052, |
|
"eval_recall": 0.8467336683417085, |
|
"eval_runtime": 0.5883, |
|
"eval_samples_per_second": 84.997, |
|
"eval_steps_per_second": 11.9, |
|
"step": 189 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.9778699861687413, |
|
"eval_f1": 0.8866995073891626, |
|
"eval_loss": 0.07373423129320145, |
|
"eval_precision": 0.8695652173913043, |
|
"eval_recall": 0.9045226130653267, |
|
"eval_runtime": 0.6005, |
|
"eval_samples_per_second": 83.259, |
|
"eval_steps_per_second": 11.656, |
|
"step": 252 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.9855540187490395, |
|
"eval_f1": 0.9316239316239316, |
|
"eval_loss": 0.04712964966893196, |
|
"eval_precision": 0.9061757719714965, |
|
"eval_recall": 0.9585427135678392, |
|
"eval_runtime": 0.6021, |
|
"eval_samples_per_second": 83.049, |
|
"eval_steps_per_second": 11.627, |
|
"step": 315 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.9929306900261257, |
|
"eval_f1": 0.9652605459057072, |
|
"eval_loss": 0.02583940699696541, |
|
"eval_precision": 0.9534313725490197, |
|
"eval_recall": 0.9773869346733668, |
|
"eval_runtime": 0.5826, |
|
"eval_samples_per_second": 85.82, |
|
"eval_steps_per_second": 12.015, |
|
"step": 378 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_accuracy": 0.9967727063162748, |
|
"eval_f1": 0.9849435382685068, |
|
"eval_loss": 0.015803957358002663, |
|
"eval_precision": 0.9837092731829574, |
|
"eval_recall": 0.9861809045226131, |
|
"eval_runtime": 0.5833, |
|
"eval_samples_per_second": 85.718, |
|
"eval_steps_per_second": 12.0, |
|
"step": 441 |
|
}, |
|
{ |
|
"epoch": 7.94, |
|
"learning_rate": 3.644067796610169e-05, |
|
"loss": 0.268, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.9972337482710927, |
|
"eval_f1": 0.9880578252671276, |
|
"eval_loss": 0.012770027853548527, |
|
"eval_precision": 0.9886792452830189, |
|
"eval_recall": 0.9874371859296482, |
|
"eval_runtime": 0.5723, |
|
"eval_samples_per_second": 87.36, |
|
"eval_steps_per_second": 12.23, |
|
"step": 504 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_accuracy": 0.9978484708775165, |
|
"eval_f1": 0.9861809045226131, |
|
"eval_loss": 0.008633743040263653, |
|
"eval_precision": 0.9861809045226131, |
|
"eval_recall": 0.9861809045226131, |
|
"eval_runtime": 0.5754, |
|
"eval_samples_per_second": 86.898, |
|
"eval_steps_per_second": 12.166, |
|
"step": 567 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_accuracy": 0.9983095128323344, |
|
"eval_f1": 0.9899497487437185, |
|
"eval_loss": 0.006678320933133364, |
|
"eval_precision": 0.9899497487437185, |
|
"eval_recall": 0.9899497487437185, |
|
"eval_runtime": 0.5717, |
|
"eval_samples_per_second": 87.461, |
|
"eval_steps_per_second": 12.245, |
|
"step": 630 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_accuracy": 0.9990779160903642, |
|
"eval_f1": 0.9962311557788944, |
|
"eval_loss": 0.004529367666691542, |
|
"eval_precision": 0.9962311557788944, |
|
"eval_recall": 0.9962311557788944, |
|
"eval_runtime": 0.5852, |
|
"eval_samples_per_second": 85.445, |
|
"eval_steps_per_second": 11.962, |
|
"step": 693 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_accuracy": 0.999692638696788, |
|
"eval_f1": 0.9987437185929648, |
|
"eval_loss": 0.0013231054181233048, |
|
"eval_precision": 0.9987437185929648, |
|
"eval_recall": 0.9987437185929648, |
|
"eval_runtime": 0.5808, |
|
"eval_samples_per_second": 86.093, |
|
"eval_steps_per_second": 12.053, |
|
"step": 756 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_accuracy": 0.9990779160903642, |
|
"eval_f1": 0.9956112852664577, |
|
"eval_loss": 0.0035528314765542746, |
|
"eval_precision": 0.9937421777221527, |
|
"eval_recall": 0.9974874371859297, |
|
"eval_runtime": 0.6108, |
|
"eval_samples_per_second": 81.86, |
|
"eval_steps_per_second": 11.46, |
|
"step": 819 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_accuracy": 1.0, |
|
"eval_f1": 1.0, |
|
"eval_loss": 0.00045324634993448853, |
|
"eval_precision": 1.0, |
|
"eval_recall": 1.0, |
|
"eval_runtime": 0.5759, |
|
"eval_samples_per_second": 86.817, |
|
"eval_steps_per_second": 12.154, |
|
"step": 882 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_accuracy": 1.0, |
|
"eval_f1": 1.0, |
|
"eval_loss": 0.00044708128552883863, |
|
"eval_precision": 1.0, |
|
"eval_recall": 1.0, |
|
"eval_runtime": 0.575, |
|
"eval_samples_per_second": 86.954, |
|
"eval_steps_per_second": 12.174, |
|
"step": 945 |
|
}, |
|
{ |
|
"epoch": 15.87, |
|
"learning_rate": 1.9491525423728814e-05, |
|
"loss": 0.0097, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_accuracy": 1.0, |
|
"eval_f1": 1.0, |
|
"eval_loss": 0.00018117745639756322, |
|
"eval_precision": 1.0, |
|
"eval_recall": 1.0, |
|
"eval_runtime": 0.5823, |
|
"eval_samples_per_second": 85.872, |
|
"eval_steps_per_second": 12.022, |
|
"step": 1008 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_accuracy": 1.0, |
|
"eval_f1": 1.0, |
|
"eval_loss": 0.00018171708506997675, |
|
"eval_precision": 1.0, |
|
"eval_recall": 1.0, |
|
"eval_runtime": 0.6909, |
|
"eval_samples_per_second": 72.373, |
|
"eval_steps_per_second": 10.132, |
|
"step": 1071 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_accuracy": 1.0, |
|
"eval_f1": 1.0, |
|
"eval_loss": 0.0002043112035607919, |
|
"eval_precision": 1.0, |
|
"eval_recall": 1.0, |
|
"eval_runtime": 0.6068, |
|
"eval_samples_per_second": 82.399, |
|
"eval_steps_per_second": 11.536, |
|
"step": 1134 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_accuracy": 1.0, |
|
"eval_f1": 1.0, |
|
"eval_loss": 0.00015518060536123812, |
|
"eval_precision": 1.0, |
|
"eval_recall": 1.0, |
|
"eval_runtime": 0.594, |
|
"eval_samples_per_second": 84.176, |
|
"eval_steps_per_second": 11.785, |
|
"step": 1197 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_accuracy": 1.0, |
|
"eval_f1": 1.0, |
|
"eval_loss": 0.00014525999722536653, |
|
"eval_precision": 1.0, |
|
"eval_recall": 1.0, |
|
"eval_runtime": 0.5981, |
|
"eval_samples_per_second": 83.6, |
|
"eval_steps_per_second": 11.704, |
|
"step": 1260 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"eval_accuracy": 1.0, |
|
"eval_f1": 1.0, |
|
"eval_loss": 0.00013857503654435277, |
|
"eval_precision": 1.0, |
|
"eval_recall": 1.0, |
|
"eval_runtime": 0.5825, |
|
"eval_samples_per_second": 85.832, |
|
"eval_steps_per_second": 12.017, |
|
"step": 1323 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"eval_accuracy": 1.0, |
|
"eval_f1": 1.0, |
|
"eval_loss": 0.00013503569061867893, |
|
"eval_precision": 1.0, |
|
"eval_recall": 1.0, |
|
"eval_runtime": 0.573, |
|
"eval_samples_per_second": 87.267, |
|
"eval_steps_per_second": 12.217, |
|
"step": 1386 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"eval_accuracy": 1.0, |
|
"eval_f1": 1.0, |
|
"eval_loss": 0.00012487478670664132, |
|
"eval_precision": 1.0, |
|
"eval_recall": 1.0, |
|
"eval_runtime": 0.5904, |
|
"eval_samples_per_second": 84.687, |
|
"eval_steps_per_second": 11.856, |
|
"step": 1449 |
|
}, |
|
{ |
|
"epoch": 23.81, |
|
"learning_rate": 2.5423728813559323e-06, |
|
"loss": 0.0019, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_accuracy": 1.0, |
|
"eval_f1": 1.0, |
|
"eval_loss": 0.00012091387179680169, |
|
"eval_precision": 1.0, |
|
"eval_recall": 1.0, |
|
"eval_runtime": 0.5792, |
|
"eval_samples_per_second": 86.322, |
|
"eval_steps_per_second": 12.085, |
|
"step": 1512 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_accuracy": 1.0, |
|
"eval_f1": 1.0, |
|
"eval_loss": 0.00011829046707134694, |
|
"eval_precision": 1.0, |
|
"eval_recall": 1.0, |
|
"eval_runtime": 0.6205, |
|
"eval_samples_per_second": 80.581, |
|
"eval_steps_per_second": 11.281, |
|
"step": 1575 |
|
} |
|
], |
|
"max_steps": 1575, |
|
"num_train_epochs": 25, |
|
"total_flos": 1550715696271320.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|