|
{ |
|
"best_metric": 0.07052170485258102, |
|
"best_model_checkpoint": "token_level_model/best_model/checkpoint-948", |
|
"epoch": 12.0, |
|
"global_step": 3792, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"eval_balanced accuracy": 0.5633085631676005, |
|
"eval_f1": 0.5303163390780957, |
|
"eval_loss": 0.09163307398557663, |
|
"eval_precision": 0.6548165588282941, |
|
"eval_recall": 0.5633085631676005, |
|
"eval_runtime": 5.3367, |
|
"eval_samples_per_second": 236.852, |
|
"eval_steps_per_second": 14.803, |
|
"step": 316 |
|
}, |
|
{ |
|
"epoch": 1.58, |
|
"learning_rate": 1.7362869198312237e-05, |
|
"loss": 0.1839, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_balanced accuracy": 0.7195902052549533, |
|
"eval_f1": 0.7255288809894066, |
|
"eval_loss": 0.0722324550151825, |
|
"eval_precision": 0.7454575741625619, |
|
"eval_recall": 0.7195902052549533, |
|
"eval_runtime": 5.3534, |
|
"eval_samples_per_second": 236.111, |
|
"eval_steps_per_second": 14.757, |
|
"step": 632 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_balanced accuracy": 0.7147400555506803, |
|
"eval_f1": 0.7192305114894215, |
|
"eval_loss": 0.07052170485258102, |
|
"eval_precision": 0.7756273409712318, |
|
"eval_recall": 0.7147400555506803, |
|
"eval_runtime": 5.4755, |
|
"eval_samples_per_second": 230.847, |
|
"eval_steps_per_second": 14.428, |
|
"step": 948 |
|
}, |
|
{ |
|
"epoch": 3.16, |
|
"learning_rate": 1.4725738396624474e-05, |
|
"loss": 0.0587, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_balanced accuracy": 0.7295185936273012, |
|
"eval_f1": 0.7296703416168215, |
|
"eval_loss": 0.07182055711746216, |
|
"eval_precision": 0.7401045017667032, |
|
"eval_recall": 0.7295185936273012, |
|
"eval_runtime": 5.3937, |
|
"eval_samples_per_second": 234.345, |
|
"eval_steps_per_second": 14.647, |
|
"step": 1264 |
|
}, |
|
{ |
|
"epoch": 4.75, |
|
"learning_rate": 1.208860759493671e-05, |
|
"loss": 0.0376, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_balanced accuracy": 0.735330002568732, |
|
"eval_f1": 0.743746101471838, |
|
"eval_loss": 0.07561135292053223, |
|
"eval_precision": 0.758929084908083, |
|
"eval_recall": 0.735330002568732, |
|
"eval_runtime": 5.5304, |
|
"eval_samples_per_second": 228.555, |
|
"eval_steps_per_second": 14.285, |
|
"step": 1580 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_balanced accuracy": 0.7487913019838482, |
|
"eval_f1": 0.7539294881409199, |
|
"eval_loss": 0.08333344757556915, |
|
"eval_precision": 0.7640729935139194, |
|
"eval_recall": 0.7487913019838482, |
|
"eval_runtime": 5.304, |
|
"eval_samples_per_second": 238.312, |
|
"eval_steps_per_second": 14.894, |
|
"step": 1896 |
|
}, |
|
{ |
|
"epoch": 6.33, |
|
"learning_rate": 9.451476793248946e-06, |
|
"loss": 0.0239, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_balanced accuracy": 0.7495077050154062, |
|
"eval_f1": 0.7547220689413356, |
|
"eval_loss": 0.09176070988178253, |
|
"eval_precision": 0.7680132999431392, |
|
"eval_recall": 0.7495077050154062, |
|
"eval_runtime": 5.4894, |
|
"eval_samples_per_second": 230.262, |
|
"eval_steps_per_second": 14.391, |
|
"step": 2212 |
|
}, |
|
{ |
|
"epoch": 7.91, |
|
"learning_rate": 6.814345991561182e-06, |
|
"loss": 0.0161, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_balanced accuracy": 0.7519480763726148, |
|
"eval_f1": 0.7441340002103095, |
|
"eval_loss": 0.10090441256761551, |
|
"eval_precision": 0.7421918161304624, |
|
"eval_recall": 0.7519480763726148, |
|
"eval_runtime": 5.4772, |
|
"eval_samples_per_second": 230.774, |
|
"eval_steps_per_second": 14.423, |
|
"step": 2528 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_balanced accuracy": 0.7372305744818235, |
|
"eval_f1": 0.7418663358868686, |
|
"eval_loss": 0.10627683997154236, |
|
"eval_precision": 0.747694948865169, |
|
"eval_recall": 0.7372305744818235, |
|
"eval_runtime": 5.673, |
|
"eval_samples_per_second": 222.809, |
|
"eval_steps_per_second": 13.926, |
|
"step": 2844 |
|
}, |
|
{ |
|
"epoch": 9.49, |
|
"learning_rate": 4.177215189873418e-06, |
|
"loss": 0.0107, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_balanced accuracy": 0.7454153105654866, |
|
"eval_f1": 0.7532278014935634, |
|
"eval_loss": 0.11291743814945221, |
|
"eval_precision": 0.7635910633921945, |
|
"eval_recall": 0.7454153105654866, |
|
"eval_runtime": 5.7497, |
|
"eval_samples_per_second": 219.839, |
|
"eval_steps_per_second": 13.74, |
|
"step": 3160 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_balanced accuracy": 0.7422514651185799, |
|
"eval_f1": 0.7462413455365297, |
|
"eval_loss": 0.11802595853805542, |
|
"eval_precision": 0.7518280300030182, |
|
"eval_recall": 0.7422514651185799, |
|
"eval_runtime": 5.6277, |
|
"eval_samples_per_second": 224.602, |
|
"eval_steps_per_second": 14.038, |
|
"step": 3476 |
|
}, |
|
{ |
|
"epoch": 11.08, |
|
"learning_rate": 1.5400843881856542e-06, |
|
"loss": 0.007, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_balanced accuracy": 0.7397630177088332, |
|
"eval_f1": 0.7454360643197575, |
|
"eval_loss": 0.11985792219638824, |
|
"eval_precision": 0.7526407260582226, |
|
"eval_recall": 0.7397630177088332, |
|
"eval_runtime": 5.7001, |
|
"eval_samples_per_second": 221.752, |
|
"eval_steps_per_second": 13.859, |
|
"step": 3792 |
|
} |
|
], |
|
"max_steps": 3792, |
|
"num_train_epochs": 12, |
|
"total_flos": 302819736843288.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|