|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 10.0, |
|
"global_step": 2330, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.8702409035670884, |
|
"eval_f1": 0.2995999407319603, |
|
"eval_loss": 0.5389052033424377, |
|
"eval_precision": 0.33331959612610756, |
|
"eval_recall": 0.27207589060450094, |
|
"eval_runtime": 14.1196, |
|
"eval_samples_per_second": 1054.99, |
|
"eval_steps_per_second": 2.125, |
|
"step": 233 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.9681749946386446, |
|
"eval_f1": 0.8514915583419936, |
|
"eval_loss": 0.12146873772144318, |
|
"eval_precision": 0.8626164998274076, |
|
"eval_recall": 0.8406499142193965, |
|
"eval_runtime": 15.0925, |
|
"eval_samples_per_second": 986.983, |
|
"eval_steps_per_second": 1.988, |
|
"step": 466 |
|
}, |
|
{ |
|
"epoch": 2.15, |
|
"learning_rate": 6.25e-06, |
|
"loss": 1.2635, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.9790478232897276, |
|
"eval_f1": 0.9141998345125719, |
|
"eval_loss": 0.0771816298365593, |
|
"eval_precision": 0.9178421266784212, |
|
"eval_recall": 0.9105863356544556, |
|
"eval_runtime": 14.0091, |
|
"eval_samples_per_second": 1063.307, |
|
"eval_steps_per_second": 2.141, |
|
"step": 699 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.98271141611266, |
|
"eval_f1": 0.9309382867251821, |
|
"eval_loss": 0.06554248929023743, |
|
"eval_precision": 0.9416055882454148, |
|
"eval_recall": 0.9205099740976217, |
|
"eval_runtime": 14.0197, |
|
"eval_samples_per_second": 1062.501, |
|
"eval_steps_per_second": 2.14, |
|
"step": 932 |
|
}, |
|
{ |
|
"epoch": 4.29, |
|
"learning_rate": 8.69281045751634e-06, |
|
"loss": 0.0906, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.984880977911216, |
|
"eval_f1": 0.9419223941161552, |
|
"eval_loss": 0.06115253269672394, |
|
"eval_precision": 0.9468692637160921, |
|
"eval_recall": 0.9370269452013321, |
|
"eval_runtime": 14.0288, |
|
"eval_samples_per_second": 1061.817, |
|
"eval_steps_per_second": 2.138, |
|
"step": 1165 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.9843269711916506, |
|
"eval_f1": 0.9446501919062689, |
|
"eval_loss": 0.062205445021390915, |
|
"eval_precision": 0.9454459682582471, |
|
"eval_recall": 0.9438557540283244, |
|
"eval_runtime": 14.4851, |
|
"eval_samples_per_second": 1028.367, |
|
"eval_steps_per_second": 2.071, |
|
"step": 1398 |
|
}, |
|
{ |
|
"epoch": 6.44, |
|
"learning_rate": 5.4248366013071894e-06, |
|
"loss": 0.0429, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_accuracy": 0.9854850239473872, |
|
"eval_f1": 0.9466268938436389, |
|
"eval_loss": 0.06088804826140404, |
|
"eval_precision": 0.9484971293481932, |
|
"eval_recall": 0.9447640192417668, |
|
"eval_runtime": 14.327, |
|
"eval_samples_per_second": 1039.716, |
|
"eval_steps_per_second": 2.094, |
|
"step": 1631 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.9853885195510759, |
|
"eval_f1": 0.9475256832068758, |
|
"eval_loss": 0.06388872861862183, |
|
"eval_precision": 0.9456525381135868, |
|
"eval_recall": 0.9494062636660275, |
|
"eval_runtime": 14.5864, |
|
"eval_samples_per_second": 1021.225, |
|
"eval_steps_per_second": 2.057, |
|
"step": 1864 |
|
}, |
|
{ |
|
"epoch": 8.58, |
|
"learning_rate": 2.1568627450980393e-06, |
|
"loss": 0.0265, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_accuracy": 0.9858710415326328, |
|
"eval_f1": 0.9485348353785288, |
|
"eval_loss": 0.06375858187675476, |
|
"eval_precision": 0.9453968253968253, |
|
"eval_recall": 0.9516937464258082, |
|
"eval_runtime": 14.1094, |
|
"eval_samples_per_second": 1055.751, |
|
"eval_steps_per_second": 2.126, |
|
"step": 2097 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_accuracy": 0.9859925655872471, |
|
"eval_f1": 0.949012494961709, |
|
"eval_loss": 0.06480085104703903, |
|
"eval_precision": 0.9475802394607103, |
|
"eval_recall": 0.9504490866888687, |
|
"eval_runtime": 13.7245, |
|
"eval_samples_per_second": 1085.359, |
|
"eval_steps_per_second": 2.186, |
|
"step": 2330 |
|
} |
|
], |
|
"max_steps": 2330, |
|
"num_train_epochs": 10, |
|
"total_flos": 1.6349634872247114e+17, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|