|
{ |
|
"best_metric": 0.7565779291131405, |
|
"best_model_checkpoint": "output-no-git/EN-OUTPUT/distilbert-base-cased/FalseTrue-0/2/checkpoint-520", |
|
"epoch": 5.0, |
|
"global_step": 520, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.7446351647377014, |
|
"eval_f1": 0.7378445712448767, |
|
"eval_f1_binary": 0.7800369685767097, |
|
"eval_f1_weighted": 0.7470798170127886, |
|
"eval_loss": 0.7295559048652649, |
|
"eval_runtime": 0.9453, |
|
"eval_samples_per_second": 492.97, |
|
"eval_steps_per_second": 62.415, |
|
"step": 104 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.7424892783164978, |
|
"eval_f1": 0.7401728463897408, |
|
"eval_f1_binary": 0.7647058823529411, |
|
"eval_f1_weighted": 0.7455427383816858, |
|
"eval_loss": 0.9534124732017517, |
|
"eval_runtime": 0.7364, |
|
"eval_samples_per_second": 632.823, |
|
"eval_steps_per_second": 80.121, |
|
"step": 208 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.7618025541305542, |
|
"eval_f1": 0.7543816329922364, |
|
"eval_f1_binary": 0.7970749542961609, |
|
"eval_f1_weighted": 0.7637265230630523, |
|
"eval_loss": 1.0867007970809937, |
|
"eval_runtime": 0.736, |
|
"eval_samples_per_second": 633.169, |
|
"eval_steps_per_second": 80.165, |
|
"step": 312 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.7532188892364502, |
|
"eval_f1": 0.7470105321795617, |
|
"eval_f1_binary": 0.7866419294990724, |
|
"eval_f1_weighted": 0.7556852157130167, |
|
"eval_loss": 1.2413438558578491, |
|
"eval_runtime": 0.7367, |
|
"eval_samples_per_second": 632.508, |
|
"eval_steps_per_second": 80.082, |
|
"step": 416 |
|
}, |
|
{ |
|
"epoch": 4.81, |
|
"learning_rate": 9.316239316239318e-06, |
|
"loss": 0.1347, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.7682403326034546, |
|
"eval_f1": 0.7565779291131405, |
|
"eval_f1_binary": 0.8098591549295775, |
|
"eval_f1_weighted": 0.7682403433476395, |
|
"eval_loss": 1.2424249649047852, |
|
"eval_runtime": 0.7359, |
|
"eval_samples_per_second": 633.202, |
|
"eval_steps_per_second": 80.169, |
|
"step": 520 |
|
} |
|
], |
|
"max_steps": 936, |
|
"num_train_epochs": 9, |
|
"total_flos": 550898794160640.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|