|
{ |
|
"best_metric": 0.8578431372549019, |
|
"best_model_checkpoint": "./bert-base-uncased/fine_tuned_models/checkpoint-460", |
|
"epoch": 10.0, |
|
"global_step": 1150, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"learning_rate": 1e-05, |
|
"loss": 0.6308, |
|
"step": 115 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.7058823529411765, |
|
"eval_combined_score": 0.7639204049572351, |
|
"eval_f1": 0.8219584569732937, |
|
"eval_loss": 0.5484543442726135, |
|
"eval_runtime": 1.1176, |
|
"eval_samples_per_second": 365.063, |
|
"eval_steps_per_second": 45.633, |
|
"step": 115 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"learning_rate": 2e-05, |
|
"loss": 0.488, |
|
"step": 230 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.7990196078431373, |
|
"eval_combined_score": 0.8344304388422037, |
|
"eval_f1": 0.86984126984127, |
|
"eval_loss": 0.44723159074783325, |
|
"eval_runtime": 1.121, |
|
"eval_samples_per_second": 363.966, |
|
"eval_steps_per_second": 45.496, |
|
"step": 230 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"learning_rate": 1.7500000000000002e-05, |
|
"loss": 0.3019, |
|
"step": 345 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.8406862745098039, |
|
"eval_combined_score": 0.8653515974917887, |
|
"eval_f1": 0.8900169204737733, |
|
"eval_loss": 0.3739049434661865, |
|
"eval_runtime": 1.1236, |
|
"eval_samples_per_second": 363.103, |
|
"eval_steps_per_second": 45.388, |
|
"step": 345 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"learning_rate": 1.5000000000000002e-05, |
|
"loss": 0.1395, |
|
"step": 460 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.8578431372549019, |
|
"eval_combined_score": 0.8790933899332929, |
|
"eval_f1": 0.9003436426116839, |
|
"eval_loss": 0.48073676228523254, |
|
"eval_runtime": 1.1302, |
|
"eval_samples_per_second": 360.994, |
|
"eval_steps_per_second": 45.124, |
|
"step": 460 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"learning_rate": 1.25e-05, |
|
"loss": 0.0603, |
|
"step": 575 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.8357843137254902, |
|
"eval_combined_score": 0.8594279334770557, |
|
"eval_f1": 0.8830715532286212, |
|
"eval_loss": 0.6254621148109436, |
|
"eval_runtime": 1.1347, |
|
"eval_samples_per_second": 359.579, |
|
"eval_steps_per_second": 44.947, |
|
"step": 575 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"learning_rate": 1e-05, |
|
"loss": 0.0356, |
|
"step": 690 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.8431372549019608, |
|
"eval_combined_score": 0.8676965735789266, |
|
"eval_f1": 0.8922558922558923, |
|
"eval_loss": 0.8049449324607849, |
|
"eval_runtime": 1.1199, |
|
"eval_samples_per_second": 364.325, |
|
"eval_steps_per_second": 45.541, |
|
"step": 690 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"learning_rate": 7.500000000000001e-06, |
|
"loss": 0.0267, |
|
"step": 805 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_accuracy": 0.8455882352941176, |
|
"eval_combined_score": 0.8668438512172187, |
|
"eval_f1": 0.8880994671403197, |
|
"eval_loss": 0.7565263509750366, |
|
"eval_runtime": 1.1371, |
|
"eval_samples_per_second": 358.818, |
|
"eval_steps_per_second": 44.852, |
|
"step": 805 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"learning_rate": 5e-06, |
|
"loss": 0.0117, |
|
"step": 920 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.8382352941176471, |
|
"eval_combined_score": 0.8622210953346856, |
|
"eval_f1": 0.8862068965517241, |
|
"eval_loss": 0.8377837538719177, |
|
"eval_runtime": 1.1383, |
|
"eval_samples_per_second": 358.436, |
|
"eval_steps_per_second": 44.805, |
|
"step": 920 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"learning_rate": 2.5e-06, |
|
"loss": 0.0086, |
|
"step": 1035 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_accuracy": 0.8382352941176471, |
|
"eval_combined_score": 0.8614253393665159, |
|
"eval_f1": 0.8846153846153846, |
|
"eval_loss": 0.870381772518158, |
|
"eval_runtime": 1.1281, |
|
"eval_samples_per_second": 361.659, |
|
"eval_steps_per_second": 45.207, |
|
"step": 1035 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"learning_rate": 0.0, |
|
"loss": 0.0075, |
|
"step": 1150 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_accuracy": 0.8406862745098039, |
|
"eval_combined_score": 0.8640173140313319, |
|
"eval_f1": 0.8873483535528597, |
|
"eval_loss": 0.8665909171104431, |
|
"eval_runtime": 1.1293, |
|
"eval_samples_per_second": 361.28, |
|
"eval_steps_per_second": 45.16, |
|
"step": 1150 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"step": 1150, |
|
"total_flos": 2412728377651200.0, |
|
"train_loss": 0.17106628703034443, |
|
"train_runtime": 327.4394, |
|
"train_samples_per_second": 112.021, |
|
"train_steps_per_second": 3.512 |
|
} |
|
], |
|
"max_steps": 1150, |
|
"num_train_epochs": 10, |
|
"total_flos": 2412728377651200.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|