|
{ |
|
"best_metric": 0.8970588235294118, |
|
"best_model_checkpoint": "./bert-base-uncased/fine_tuned_models/checkpoint-575", |
|
"epoch": 10.0, |
|
"global_step": 1150, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"learning_rate": 1e-05, |
|
"loss": 0.6336, |
|
"step": 115 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.6838235294117647, |
|
"eval_combined_score": 0.7480253018237863, |
|
"eval_f1": 0.8122270742358079, |
|
"eval_loss": 0.538364589214325, |
|
"eval_runtime": 1.089, |
|
"eval_samples_per_second": 374.663, |
|
"eval_steps_per_second": 46.833, |
|
"step": 115 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"learning_rate": 2e-05, |
|
"loss": 0.482, |
|
"step": 230 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.8357843137254902, |
|
"eval_combined_score": 0.8625202560362988, |
|
"eval_f1": 0.8892561983471075, |
|
"eval_loss": 0.40759965777397156, |
|
"eval_runtime": 1.0806, |
|
"eval_samples_per_second": 377.572, |
|
"eval_steps_per_second": 47.196, |
|
"step": 230 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"learning_rate": 1.7500000000000002e-05, |
|
"loss": 0.3576, |
|
"step": 345 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.875, |
|
"eval_combined_score": 0.8912205081669691, |
|
"eval_f1": 0.9074410163339381, |
|
"eval_loss": 0.2955787181854248, |
|
"eval_runtime": 1.0806, |
|
"eval_samples_per_second": 377.557, |
|
"eval_steps_per_second": 47.195, |
|
"step": 345 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"learning_rate": 1.5000000000000002e-05, |
|
"loss": 0.2205, |
|
"step": 460 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.8921568627450981, |
|
"eval_combined_score": 0.9076168929110106, |
|
"eval_f1": 0.923076923076923, |
|
"eval_loss": 0.3020019829273224, |
|
"eval_runtime": 1.0822, |
|
"eval_samples_per_second": 376.994, |
|
"eval_steps_per_second": 47.124, |
|
"step": 460 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"learning_rate": 1.25e-05, |
|
"loss": 0.1258, |
|
"step": 575 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.8970588235294118, |
|
"eval_combined_score": 0.9106232745805904, |
|
"eval_f1": 0.924187725631769, |
|
"eval_loss": 0.3507114052772522, |
|
"eval_runtime": 1.0903, |
|
"eval_samples_per_second": 374.196, |
|
"eval_steps_per_second": 46.775, |
|
"step": 575 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"learning_rate": 1e-05, |
|
"loss": 0.0893, |
|
"step": 690 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.8848039215686274, |
|
"eval_combined_score": 0.8994403520091766, |
|
"eval_f1": 0.9140767824497258, |
|
"eval_loss": 0.46679043769836426, |
|
"eval_runtime": 1.0897, |
|
"eval_samples_per_second": 374.408, |
|
"eval_steps_per_second": 46.801, |
|
"step": 690 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"learning_rate": 7.500000000000001e-06, |
|
"loss": 0.0635, |
|
"step": 805 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_accuracy": 0.8921568627450981, |
|
"eval_combined_score": 0.906510086048808, |
|
"eval_f1": 0.9208633093525179, |
|
"eval_loss": 0.5193934440612793, |
|
"eval_runtime": 1.1035, |
|
"eval_samples_per_second": 369.736, |
|
"eval_steps_per_second": 46.217, |
|
"step": 805 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"learning_rate": 5e-06, |
|
"loss": 0.0391, |
|
"step": 920 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.8897058823529411, |
|
"eval_combined_score": 0.9040180954414434, |
|
"eval_f1": 0.9183303085299456, |
|
"eval_loss": 0.642646312713623, |
|
"eval_runtime": 1.0978, |
|
"eval_samples_per_second": 371.638, |
|
"eval_steps_per_second": 46.455, |
|
"step": 920 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"learning_rate": 2.5e-06, |
|
"loss": 0.0294, |
|
"step": 1035 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_accuracy": 0.8848039215686274, |
|
"eval_combined_score": 0.9003626047914693, |
|
"eval_f1": 0.9159212880143113, |
|
"eval_loss": 0.6596136689186096, |
|
"eval_runtime": 1.1007, |
|
"eval_samples_per_second": 370.671, |
|
"eval_steps_per_second": 46.334, |
|
"step": 1035 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"learning_rate": 0.0, |
|
"loss": 0.0163, |
|
"step": 1150 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_accuracy": 0.8921568627450981, |
|
"eval_combined_score": 0.9063672400368089, |
|
"eval_f1": 0.9205776173285197, |
|
"eval_loss": 0.6627745628356934, |
|
"eval_runtime": 1.1037, |
|
"eval_samples_per_second": 369.676, |
|
"eval_steps_per_second": 46.209, |
|
"step": 1150 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"step": 1150, |
|
"total_flos": 2412728377651200.0, |
|
"train_loss": 0.20570029414218405, |
|
"train_runtime": 332.3723, |
|
"train_samples_per_second": 110.358, |
|
"train_steps_per_second": 3.46 |
|
} |
|
], |
|
"max_steps": 1150, |
|
"num_train_epochs": 10, |
|
"total_flos": 2412728377651200.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|