|
{ |
|
"best_metric": 0.5126270055770874, |
|
"best_model_checkpoint": "distilbert_sa_GLUE_Experiment_data_aug_qqp_256/checkpoint-29671", |
|
"epoch": 6.0, |
|
"global_step": 178026, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"learning_rate": 4.900033702942267e-05, |
|
"loss": 0.3952, |
|
"step": 29671 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.7887954489240663, |
|
"eval_combined_score": 0.7594535100431197, |
|
"eval_f1": 0.7301115711621732, |
|
"eval_loss": 0.5126270055770874, |
|
"eval_runtime": 29.5581, |
|
"eval_samples_per_second": 1367.815, |
|
"eval_steps_per_second": 5.345, |
|
"step": 29671 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"learning_rate": 4.8000808870614404e-05, |
|
"loss": 0.2233, |
|
"step": 59342 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.7960178085580015, |
|
"eval_combined_score": 0.7653223515229433, |
|
"eval_f1": 0.7346268944878849, |
|
"eval_loss": 0.5941275954246521, |
|
"eval_runtime": 29.386, |
|
"eval_samples_per_second": 1375.825, |
|
"eval_steps_per_second": 5.377, |
|
"step": 59342 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"learning_rate": 4.700131441474841e-05, |
|
"loss": 0.147, |
|
"step": 89013 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.7996537224833045, |
|
"eval_combined_score": 0.7668394047498941, |
|
"eval_f1": 0.7340250870164838, |
|
"eval_loss": 0.6602815985679626, |
|
"eval_runtime": 29.2551, |
|
"eval_samples_per_second": 1381.981, |
|
"eval_steps_per_second": 5.401, |
|
"step": 89013 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"learning_rate": 4.6001786255940145e-05, |
|
"loss": 0.1067, |
|
"step": 118684 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.801187237200099, |
|
"eval_combined_score": 0.7693823877805914, |
|
"eval_f1": 0.737577538361084, |
|
"eval_loss": 0.7090513110160828, |
|
"eval_runtime": 29.4929, |
|
"eval_samples_per_second": 1370.841, |
|
"eval_steps_per_second": 5.357, |
|
"step": 118684 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"learning_rate": 4.500229180007415e-05, |
|
"loss": 0.082, |
|
"step": 148355 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.7999505317833292, |
|
"eval_combined_score": 0.7688298514410226, |
|
"eval_f1": 0.7377091710987158, |
|
"eval_loss": 0.8757410645484924, |
|
"eval_runtime": 29.0987, |
|
"eval_samples_per_second": 1389.41, |
|
"eval_steps_per_second": 5.43, |
|
"step": 148355 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"learning_rate": 4.400269623538135e-05, |
|
"loss": 0.0652, |
|
"step": 178026 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.8043779371753649, |
|
"eval_combined_score": 0.7711193984706826, |
|
"eval_f1": 0.7378608597660004, |
|
"eval_loss": 0.8331958055496216, |
|
"eval_runtime": 29.279, |
|
"eval_samples_per_second": 1380.855, |
|
"eval_steps_per_second": 5.396, |
|
"step": 178026 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"step": 178026, |
|
"total_flos": 7.776503176668119e+17, |
|
"train_loss": 0.16987583515715401, |
|
"train_runtime": 50655.2686, |
|
"train_samples_per_second": 7497.346, |
|
"train_steps_per_second": 29.287 |
|
} |
|
], |
|
"max_steps": 1483550, |
|
"num_train_epochs": 50, |
|
"total_flos": 7.776503176668119e+17, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|