gokuls's picture
End of training
8090099
{
"best_metric": 0.611058235168457,
"best_model_checkpoint": "mobilebert_sa_GLUE_Experiment_mrpc_256/checkpoint-232",
"epoch": 13.0,
"global_step": 377,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"learning_rate": 4.9e-05,
"loss": 0.6431,
"step": 29
},
{
"epoch": 1.0,
"eval_accuracy": 0.6838235294117647,
"eval_combined_score": 0.7480253018237863,
"eval_f1": 0.8122270742358079,
"eval_loss": 0.626089870929718,
"eval_runtime": 0.9456,
"eval_samples_per_second": 431.492,
"eval_steps_per_second": 4.23,
"step": 29
},
{
"epoch": 2.0,
"learning_rate": 4.8e-05,
"loss": 0.6296,
"step": 58
},
{
"epoch": 2.0,
"eval_accuracy": 0.6838235294117647,
"eval_combined_score": 0.7480253018237863,
"eval_f1": 0.8122270742358079,
"eval_loss": 0.6234638094902039,
"eval_runtime": 0.9411,
"eval_samples_per_second": 433.528,
"eval_steps_per_second": 4.25,
"step": 58
},
{
"epoch": 3.0,
"learning_rate": 4.7e-05,
"loss": 0.6306,
"step": 87
},
{
"epoch": 3.0,
"eval_accuracy": 0.6838235294117647,
"eval_combined_score": 0.7480253018237863,
"eval_f1": 0.8122270742358079,
"eval_loss": 0.6237208247184753,
"eval_runtime": 0.937,
"eval_samples_per_second": 435.41,
"eval_steps_per_second": 4.269,
"step": 87
},
{
"epoch": 4.0,
"learning_rate": 4.600000000000001e-05,
"loss": 0.6297,
"step": 116
},
{
"epoch": 4.0,
"eval_accuracy": 0.6838235294117647,
"eval_combined_score": 0.7480253018237863,
"eval_f1": 0.8122270742358079,
"eval_loss": 0.6237556338310242,
"eval_runtime": 0.9403,
"eval_samples_per_second": 433.895,
"eval_steps_per_second": 4.254,
"step": 116
},
{
"epoch": 5.0,
"learning_rate": 4.5e-05,
"loss": 0.6276,
"step": 145
},
{
"epoch": 5.0,
"eval_accuracy": 0.6838235294117647,
"eval_combined_score": 0.7480253018237863,
"eval_f1": 0.8122270742358079,
"eval_loss": 0.6206657290458679,
"eval_runtime": 0.9389,
"eval_samples_per_second": 434.555,
"eval_steps_per_second": 4.26,
"step": 145
},
{
"epoch": 6.0,
"learning_rate": 4.4000000000000006e-05,
"loss": 0.6197,
"step": 174
},
{
"epoch": 6.0,
"eval_accuracy": 0.6838235294117647,
"eval_combined_score": 0.7480253018237863,
"eval_f1": 0.8122270742358079,
"eval_loss": 0.6212654709815979,
"eval_runtime": 0.9398,
"eval_samples_per_second": 434.126,
"eval_steps_per_second": 4.256,
"step": 174
},
{
"epoch": 7.0,
"learning_rate": 4.3e-05,
"loss": 0.6065,
"step": 203
},
{
"epoch": 7.0,
"eval_accuracy": 0.6911764705882353,
"eval_combined_score": 0.7477621483375959,
"eval_f1": 0.8043478260869565,
"eval_loss": 0.6284083724021912,
"eval_runtime": 0.9178,
"eval_samples_per_second": 444.537,
"eval_steps_per_second": 4.358,
"step": 203
},
{
"epoch": 8.0,
"learning_rate": 4.2e-05,
"loss": 0.5258,
"step": 232
},
{
"epoch": 8.0,
"eval_accuracy": 0.6911764705882353,
"eval_combined_score": 0.7429823721019352,
"eval_f1": 0.7947882736156351,
"eval_loss": 0.611058235168457,
"eval_runtime": 0.9172,
"eval_samples_per_second": 444.815,
"eval_steps_per_second": 4.361,
"step": 232
},
{
"epoch": 9.0,
"learning_rate": 4.1e-05,
"loss": 0.4596,
"step": 261
},
{
"epoch": 9.0,
"eval_accuracy": 0.7034313725490197,
"eval_combined_score": 0.7542921758075211,
"eval_f1": 0.8051529790660225,
"eval_loss": 0.6506468057632446,
"eval_runtime": 0.9479,
"eval_samples_per_second": 430.438,
"eval_steps_per_second": 4.22,
"step": 261
},
{
"epoch": 10.0,
"learning_rate": 4e-05,
"loss": 0.3953,
"step": 290
},
{
"epoch": 10.0,
"eval_accuracy": 0.7034313725490197,
"eval_combined_score": 0.7482968828557064,
"eval_f1": 0.7931623931623932,
"eval_loss": 0.7271472811698914,
"eval_runtime": 0.9357,
"eval_samples_per_second": 436.055,
"eval_steps_per_second": 4.275,
"step": 290
},
{
"epoch": 11.0,
"learning_rate": 3.9000000000000006e-05,
"loss": 0.3426,
"step": 319
},
{
"epoch": 11.0,
"eval_accuracy": 0.6740196078431373,
"eval_combined_score": 0.7140892863614947,
"eval_f1": 0.7541589648798522,
"eval_loss": 0.9509055018424988,
"eval_runtime": 0.944,
"eval_samples_per_second": 432.196,
"eval_steps_per_second": 4.237,
"step": 319
},
{
"epoch": 12.0,
"learning_rate": 3.8e-05,
"loss": 0.2821,
"step": 348
},
{
"epoch": 12.0,
"eval_accuracy": 0.6862745098039216,
"eval_combined_score": 0.7335482138060704,
"eval_f1": 0.7808219178082192,
"eval_loss": 1.0021162033081055,
"eval_runtime": 0.9425,
"eval_samples_per_second": 432.902,
"eval_steps_per_second": 4.244,
"step": 348
},
{
"epoch": 13.0,
"learning_rate": 3.7e-05,
"loss": 0.2177,
"step": 377
},
{
"epoch": 13.0,
"eval_accuracy": 0.6691176470588235,
"eval_combined_score": 0.7183798218082413,
"eval_f1": 0.7676419965576592,
"eval_loss": 1.0359125137329102,
"eval_runtime": 0.9408,
"eval_samples_per_second": 433.683,
"eval_steps_per_second": 4.252,
"step": 377
},
{
"epoch": 13.0,
"step": 377,
"total_flos": 1256051433275392.0,
"train_loss": 0.5084376322495843,
"train_runtime": 493.204,
"train_samples_per_second": 371.854,
"train_steps_per_second": 2.94
}
],
"max_steps": 1450,
"num_train_epochs": 50,
"total_flos": 1256051433275392.0,
"trial_name": null,
"trial_params": null
}