resnet-18-finetuned-eurosat / trainer_state.json
sngsfydy's picture
Model save
25203a2
{
"best_metric": 0.8363636363636363,
"best_model_checkpoint": "/content/drive/MyDrive/Colab Notebooks/Classification/ViT/models/resnet-18-finetuned-eurosat/checkpoint-303",
"epoch": 19.753086419753085,
"global_step": 400,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.49,
"learning_rate": 1.25e-05,
"loss": 0.3227,
"step": 10
},
{
"epoch": 0.99,
"learning_rate": 2.5e-05,
"loss": 0.3846,
"step": 20
},
{
"epoch": 0.99,
"eval_accuracy": 0.7575757575757576,
"eval_loss": 0.6352207660675049,
"eval_runtime": 46.0823,
"eval_samples_per_second": 7.161,
"eval_steps_per_second": 0.239,
"step": 20
},
{
"epoch": 1.48,
"learning_rate": 3.7500000000000003e-05,
"loss": 0.3732,
"step": 30
},
{
"epoch": 1.98,
"learning_rate": 5e-05,
"loss": 0.5009,
"step": 40
},
{
"epoch": 1.98,
"eval_accuracy": 0.7484848484848485,
"eval_loss": 0.6438900828361511,
"eval_runtime": 49.1686,
"eval_samples_per_second": 6.712,
"eval_steps_per_second": 0.224,
"step": 40
},
{
"epoch": 2.47,
"learning_rate": 4.8611111111111115e-05,
"loss": 0.4765,
"step": 50
},
{
"epoch": 2.96,
"learning_rate": 4.722222222222222e-05,
"loss": 0.5625,
"step": 60
},
{
"epoch": 2.96,
"eval_accuracy": 0.7909090909090909,
"eval_loss": 0.5722424387931824,
"eval_runtime": 46.1274,
"eval_samples_per_second": 7.154,
"eval_steps_per_second": 0.238,
"step": 60
},
{
"epoch": 3.46,
"learning_rate": 4.5833333333333334e-05,
"loss": 0.5104,
"step": 70
},
{
"epoch": 3.95,
"learning_rate": 4.4444444444444447e-05,
"loss": 0.4928,
"step": 80
},
{
"epoch": 4.0,
"eval_accuracy": 0.796969696969697,
"eval_loss": 0.5514332056045532,
"eval_runtime": 45.9331,
"eval_samples_per_second": 7.184,
"eval_steps_per_second": 0.239,
"step": 81
},
{
"epoch": 4.44,
"learning_rate": 4.305555555555556e-05,
"loss": 0.5148,
"step": 90
},
{
"epoch": 4.94,
"learning_rate": 4.166666666666667e-05,
"loss": 0.4621,
"step": 100
},
{
"epoch": 4.99,
"eval_accuracy": 0.7696969696969697,
"eval_loss": 0.6103599071502686,
"eval_runtime": 47.2344,
"eval_samples_per_second": 6.986,
"eval_steps_per_second": 0.233,
"step": 101
},
{
"epoch": 5.43,
"learning_rate": 4.027777777777778e-05,
"loss": 0.4939,
"step": 110
},
{
"epoch": 5.93,
"learning_rate": 3.888888888888889e-05,
"loss": 0.4367,
"step": 120
},
{
"epoch": 5.98,
"eval_accuracy": 0.793939393939394,
"eval_loss": 0.573406994342804,
"eval_runtime": 46.1152,
"eval_samples_per_second": 7.156,
"eval_steps_per_second": 0.239,
"step": 121
},
{
"epoch": 6.42,
"learning_rate": 3.7500000000000003e-05,
"loss": 0.4252,
"step": 130
},
{
"epoch": 6.91,
"learning_rate": 3.611111111111111e-05,
"loss": 0.4238,
"step": 140
},
{
"epoch": 6.96,
"eval_accuracy": 0.8,
"eval_loss": 0.5557721853256226,
"eval_runtime": 48.2781,
"eval_samples_per_second": 6.835,
"eval_steps_per_second": 0.228,
"step": 141
},
{
"epoch": 7.41,
"learning_rate": 3.472222222222222e-05,
"loss": 0.4367,
"step": 150
},
{
"epoch": 7.9,
"learning_rate": 3.3333333333333335e-05,
"loss": 0.4011,
"step": 160
},
{
"epoch": 8.0,
"eval_accuracy": 0.803030303030303,
"eval_loss": 0.554872989654541,
"eval_runtime": 46.9595,
"eval_samples_per_second": 7.027,
"eval_steps_per_second": 0.234,
"step": 162
},
{
"epoch": 8.4,
"learning_rate": 3.194444444444444e-05,
"loss": 0.4059,
"step": 170
},
{
"epoch": 8.89,
"learning_rate": 3.055555555555556e-05,
"loss": 0.4129,
"step": 180
},
{
"epoch": 8.99,
"eval_accuracy": 0.806060606060606,
"eval_loss": 0.5553537607192993,
"eval_runtime": 46.217,
"eval_samples_per_second": 7.14,
"eval_steps_per_second": 0.238,
"step": 182
},
{
"epoch": 9.38,
"learning_rate": 2.916666666666667e-05,
"loss": 0.4125,
"step": 190
},
{
"epoch": 9.88,
"learning_rate": 2.777777777777778e-05,
"loss": 0.384,
"step": 200
},
{
"epoch": 9.98,
"eval_accuracy": 0.8151515151515152,
"eval_loss": 0.5550632476806641,
"eval_runtime": 47.8897,
"eval_samples_per_second": 6.891,
"eval_steps_per_second": 0.23,
"step": 202
},
{
"epoch": 10.37,
"learning_rate": 2.6388888888888892e-05,
"loss": 0.3823,
"step": 210
},
{
"epoch": 10.86,
"learning_rate": 2.5e-05,
"loss": 0.3839,
"step": 220
},
{
"epoch": 10.96,
"eval_accuracy": 0.8090909090909091,
"eval_loss": 0.5741792917251587,
"eval_runtime": 46.8547,
"eval_samples_per_second": 7.043,
"eval_steps_per_second": 0.235,
"step": 222
},
{
"epoch": 11.36,
"learning_rate": 2.361111111111111e-05,
"loss": 0.4025,
"step": 230
},
{
"epoch": 11.85,
"learning_rate": 2.2222222222222223e-05,
"loss": 0.3496,
"step": 240
},
{
"epoch": 12.0,
"eval_accuracy": 0.8303030303030303,
"eval_loss": 0.5517680048942566,
"eval_runtime": 45.796,
"eval_samples_per_second": 7.206,
"eval_steps_per_second": 0.24,
"step": 243
},
{
"epoch": 12.35,
"learning_rate": 2.0833333333333336e-05,
"loss": 0.3389,
"step": 250
},
{
"epoch": 12.84,
"learning_rate": 1.9444444444444445e-05,
"loss": 0.3482,
"step": 260
},
{
"epoch": 12.99,
"eval_accuracy": 0.8303030303030303,
"eval_loss": 0.5389552116394043,
"eval_runtime": 45.5677,
"eval_samples_per_second": 7.242,
"eval_steps_per_second": 0.241,
"step": 263
},
{
"epoch": 13.33,
"learning_rate": 1.8055555555555555e-05,
"loss": 0.3486,
"step": 270
},
{
"epoch": 13.83,
"learning_rate": 1.6666666666666667e-05,
"loss": 0.357,
"step": 280
},
{
"epoch": 13.98,
"eval_accuracy": 0.8181818181818182,
"eval_loss": 0.5543653964996338,
"eval_runtime": 45.3586,
"eval_samples_per_second": 7.275,
"eval_steps_per_second": 0.243,
"step": 283
},
{
"epoch": 14.32,
"learning_rate": 1.527777777777778e-05,
"loss": 0.3397,
"step": 290
},
{
"epoch": 14.81,
"learning_rate": 1.388888888888889e-05,
"loss": 0.3341,
"step": 300
},
{
"epoch": 14.96,
"eval_accuracy": 0.8363636363636363,
"eval_loss": 0.5505930185317993,
"eval_runtime": 45.3368,
"eval_samples_per_second": 7.279,
"eval_steps_per_second": 0.243,
"step": 303
},
{
"epoch": 15.31,
"learning_rate": 1.25e-05,
"loss": 0.3923,
"step": 310
},
{
"epoch": 15.8,
"learning_rate": 1.1111111111111112e-05,
"loss": 0.3605,
"step": 320
},
{
"epoch": 16.0,
"eval_accuracy": 0.8212121212121212,
"eval_loss": 0.5546284914016724,
"eval_runtime": 45.4708,
"eval_samples_per_second": 7.257,
"eval_steps_per_second": 0.242,
"step": 324
},
{
"epoch": 16.3,
"learning_rate": 9.722222222222223e-06,
"loss": 0.3401,
"step": 330
},
{
"epoch": 16.79,
"learning_rate": 8.333333333333334e-06,
"loss": 0.3041,
"step": 340
},
{
"epoch": 16.99,
"eval_accuracy": 0.8212121212121212,
"eval_loss": 0.5597090125083923,
"eval_runtime": 45.2134,
"eval_samples_per_second": 7.299,
"eval_steps_per_second": 0.243,
"step": 344
},
{
"epoch": 17.28,
"learning_rate": 6.944444444444445e-06,
"loss": 0.3422,
"step": 350
},
{
"epoch": 17.78,
"learning_rate": 5.555555555555556e-06,
"loss": 0.3364,
"step": 360
},
{
"epoch": 17.98,
"eval_accuracy": 0.8090909090909091,
"eval_loss": 0.5729926228523254,
"eval_runtime": 45.0505,
"eval_samples_per_second": 7.325,
"eval_steps_per_second": 0.244,
"step": 364
},
{
"epoch": 18.27,
"learning_rate": 4.166666666666667e-06,
"loss": 0.3156,
"step": 370
},
{
"epoch": 18.77,
"learning_rate": 2.777777777777778e-06,
"loss": 0.2976,
"step": 380
},
{
"epoch": 18.96,
"eval_accuracy": 0.8090909090909091,
"eval_loss": 0.5741696357727051,
"eval_runtime": 45.8457,
"eval_samples_per_second": 7.198,
"eval_steps_per_second": 0.24,
"step": 384
},
{
"epoch": 19.26,
"learning_rate": 1.388888888888889e-06,
"loss": 0.3209,
"step": 390
},
{
"epoch": 19.75,
"learning_rate": 0.0,
"loss": 0.3229,
"step": 400
},
{
"epoch": 19.75,
"eval_accuracy": 0.8121212121212121,
"eval_loss": 0.5653126835823059,
"eval_runtime": 41.6194,
"eval_samples_per_second": 7.929,
"eval_steps_per_second": 0.264,
"step": 400
},
{
"epoch": 19.75,
"step": 400,
"total_flos": 5.1138191421254246e+17,
"train_loss": 0.39375978350639346,
"train_runtime": 7915.8379,
"train_samples_per_second": 6.476,
"train_steps_per_second": 0.051
}
],
"max_steps": 400,
"num_train_epochs": 20,
"total_flos": 5.1138191421254246e+17,
"trial_name": null,
"trial_params": null
}