|
{ |
|
"best_metric": 0.8363636363636363, |
|
"best_model_checkpoint": "/content/drive/MyDrive/Colab Notebooks/Classification/ViT/models/resnet-18-finetuned-eurosat/checkpoint-303", |
|
"epoch": 19.753086419753085, |
|
"global_step": 400, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.49, |
|
"learning_rate": 1.25e-05, |
|
"loss": 0.3227, |
|
"step": 10 |
|
}, |
|
{ |
|
"epoch": 0.99, |
|
"learning_rate": 2.5e-05, |
|
"loss": 0.3846, |
|
"step": 20 |
|
}, |
|
{ |
|
"epoch": 0.99, |
|
"eval_accuracy": 0.7575757575757576, |
|
"eval_loss": 0.6352207660675049, |
|
"eval_runtime": 46.0823, |
|
"eval_samples_per_second": 7.161, |
|
"eval_steps_per_second": 0.239, |
|
"step": 20 |
|
}, |
|
{ |
|
"epoch": 1.48, |
|
"learning_rate": 3.7500000000000003e-05, |
|
"loss": 0.3732, |
|
"step": 30 |
|
}, |
|
{ |
|
"epoch": 1.98, |
|
"learning_rate": 5e-05, |
|
"loss": 0.5009, |
|
"step": 40 |
|
}, |
|
{ |
|
"epoch": 1.98, |
|
"eval_accuracy": 0.7484848484848485, |
|
"eval_loss": 0.6438900828361511, |
|
"eval_runtime": 49.1686, |
|
"eval_samples_per_second": 6.712, |
|
"eval_steps_per_second": 0.224, |
|
"step": 40 |
|
}, |
|
{ |
|
"epoch": 2.47, |
|
"learning_rate": 4.8611111111111115e-05, |
|
"loss": 0.4765, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 2.96, |
|
"learning_rate": 4.722222222222222e-05, |
|
"loss": 0.5625, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 2.96, |
|
"eval_accuracy": 0.7909090909090909, |
|
"eval_loss": 0.5722424387931824, |
|
"eval_runtime": 46.1274, |
|
"eval_samples_per_second": 7.154, |
|
"eval_steps_per_second": 0.238, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 3.46, |
|
"learning_rate": 4.5833333333333334e-05, |
|
"loss": 0.5104, |
|
"step": 70 |
|
}, |
|
{ |
|
"epoch": 3.95, |
|
"learning_rate": 4.4444444444444447e-05, |
|
"loss": 0.4928, |
|
"step": 80 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.796969696969697, |
|
"eval_loss": 0.5514332056045532, |
|
"eval_runtime": 45.9331, |
|
"eval_samples_per_second": 7.184, |
|
"eval_steps_per_second": 0.239, |
|
"step": 81 |
|
}, |
|
{ |
|
"epoch": 4.44, |
|
"learning_rate": 4.305555555555556e-05, |
|
"loss": 0.5148, |
|
"step": 90 |
|
}, |
|
{ |
|
"epoch": 4.94, |
|
"learning_rate": 4.166666666666667e-05, |
|
"loss": 0.4621, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 4.99, |
|
"eval_accuracy": 0.7696969696969697, |
|
"eval_loss": 0.6103599071502686, |
|
"eval_runtime": 47.2344, |
|
"eval_samples_per_second": 6.986, |
|
"eval_steps_per_second": 0.233, |
|
"step": 101 |
|
}, |
|
{ |
|
"epoch": 5.43, |
|
"learning_rate": 4.027777777777778e-05, |
|
"loss": 0.4939, |
|
"step": 110 |
|
}, |
|
{ |
|
"epoch": 5.93, |
|
"learning_rate": 3.888888888888889e-05, |
|
"loss": 0.4367, |
|
"step": 120 |
|
}, |
|
{ |
|
"epoch": 5.98, |
|
"eval_accuracy": 0.793939393939394, |
|
"eval_loss": 0.573406994342804, |
|
"eval_runtime": 46.1152, |
|
"eval_samples_per_second": 7.156, |
|
"eval_steps_per_second": 0.239, |
|
"step": 121 |
|
}, |
|
{ |
|
"epoch": 6.42, |
|
"learning_rate": 3.7500000000000003e-05, |
|
"loss": 0.4252, |
|
"step": 130 |
|
}, |
|
{ |
|
"epoch": 6.91, |
|
"learning_rate": 3.611111111111111e-05, |
|
"loss": 0.4238, |
|
"step": 140 |
|
}, |
|
{ |
|
"epoch": 6.96, |
|
"eval_accuracy": 0.8, |
|
"eval_loss": 0.5557721853256226, |
|
"eval_runtime": 48.2781, |
|
"eval_samples_per_second": 6.835, |
|
"eval_steps_per_second": 0.228, |
|
"step": 141 |
|
}, |
|
{ |
|
"epoch": 7.41, |
|
"learning_rate": 3.472222222222222e-05, |
|
"loss": 0.4367, |
|
"step": 150 |
|
}, |
|
{ |
|
"epoch": 7.9, |
|
"learning_rate": 3.3333333333333335e-05, |
|
"loss": 0.4011, |
|
"step": 160 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.803030303030303, |
|
"eval_loss": 0.554872989654541, |
|
"eval_runtime": 46.9595, |
|
"eval_samples_per_second": 7.027, |
|
"eval_steps_per_second": 0.234, |
|
"step": 162 |
|
}, |
|
{ |
|
"epoch": 8.4, |
|
"learning_rate": 3.194444444444444e-05, |
|
"loss": 0.4059, |
|
"step": 170 |
|
}, |
|
{ |
|
"epoch": 8.89, |
|
"learning_rate": 3.055555555555556e-05, |
|
"loss": 0.4129, |
|
"step": 180 |
|
}, |
|
{ |
|
"epoch": 8.99, |
|
"eval_accuracy": 0.806060606060606, |
|
"eval_loss": 0.5553537607192993, |
|
"eval_runtime": 46.217, |
|
"eval_samples_per_second": 7.14, |
|
"eval_steps_per_second": 0.238, |
|
"step": 182 |
|
}, |
|
{ |
|
"epoch": 9.38, |
|
"learning_rate": 2.916666666666667e-05, |
|
"loss": 0.4125, |
|
"step": 190 |
|
}, |
|
{ |
|
"epoch": 9.88, |
|
"learning_rate": 2.777777777777778e-05, |
|
"loss": 0.384, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 9.98, |
|
"eval_accuracy": 0.8151515151515152, |
|
"eval_loss": 0.5550632476806641, |
|
"eval_runtime": 47.8897, |
|
"eval_samples_per_second": 6.891, |
|
"eval_steps_per_second": 0.23, |
|
"step": 202 |
|
}, |
|
{ |
|
"epoch": 10.37, |
|
"learning_rate": 2.6388888888888892e-05, |
|
"loss": 0.3823, |
|
"step": 210 |
|
}, |
|
{ |
|
"epoch": 10.86, |
|
"learning_rate": 2.5e-05, |
|
"loss": 0.3839, |
|
"step": 220 |
|
}, |
|
{ |
|
"epoch": 10.96, |
|
"eval_accuracy": 0.8090909090909091, |
|
"eval_loss": 0.5741792917251587, |
|
"eval_runtime": 46.8547, |
|
"eval_samples_per_second": 7.043, |
|
"eval_steps_per_second": 0.235, |
|
"step": 222 |
|
}, |
|
{ |
|
"epoch": 11.36, |
|
"learning_rate": 2.361111111111111e-05, |
|
"loss": 0.4025, |
|
"step": 230 |
|
}, |
|
{ |
|
"epoch": 11.85, |
|
"learning_rate": 2.2222222222222223e-05, |
|
"loss": 0.3496, |
|
"step": 240 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_accuracy": 0.8303030303030303, |
|
"eval_loss": 0.5517680048942566, |
|
"eval_runtime": 45.796, |
|
"eval_samples_per_second": 7.206, |
|
"eval_steps_per_second": 0.24, |
|
"step": 243 |
|
}, |
|
{ |
|
"epoch": 12.35, |
|
"learning_rate": 2.0833333333333336e-05, |
|
"loss": 0.3389, |
|
"step": 250 |
|
}, |
|
{ |
|
"epoch": 12.84, |
|
"learning_rate": 1.9444444444444445e-05, |
|
"loss": 0.3482, |
|
"step": 260 |
|
}, |
|
{ |
|
"epoch": 12.99, |
|
"eval_accuracy": 0.8303030303030303, |
|
"eval_loss": 0.5389552116394043, |
|
"eval_runtime": 45.5677, |
|
"eval_samples_per_second": 7.242, |
|
"eval_steps_per_second": 0.241, |
|
"step": 263 |
|
}, |
|
{ |
|
"epoch": 13.33, |
|
"learning_rate": 1.8055555555555555e-05, |
|
"loss": 0.3486, |
|
"step": 270 |
|
}, |
|
{ |
|
"epoch": 13.83, |
|
"learning_rate": 1.6666666666666667e-05, |
|
"loss": 0.357, |
|
"step": 280 |
|
}, |
|
{ |
|
"epoch": 13.98, |
|
"eval_accuracy": 0.8181818181818182, |
|
"eval_loss": 0.5543653964996338, |
|
"eval_runtime": 45.3586, |
|
"eval_samples_per_second": 7.275, |
|
"eval_steps_per_second": 0.243, |
|
"step": 283 |
|
}, |
|
{ |
|
"epoch": 14.32, |
|
"learning_rate": 1.527777777777778e-05, |
|
"loss": 0.3397, |
|
"step": 290 |
|
}, |
|
{ |
|
"epoch": 14.81, |
|
"learning_rate": 1.388888888888889e-05, |
|
"loss": 0.3341, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 14.96, |
|
"eval_accuracy": 0.8363636363636363, |
|
"eval_loss": 0.5505930185317993, |
|
"eval_runtime": 45.3368, |
|
"eval_samples_per_second": 7.279, |
|
"eval_steps_per_second": 0.243, |
|
"step": 303 |
|
}, |
|
{ |
|
"epoch": 15.31, |
|
"learning_rate": 1.25e-05, |
|
"loss": 0.3923, |
|
"step": 310 |
|
}, |
|
{ |
|
"epoch": 15.8, |
|
"learning_rate": 1.1111111111111112e-05, |
|
"loss": 0.3605, |
|
"step": 320 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_accuracy": 0.8212121212121212, |
|
"eval_loss": 0.5546284914016724, |
|
"eval_runtime": 45.4708, |
|
"eval_samples_per_second": 7.257, |
|
"eval_steps_per_second": 0.242, |
|
"step": 324 |
|
}, |
|
{ |
|
"epoch": 16.3, |
|
"learning_rate": 9.722222222222223e-06, |
|
"loss": 0.3401, |
|
"step": 330 |
|
}, |
|
{ |
|
"epoch": 16.79, |
|
"learning_rate": 8.333333333333334e-06, |
|
"loss": 0.3041, |
|
"step": 340 |
|
}, |
|
{ |
|
"epoch": 16.99, |
|
"eval_accuracy": 0.8212121212121212, |
|
"eval_loss": 0.5597090125083923, |
|
"eval_runtime": 45.2134, |
|
"eval_samples_per_second": 7.299, |
|
"eval_steps_per_second": 0.243, |
|
"step": 344 |
|
}, |
|
{ |
|
"epoch": 17.28, |
|
"learning_rate": 6.944444444444445e-06, |
|
"loss": 0.3422, |
|
"step": 350 |
|
}, |
|
{ |
|
"epoch": 17.78, |
|
"learning_rate": 5.555555555555556e-06, |
|
"loss": 0.3364, |
|
"step": 360 |
|
}, |
|
{ |
|
"epoch": 17.98, |
|
"eval_accuracy": 0.8090909090909091, |
|
"eval_loss": 0.5729926228523254, |
|
"eval_runtime": 45.0505, |
|
"eval_samples_per_second": 7.325, |
|
"eval_steps_per_second": 0.244, |
|
"step": 364 |
|
}, |
|
{ |
|
"epoch": 18.27, |
|
"learning_rate": 4.166666666666667e-06, |
|
"loss": 0.3156, |
|
"step": 370 |
|
}, |
|
{ |
|
"epoch": 18.77, |
|
"learning_rate": 2.777777777777778e-06, |
|
"loss": 0.2976, |
|
"step": 380 |
|
}, |
|
{ |
|
"epoch": 18.96, |
|
"eval_accuracy": 0.8090909090909091, |
|
"eval_loss": 0.5741696357727051, |
|
"eval_runtime": 45.8457, |
|
"eval_samples_per_second": 7.198, |
|
"eval_steps_per_second": 0.24, |
|
"step": 384 |
|
}, |
|
{ |
|
"epoch": 19.26, |
|
"learning_rate": 1.388888888888889e-06, |
|
"loss": 0.3209, |
|
"step": 390 |
|
}, |
|
{ |
|
"epoch": 19.75, |
|
"learning_rate": 0.0, |
|
"loss": 0.3229, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 19.75, |
|
"eval_accuracy": 0.8121212121212121, |
|
"eval_loss": 0.5653126835823059, |
|
"eval_runtime": 41.6194, |
|
"eval_samples_per_second": 7.929, |
|
"eval_steps_per_second": 0.264, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 19.75, |
|
"step": 400, |
|
"total_flos": 5.1138191421254246e+17, |
|
"train_loss": 0.39375978350639346, |
|
"train_runtime": 7915.8379, |
|
"train_samples_per_second": 6.476, |
|
"train_steps_per_second": 0.051 |
|
} |
|
], |
|
"max_steps": 400, |
|
"num_train_epochs": 20, |
|
"total_flos": 5.1138191421254246e+17, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|