|
{ |
|
"best_metric": 0.18469373881816864, |
|
"best_model_checkpoint": "vessel_ship_types_image_detection/checkpoint-6650", |
|
"epoch": 50.0, |
|
"eval_steps": 500, |
|
"global_step": 6650, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.7160377358490566, |
|
"eval_loss": 1.4629170894622803, |
|
"eval_runtime": 18.5467, |
|
"eval_samples_per_second": 114.306, |
|
"eval_steps_per_second": 3.613, |
|
"step": 133 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.8495283018867924, |
|
"eval_loss": 1.2206131219863892, |
|
"eval_runtime": 18.2977, |
|
"eval_samples_per_second": 115.862, |
|
"eval_steps_per_second": 3.662, |
|
"step": 266 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.870754716981132, |
|
"eval_loss": 1.0089887380599976, |
|
"eval_runtime": 18.4043, |
|
"eval_samples_per_second": 115.19, |
|
"eval_steps_per_second": 3.64, |
|
"step": 399 |
|
}, |
|
{ |
|
"epoch": 3.76, |
|
"learning_rate": 1.8636363636363635e-06, |
|
"loss": 1.1877, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.8962264150943396, |
|
"eval_loss": 0.8400751352310181, |
|
"eval_runtime": 18.4514, |
|
"eval_samples_per_second": 114.896, |
|
"eval_steps_per_second": 3.631, |
|
"step": 532 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.9155660377358491, |
|
"eval_loss": 0.714967668056488, |
|
"eval_runtime": 18.5178, |
|
"eval_samples_per_second": 114.484, |
|
"eval_steps_per_second": 3.618, |
|
"step": 665 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.9292452830188679, |
|
"eval_loss": 0.625623345375061, |
|
"eval_runtime": 18.8638, |
|
"eval_samples_per_second": 112.385, |
|
"eval_steps_per_second": 3.552, |
|
"step": 798 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_accuracy": 0.9382075471698114, |
|
"eval_loss": 0.556588888168335, |
|
"eval_runtime": 18.4533, |
|
"eval_samples_per_second": 114.885, |
|
"eval_steps_per_second": 3.631, |
|
"step": 931 |
|
}, |
|
{ |
|
"epoch": 7.52, |
|
"learning_rate": 1.712121212121212e-06, |
|
"loss": 0.5507, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.9424528301886792, |
|
"eval_loss": 0.5028243064880371, |
|
"eval_runtime": 18.7405, |
|
"eval_samples_per_second": 113.124, |
|
"eval_steps_per_second": 3.575, |
|
"step": 1064 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_accuracy": 0.9481132075471698, |
|
"eval_loss": 0.4585725665092468, |
|
"eval_runtime": 18.5812, |
|
"eval_samples_per_second": 114.094, |
|
"eval_steps_per_second": 3.606, |
|
"step": 1197 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_accuracy": 0.9495283018867925, |
|
"eval_loss": 0.42831137776374817, |
|
"eval_runtime": 18.6399, |
|
"eval_samples_per_second": 113.734, |
|
"eval_steps_per_second": 3.594, |
|
"step": 1330 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_accuracy": 0.9537735849056603, |
|
"eval_loss": 0.398691326379776, |
|
"eval_runtime": 18.7098, |
|
"eval_samples_per_second": 113.309, |
|
"eval_steps_per_second": 3.581, |
|
"step": 1463 |
|
}, |
|
{ |
|
"epoch": 11.28, |
|
"learning_rate": 1.5606060606060604e-06, |
|
"loss": 0.3457, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_accuracy": 0.9556603773584905, |
|
"eval_loss": 0.37774720788002014, |
|
"eval_runtime": 18.6811, |
|
"eval_samples_per_second": 113.484, |
|
"eval_steps_per_second": 3.587, |
|
"step": 1596 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_accuracy": 0.9570754716981132, |
|
"eval_loss": 0.35789886116981506, |
|
"eval_runtime": 19.0448, |
|
"eval_samples_per_second": 111.317, |
|
"eval_steps_per_second": 3.518, |
|
"step": 1729 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_accuracy": 0.9584905660377359, |
|
"eval_loss": 0.3406927287578583, |
|
"eval_runtime": 18.7362, |
|
"eval_samples_per_second": 113.15, |
|
"eval_steps_per_second": 3.576, |
|
"step": 1862 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_accuracy": 0.9580188679245283, |
|
"eval_loss": 0.3256920874118805, |
|
"eval_runtime": 18.4691, |
|
"eval_samples_per_second": 114.786, |
|
"eval_steps_per_second": 3.628, |
|
"step": 1995 |
|
}, |
|
{ |
|
"epoch": 15.04, |
|
"learning_rate": 1.409090909090909e-06, |
|
"loss": 0.2582, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_accuracy": 0.9589622641509434, |
|
"eval_loss": 0.3142967224121094, |
|
"eval_runtime": 18.7522, |
|
"eval_samples_per_second": 113.053, |
|
"eval_steps_per_second": 3.573, |
|
"step": 2128 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_accuracy": 0.9599056603773585, |
|
"eval_loss": 0.30126336216926575, |
|
"eval_runtime": 18.4133, |
|
"eval_samples_per_second": 115.134, |
|
"eval_steps_per_second": 3.639, |
|
"step": 2261 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_accuracy": 0.9627358490566038, |
|
"eval_loss": 0.29247793555259705, |
|
"eval_runtime": 18.4149, |
|
"eval_samples_per_second": 115.124, |
|
"eval_steps_per_second": 3.638, |
|
"step": 2394 |
|
}, |
|
{ |
|
"epoch": 18.8, |
|
"learning_rate": 1.2575757575757576e-06, |
|
"loss": 0.2081, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_accuracy": 0.9617924528301887, |
|
"eval_loss": 0.2814226746559143, |
|
"eval_runtime": 18.5345, |
|
"eval_samples_per_second": 114.381, |
|
"eval_steps_per_second": 3.615, |
|
"step": 2527 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_accuracy": 0.964622641509434, |
|
"eval_loss": 0.27146387100219727, |
|
"eval_runtime": 18.387, |
|
"eval_samples_per_second": 115.299, |
|
"eval_steps_per_second": 3.644, |
|
"step": 2660 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"eval_accuracy": 0.9627358490566038, |
|
"eval_loss": 0.26703450083732605, |
|
"eval_runtime": 18.3186, |
|
"eval_samples_per_second": 115.73, |
|
"eval_steps_per_second": 3.657, |
|
"step": 2793 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"eval_accuracy": 0.9650943396226415, |
|
"eval_loss": 0.2572649121284485, |
|
"eval_runtime": 18.5302, |
|
"eval_samples_per_second": 114.408, |
|
"eval_steps_per_second": 3.616, |
|
"step": 2926 |
|
}, |
|
{ |
|
"epoch": 22.56, |
|
"learning_rate": 1.106060606060606e-06, |
|
"loss": 0.1768, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"eval_accuracy": 0.964622641509434, |
|
"eval_loss": 0.2507427930831909, |
|
"eval_runtime": 18.696, |
|
"eval_samples_per_second": 113.393, |
|
"eval_steps_per_second": 3.584, |
|
"step": 3059 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_accuracy": 0.9660377358490566, |
|
"eval_loss": 0.24606208503246307, |
|
"eval_runtime": 18.2252, |
|
"eval_samples_per_second": 116.322, |
|
"eval_steps_per_second": 3.676, |
|
"step": 3192 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_accuracy": 0.9679245283018868, |
|
"eval_loss": 0.2419576346874237, |
|
"eval_runtime": 18.4449, |
|
"eval_samples_per_second": 114.937, |
|
"eval_steps_per_second": 3.632, |
|
"step": 3325 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"eval_accuracy": 0.965566037735849, |
|
"eval_loss": 0.23377002775669098, |
|
"eval_runtime": 18.4276, |
|
"eval_samples_per_second": 115.045, |
|
"eval_steps_per_second": 3.636, |
|
"step": 3458 |
|
}, |
|
{ |
|
"epoch": 26.32, |
|
"learning_rate": 9.545454545454546e-07, |
|
"loss": 0.154, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"eval_accuracy": 0.9683962264150944, |
|
"eval_loss": 0.22959384322166443, |
|
"eval_runtime": 18.5635, |
|
"eval_samples_per_second": 114.203, |
|
"eval_steps_per_second": 3.609, |
|
"step": 3591 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"eval_accuracy": 0.9674528301886792, |
|
"eval_loss": 0.22633853554725647, |
|
"eval_runtime": 18.435, |
|
"eval_samples_per_second": 114.999, |
|
"eval_steps_per_second": 3.634, |
|
"step": 3724 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"eval_accuracy": 0.9669811320754716, |
|
"eval_loss": 0.22211851179599762, |
|
"eval_runtime": 18.6045, |
|
"eval_samples_per_second": 113.951, |
|
"eval_steps_per_second": 3.601, |
|
"step": 3857 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"eval_accuracy": 0.9674528301886792, |
|
"eval_loss": 0.21722418069839478, |
|
"eval_runtime": 18.5078, |
|
"eval_samples_per_second": 114.546, |
|
"eval_steps_per_second": 3.62, |
|
"step": 3990 |
|
}, |
|
{ |
|
"epoch": 30.08, |
|
"learning_rate": 8.030303030303029e-07, |
|
"loss": 0.137, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"eval_accuracy": 0.9688679245283018, |
|
"eval_loss": 0.21657830476760864, |
|
"eval_runtime": 18.4696, |
|
"eval_samples_per_second": 114.783, |
|
"eval_steps_per_second": 3.628, |
|
"step": 4123 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"eval_accuracy": 0.9693396226415094, |
|
"eval_loss": 0.21263349056243896, |
|
"eval_runtime": 18.5165, |
|
"eval_samples_per_second": 114.492, |
|
"eval_steps_per_second": 3.618, |
|
"step": 4256 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"eval_accuracy": 0.9693396226415094, |
|
"eval_loss": 0.20656518638134003, |
|
"eval_runtime": 18.53, |
|
"eval_samples_per_second": 114.409, |
|
"eval_steps_per_second": 3.616, |
|
"step": 4389 |
|
}, |
|
{ |
|
"epoch": 33.83, |
|
"learning_rate": 6.515151515151515e-07, |
|
"loss": 0.1249, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"eval_accuracy": 0.9688679245283018, |
|
"eval_loss": 0.2059292197227478, |
|
"eval_runtime": 18.417, |
|
"eval_samples_per_second": 115.111, |
|
"eval_steps_per_second": 3.638, |
|
"step": 4522 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"eval_accuracy": 0.9688679245283018, |
|
"eval_loss": 0.202570378780365, |
|
"eval_runtime": 18.4563, |
|
"eval_samples_per_second": 114.866, |
|
"eval_steps_per_second": 3.63, |
|
"step": 4655 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"eval_accuracy": 0.9683962264150944, |
|
"eval_loss": 0.20071472227573395, |
|
"eval_runtime": 18.5005, |
|
"eval_samples_per_second": 114.591, |
|
"eval_steps_per_second": 3.622, |
|
"step": 4788 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"eval_accuracy": 0.9702830188679246, |
|
"eval_loss": 0.19722311198711395, |
|
"eval_runtime": 18.4376, |
|
"eval_samples_per_second": 114.982, |
|
"eval_steps_per_second": 3.634, |
|
"step": 4921 |
|
}, |
|
{ |
|
"epoch": 37.59, |
|
"learning_rate": 5e-07, |
|
"loss": 0.115, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"eval_accuracy": 0.9712264150943396, |
|
"eval_loss": 0.19501303136348724, |
|
"eval_runtime": 18.4088, |
|
"eval_samples_per_second": 115.162, |
|
"eval_steps_per_second": 3.64, |
|
"step": 5054 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"eval_accuracy": 0.9702830188679246, |
|
"eval_loss": 0.19410006701946259, |
|
"eval_runtime": 18.3341, |
|
"eval_samples_per_second": 115.632, |
|
"eval_steps_per_second": 3.654, |
|
"step": 5187 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"eval_accuracy": 0.9702830188679246, |
|
"eval_loss": 0.192692831158638, |
|
"eval_runtime": 18.4143, |
|
"eval_samples_per_second": 115.128, |
|
"eval_steps_per_second": 3.638, |
|
"step": 5320 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"eval_accuracy": 0.9693396226415094, |
|
"eval_loss": 0.19077734649181366, |
|
"eval_runtime": 18.4866, |
|
"eval_samples_per_second": 114.678, |
|
"eval_steps_per_second": 3.624, |
|
"step": 5453 |
|
}, |
|
{ |
|
"epoch": 41.35, |
|
"learning_rate": 3.484848484848485e-07, |
|
"loss": 0.1092, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"eval_accuracy": 0.9712264150943396, |
|
"eval_loss": 0.18846099078655243, |
|
"eval_runtime": 18.4309, |
|
"eval_samples_per_second": 115.024, |
|
"eval_steps_per_second": 3.635, |
|
"step": 5586 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"eval_accuracy": 0.970754716981132, |
|
"eval_loss": 0.18755605816841125, |
|
"eval_runtime": 18.4541, |
|
"eval_samples_per_second": 114.88, |
|
"eval_steps_per_second": 3.631, |
|
"step": 5719 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"eval_accuracy": 0.9702830188679246, |
|
"eval_loss": 0.18720585107803345, |
|
"eval_runtime": 18.5754, |
|
"eval_samples_per_second": 114.129, |
|
"eval_steps_per_second": 3.607, |
|
"step": 5852 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"eval_accuracy": 0.9726415094339622, |
|
"eval_loss": 0.1874205619096756, |
|
"eval_runtime": 18.384, |
|
"eval_samples_per_second": 115.318, |
|
"eval_steps_per_second": 3.644, |
|
"step": 5985 |
|
}, |
|
{ |
|
"epoch": 45.11, |
|
"learning_rate": 1.9696969696969696e-07, |
|
"loss": 0.1037, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"eval_accuracy": 0.9726415094339622, |
|
"eval_loss": 0.18643254041671753, |
|
"eval_runtime": 18.3487, |
|
"eval_samples_per_second": 115.54, |
|
"eval_steps_per_second": 3.651, |
|
"step": 6118 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"eval_accuracy": 0.9721698113207548, |
|
"eval_loss": 0.1849406659603119, |
|
"eval_runtime": 18.5194, |
|
"eval_samples_per_second": 114.474, |
|
"eval_steps_per_second": 3.618, |
|
"step": 6251 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"eval_accuracy": 0.9712264150943396, |
|
"eval_loss": 0.18540790677070618, |
|
"eval_runtime": 18.5314, |
|
"eval_samples_per_second": 114.4, |
|
"eval_steps_per_second": 3.615, |
|
"step": 6384 |
|
}, |
|
{ |
|
"epoch": 48.87, |
|
"learning_rate": 4.545454545454545e-08, |
|
"loss": 0.1022, |
|
"step": 6500 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"eval_accuracy": 0.9712264150943396, |
|
"eval_loss": 0.18494902551174164, |
|
"eval_runtime": 18.5992, |
|
"eval_samples_per_second": 113.983, |
|
"eval_steps_per_second": 3.602, |
|
"step": 6517 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"eval_accuracy": 0.9712264150943396, |
|
"eval_loss": 0.18469373881816864, |
|
"eval_runtime": 18.4003, |
|
"eval_samples_per_second": 115.216, |
|
"eval_steps_per_second": 3.641, |
|
"step": 6650 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 6650, |
|
"num_train_epochs": 50, |
|
"save_steps": 500, |
|
"total_flos": 3.285748704662323e+19, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|