|
{ |
|
"best_metric": 3.882021427154541, |
|
"best_model_checkpoint": "detr-r50-mist1-bg-2ah-6l/checkpoint-2760", |
|
"epoch": 25.0, |
|
"eval_steps": 500, |
|
"global_step": 2875, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"learning_rate": 9.624347826086956e-06, |
|
"loss": 4.6721, |
|
"step": 115 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_loss": 5.003213882446289, |
|
"eval_runtime": 5.6326, |
|
"eval_samples_per_second": 7.101, |
|
"eval_steps_per_second": 0.888, |
|
"step": 115 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"learning_rate": 9.224347826086957e-06, |
|
"loss": 4.4438, |
|
"step": 230 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_loss": 4.679709434509277, |
|
"eval_runtime": 5.7025, |
|
"eval_samples_per_second": 7.015, |
|
"eval_steps_per_second": 0.877, |
|
"step": 230 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"learning_rate": 8.824347826086957e-06, |
|
"loss": 4.2953, |
|
"step": 345 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_loss": 4.702702522277832, |
|
"eval_runtime": 5.7246, |
|
"eval_samples_per_second": 6.987, |
|
"eval_steps_per_second": 0.873, |
|
"step": 345 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"learning_rate": 8.424347826086958e-06, |
|
"loss": 4.3899, |
|
"step": 460 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_loss": 5.431577682495117, |
|
"eval_runtime": 5.6954, |
|
"eval_samples_per_second": 7.023, |
|
"eval_steps_per_second": 0.878, |
|
"step": 460 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"learning_rate": 8.024347826086956e-06, |
|
"loss": 4.3184, |
|
"step": 575 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_loss": 4.41250467300415, |
|
"eval_runtime": 5.6729, |
|
"eval_samples_per_second": 7.051, |
|
"eval_steps_per_second": 0.881, |
|
"step": 575 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"learning_rate": 7.624347826086958e-06, |
|
"loss": 4.2749, |
|
"step": 690 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_loss": 4.161060810089111, |
|
"eval_runtime": 5.6652, |
|
"eval_samples_per_second": 7.061, |
|
"eval_steps_per_second": 0.883, |
|
"step": 690 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"learning_rate": 7.227826086956522e-06, |
|
"loss": 4.2153, |
|
"step": 805 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_loss": 4.672310829162598, |
|
"eval_runtime": 5.6197, |
|
"eval_samples_per_second": 7.118, |
|
"eval_steps_per_second": 0.89, |
|
"step": 805 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"learning_rate": 6.827826086956523e-06, |
|
"loss": 4.0788, |
|
"step": 920 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_loss": 4.12662410736084, |
|
"eval_runtime": 5.6637, |
|
"eval_samples_per_second": 7.062, |
|
"eval_steps_per_second": 0.883, |
|
"step": 920 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"learning_rate": 6.427826086956523e-06, |
|
"loss": 4.0752, |
|
"step": 1035 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_loss": 4.052855014801025, |
|
"eval_runtime": 5.641, |
|
"eval_samples_per_second": 7.091, |
|
"eval_steps_per_second": 0.886, |
|
"step": 1035 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"learning_rate": 6.027826086956522e-06, |
|
"loss": 4.0073, |
|
"step": 1150 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_loss": 4.448337078094482, |
|
"eval_runtime": 5.6934, |
|
"eval_samples_per_second": 7.026, |
|
"eval_steps_per_second": 0.878, |
|
"step": 1150 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"learning_rate": 5.627826086956523e-06, |
|
"loss": 4.011, |
|
"step": 1265 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_loss": 4.200244426727295, |
|
"eval_runtime": 5.6368, |
|
"eval_samples_per_second": 7.096, |
|
"eval_steps_per_second": 0.887, |
|
"step": 1265 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"learning_rate": 5.227826086956522e-06, |
|
"loss": 3.9993, |
|
"step": 1380 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_loss": 4.2449798583984375, |
|
"eval_runtime": 5.6784, |
|
"eval_samples_per_second": 7.044, |
|
"eval_steps_per_second": 0.881, |
|
"step": 1380 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"learning_rate": 4.827826086956522e-06, |
|
"loss": 4.0028, |
|
"step": 1495 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_loss": 4.170295715332031, |
|
"eval_runtime": 5.8028, |
|
"eval_samples_per_second": 6.893, |
|
"eval_steps_per_second": 0.862, |
|
"step": 1495 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"learning_rate": 4.427826086956522e-06, |
|
"loss": 3.9572, |
|
"step": 1610 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_loss": 4.186112880706787, |
|
"eval_runtime": 5.7389, |
|
"eval_samples_per_second": 6.97, |
|
"eval_steps_per_second": 0.871, |
|
"step": 1610 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"learning_rate": 4.027826086956522e-06, |
|
"loss": 3.9009, |
|
"step": 1725 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_loss": 4.02849006652832, |
|
"eval_runtime": 5.8134, |
|
"eval_samples_per_second": 6.881, |
|
"eval_steps_per_second": 0.86, |
|
"step": 1725 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"learning_rate": 3.627826086956522e-06, |
|
"loss": 3.9173, |
|
"step": 1840 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_loss": 4.06730842590332, |
|
"eval_runtime": 5.7961, |
|
"eval_samples_per_second": 6.901, |
|
"eval_steps_per_second": 0.863, |
|
"step": 1840 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"learning_rate": 3.227826086956522e-06, |
|
"loss": 3.8884, |
|
"step": 1955 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_loss": 3.9875235557556152, |
|
"eval_runtime": 5.7593, |
|
"eval_samples_per_second": 6.945, |
|
"eval_steps_per_second": 0.868, |
|
"step": 1955 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"learning_rate": 2.8278260869565224e-06, |
|
"loss": 3.8415, |
|
"step": 2070 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_loss": 4.106224536895752, |
|
"eval_runtime": 5.7793, |
|
"eval_samples_per_second": 6.921, |
|
"eval_steps_per_second": 0.865, |
|
"step": 2070 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"learning_rate": 2.427826086956522e-06, |
|
"loss": 3.8132, |
|
"step": 2185 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_loss": 4.049378871917725, |
|
"eval_runtime": 5.6624, |
|
"eval_samples_per_second": 7.064, |
|
"eval_steps_per_second": 0.883, |
|
"step": 2185 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"learning_rate": 2.027826086956522e-06, |
|
"loss": 3.8297, |
|
"step": 2300 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_loss": 4.011868476867676, |
|
"eval_runtime": 5.745, |
|
"eval_samples_per_second": 6.963, |
|
"eval_steps_per_second": 0.87, |
|
"step": 2300 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"learning_rate": 1.6278260869565218e-06, |
|
"loss": 3.8262, |
|
"step": 2415 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"eval_loss": 3.953753709793091, |
|
"eval_runtime": 5.7295, |
|
"eval_samples_per_second": 6.981, |
|
"eval_steps_per_second": 0.873, |
|
"step": 2415 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"learning_rate": 1.2278260869565218e-06, |
|
"loss": 3.8045, |
|
"step": 2530 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"eval_loss": 3.950028657913208, |
|
"eval_runtime": 5.8404, |
|
"eval_samples_per_second": 6.849, |
|
"eval_steps_per_second": 0.856, |
|
"step": 2530 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"learning_rate": 8.278260869565217e-07, |
|
"loss": 3.8067, |
|
"step": 2645 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"eval_loss": 3.92639422416687, |
|
"eval_runtime": 5.7491, |
|
"eval_samples_per_second": 6.958, |
|
"eval_steps_per_second": 0.87, |
|
"step": 2645 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"learning_rate": 4.278260869565218e-07, |
|
"loss": 3.7651, |
|
"step": 2760 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_loss": 3.882021427154541, |
|
"eval_runtime": 5.8762, |
|
"eval_samples_per_second": 6.807, |
|
"eval_steps_per_second": 0.851, |
|
"step": 2760 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"learning_rate": 2.7826086956521744e-08, |
|
"loss": 3.756, |
|
"step": 2875 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_loss": 3.9051177501678467, |
|
"eval_runtime": 5.7364, |
|
"eval_samples_per_second": 6.973, |
|
"eval_steps_per_second": 0.872, |
|
"step": 2875 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"step": 2875, |
|
"total_flos": 5.49474551424e+18, |
|
"train_loss": 4.035632897418478, |
|
"train_runtime": 2307.326, |
|
"train_samples_per_second": 4.984, |
|
"train_steps_per_second": 1.246 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 2875, |
|
"num_train_epochs": 25, |
|
"save_steps": 500, |
|
"total_flos": 5.49474551424e+18, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|