{ "best_metric": 1.6447107791900635, "best_model_checkpoint": "detr-r101-cd45rb-8ah-12l\\checkpoint-115150", "epoch": 25.0, "global_step": 115150, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "learning_rate": 9.00238818931828e-06, "loss": 3.0401, "step": 4606 }, { "epoch": 1.0, "eval_loss": 2.163705587387085, "eval_runtime": 222.5701, "eval_samples_per_second": 8.002, "eval_steps_per_second": 1.002, "step": 4606 }, { "epoch": 2.0, "learning_rate": 8.002822405557968e-06, "loss": 2.7151, "step": 9212 }, { "epoch": 2.0, "eval_loss": 2.06657338142395, "eval_runtime": 222.3447, "eval_samples_per_second": 8.01, "eval_steps_per_second": 1.003, "step": 9212 }, { "epoch": 3.0, "learning_rate": 7.003039513677812e-06, "loss": 2.6021, "step": 13818 }, { "epoch": 3.0, "eval_loss": 1.986824870109558, "eval_runtime": 226.29, "eval_samples_per_second": 7.87, "eval_steps_per_second": 0.985, "step": 13818 }, { "epoch": 4.0, "learning_rate": 6.003473729917499e-06, "loss": 2.5221, "step": 18424 }, { "epoch": 4.0, "eval_loss": 1.8957558870315552, "eval_runtime": 219.599, "eval_samples_per_second": 8.11, "eval_steps_per_second": 1.015, "step": 18424 }, { "epoch": 5.0, "learning_rate": 5.003907946157187e-06, "loss": 2.4541, "step": 23030 }, { "epoch": 5.0, "eval_loss": 1.8809998035430908, "eval_runtime": 222.9944, "eval_samples_per_second": 7.987, "eval_steps_per_second": 1.0, "step": 23030 }, { "epoch": 6.0, "learning_rate": 4.0041250542770305e-06, "loss": 2.4155, "step": 27636 }, { "epoch": 6.0, "eval_loss": 1.8369228839874268, "eval_runtime": 220.1885, "eval_samples_per_second": 8.089, "eval_steps_per_second": 1.013, "step": 27636 }, { "epoch": 7.0, "learning_rate": 3.0047763786365614e-06, "loss": 2.3531, "step": 32242 }, { "epoch": 7.0, "eval_loss": 1.8039908409118652, "eval_runtime": 225.4193, "eval_samples_per_second": 7.901, "eval_steps_per_second": 0.989, "step": 32242 }, { "epoch": 8.0, "learning_rate": 2.004993486756405e-06, "loss": 2.31, "step": 36848 }, { "epoch": 8.0, "eval_loss": 1.797875165939331, "eval_runtime": 219.4975, "eval_samples_per_second": 8.114, "eval_steps_per_second": 1.016, "step": 36848 }, { "epoch": 9.0, "learning_rate": 1.0054277029960922e-06, "loss": 2.2841, "step": 41454 }, { "epoch": 9.0, "eval_loss": 1.7520661354064941, "eval_runtime": 222.6235, "eval_samples_per_second": 8.0, "eval_steps_per_second": 1.002, "step": 41454 }, { "epoch": 10.0, "learning_rate": 5.644811115935737e-09, "loss": 2.2555, "step": 46060 }, { "epoch": 10.0, "eval_loss": 1.7242921590805054, "eval_runtime": 220.3572, "eval_samples_per_second": 8.082, "eval_steps_per_second": 1.012, "step": 46060 }, { "epoch": 11.0, "learning_rate": 5.602518454190186e-06, "loss": 2.3388, "step": 50666 }, { "epoch": 11.0, "eval_loss": 1.8519611358642578, "eval_runtime": 224.9013, "eval_samples_per_second": 7.919, "eval_steps_per_second": 0.992, "step": 50666 }, { "epoch": 12.0, "learning_rate": 5.202605297438124e-06, "loss": 2.3523, "step": 55272 }, { "epoch": 12.0, "eval_loss": 1.8499144315719604, "eval_runtime": 224.2008, "eval_samples_per_second": 7.944, "eval_steps_per_second": 0.995, "step": 55272 }, { "epoch": 13.0, "learning_rate": 4.802778983933999e-06, "loss": 2.3515, "step": 59878 }, { "epoch": 13.0, "eval_loss": 1.7634978294372559, "eval_runtime": 225.8943, "eval_samples_per_second": 7.884, "eval_steps_per_second": 0.987, "step": 59878 }, { "epoch": 14.0, "learning_rate": 4.402865827181937e-06, "loss": 2.3236, "step": 64484 }, { "epoch": 14.0, "eval_loss": 1.7787134647369385, "eval_runtime": 223.7953, "eval_samples_per_second": 7.958, "eval_steps_per_second": 0.996, "step": 64484 }, { "epoch": 15.0, "learning_rate": 4.002952670429874e-06, "loss": 2.2676, "step": 69090 }, { "epoch": 15.0, "eval_loss": 1.7517672777175903, "eval_runtime": 226.211, "eval_samples_per_second": 7.873, "eval_steps_per_second": 0.986, "step": 69090 }, { "epoch": 16.0, "learning_rate": 3.6033000434216243e-06, "loss": 2.2787, "step": 73696 }, { "epoch": 16.0, "eval_loss": 1.7879087924957275, "eval_runtime": 223.8881, "eval_samples_per_second": 7.955, "eval_steps_per_second": 0.996, "step": 73696 }, { "epoch": 17.0, "learning_rate": 3.2033868866695615e-06, "loss": 2.2523, "step": 78302 }, { "epoch": 17.0, "eval_loss": 1.7303467988967896, "eval_runtime": 223.161, "eval_samples_per_second": 7.981, "eval_steps_per_second": 0.999, "step": 78302 }, { "epoch": 18.0, "learning_rate": 2.8035605731654363e-06, "loss": 2.2357, "step": 82908 }, { "epoch": 18.0, "eval_loss": 1.7361239194869995, "eval_runtime": 222.8596, "eval_samples_per_second": 7.992, "eval_steps_per_second": 1.001, "step": 82908 }, { "epoch": 19.0, "learning_rate": 2.4036474164133743e-06, "loss": 2.2068, "step": 87514 }, { "epoch": 19.0, "eval_loss": 1.691589117050171, "eval_runtime": 223.3285, "eval_samples_per_second": 7.975, "eval_steps_per_second": 0.999, "step": 87514 }, { "epoch": 20.0, "learning_rate": 2.0037342596613115e-06, "loss": 2.1972, "step": 92120 }, { "epoch": 20.0, "eval_loss": 1.6940640211105347, "eval_runtime": 222.4012, "eval_samples_per_second": 8.008, "eval_steps_per_second": 1.003, "step": 92120 }, { "epoch": 21.0, "learning_rate": 1.6039079461571863e-06, "loss": 2.1856, "step": 96726 }, { "epoch": 21.0, "eval_loss": 1.6824039220809937, "eval_runtime": 219.7189, "eval_samples_per_second": 8.106, "eval_steps_per_second": 1.015, "step": 96726 }, { "epoch": 22.0, "learning_rate": 1.2039947894051239e-06, "loss": 2.1611, "step": 101332 }, { "epoch": 22.0, "eval_loss": 1.6710505485534668, "eval_runtime": 219.2608, "eval_samples_per_second": 8.123, "eval_steps_per_second": 1.017, "step": 101332 }, { "epoch": 23.0, "learning_rate": 8.041684759009987e-07, "loss": 2.1419, "step": 105938 }, { "epoch": 23.0, "eval_loss": 1.6535351276397705, "eval_runtime": 220.9951, "eval_samples_per_second": 8.059, "eval_steps_per_second": 1.009, "step": 105938 }, { "epoch": 24.0, "learning_rate": 4.0425531914893625e-07, "loss": 2.1412, "step": 110544 }, { "epoch": 24.0, "eval_loss": 1.6602009534835815, "eval_runtime": 477.2637, "eval_samples_per_second": 3.732, "eval_steps_per_second": 0.467, "step": 110544 }, { "epoch": 25.0, "learning_rate": 4.515848892748589e-09, "loss": 2.1285, "step": 115150 }, { "epoch": 25.0, "eval_loss": 1.6447107791900635, "eval_runtime": 581.8045, "eval_samples_per_second": 3.061, "eval_steps_per_second": 0.383, "step": 115150 }, { "epoch": 25.0, "step": 115150, "total_flos": 4.126770236983678e+20, "train_loss": 0.4303329726172384, "train_runtime": 23864.0904, "train_samples_per_second": 19.298, "train_steps_per_second": 4.825 } ], "max_steps": 115150, "num_train_epochs": 25, "total_flos": 4.126770236983678e+20, "trial_name": null, "trial_params": null }