{ "best_metric": 2.917006731033325, "best_model_checkpoint": "detr-r50-mist1-bg-8ah-4l/checkpoint-2415", "epoch": 25.0, "eval_steps": 500, "global_step": 2875, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "learning_rate": 9.624347826086956e-06, "loss": 4.4466, "step": 115 }, { "epoch": 1.0, "eval_loss": 3.812701463699341, "eval_runtime": 5.8935, "eval_samples_per_second": 6.787, "eval_steps_per_second": 0.848, "step": 115 }, { "epoch": 2.0, "learning_rate": 9.224347826086957e-06, "loss": 3.85, "step": 230 }, { "epoch": 2.0, "eval_loss": 3.863551378250122, "eval_runtime": 5.9222, "eval_samples_per_second": 6.754, "eval_steps_per_second": 0.844, "step": 230 }, { "epoch": 3.0, "learning_rate": 8.824347826086957e-06, "loss": 3.8198, "step": 345 }, { "epoch": 3.0, "eval_loss": 3.617934465408325, "eval_runtime": 5.9064, "eval_samples_per_second": 6.772, "eval_steps_per_second": 0.847, "step": 345 }, { "epoch": 4.0, "learning_rate": 8.427826086956521e-06, "loss": 3.6799, "step": 460 }, { "epoch": 4.0, "eval_loss": 3.455796003341675, "eval_runtime": 6.041, "eval_samples_per_second": 6.621, "eval_steps_per_second": 0.828, "step": 460 }, { "epoch": 5.0, "learning_rate": 8.027826086956523e-06, "loss": 3.5806, "step": 575 }, { "epoch": 5.0, "eval_loss": 3.2327613830566406, "eval_runtime": 5.9282, "eval_samples_per_second": 6.747, "eval_steps_per_second": 0.843, "step": 575 }, { "epoch": 6.0, "learning_rate": 7.631304347826087e-06, "loss": 3.4958, "step": 690 }, { "epoch": 6.0, "eval_loss": 3.340712070465088, "eval_runtime": 5.9472, "eval_samples_per_second": 6.726, "eval_steps_per_second": 0.841, "step": 690 }, { "epoch": 7.0, "learning_rate": 7.231304347826088e-06, "loss": 3.4662, "step": 805 }, { "epoch": 7.0, "eval_loss": 3.156733989715576, "eval_runtime": 5.8659, "eval_samples_per_second": 6.819, "eval_steps_per_second": 0.852, "step": 805 }, { "epoch": 8.0, "learning_rate": 6.8313043478260874e-06, "loss": 3.4295, "step": 920 }, { "epoch": 8.0, "eval_loss": 3.049887180328369, "eval_runtime": 5.8059, "eval_samples_per_second": 6.89, "eval_steps_per_second": 0.861, "step": 920 }, { "epoch": 9.0, "learning_rate": 6.431304347826087e-06, "loss": 3.3977, "step": 1035 }, { "epoch": 9.0, "eval_loss": 3.0459601879119873, "eval_runtime": 5.876, "eval_samples_per_second": 6.807, "eval_steps_per_second": 0.851, "step": 1035 }, { "epoch": 10.0, "learning_rate": 6.031304347826088e-06, "loss": 3.3853, "step": 1150 }, { "epoch": 10.0, "eval_loss": 3.048147678375244, "eval_runtime": 5.737, "eval_samples_per_second": 6.972, "eval_steps_per_second": 0.872, "step": 1150 }, { "epoch": 11.0, "learning_rate": 5.631304347826088e-06, "loss": 3.3608, "step": 1265 }, { "epoch": 11.0, "eval_loss": 3.033698558807373, "eval_runtime": 5.8795, "eval_samples_per_second": 6.803, "eval_steps_per_second": 0.85, "step": 1265 }, { "epoch": 12.0, "learning_rate": 5.2313043478260875e-06, "loss": 3.2873, "step": 1380 }, { "epoch": 12.0, "eval_loss": 3.053478479385376, "eval_runtime": 5.7373, "eval_samples_per_second": 6.972, "eval_steps_per_second": 0.871, "step": 1380 }, { "epoch": 13.0, "learning_rate": 4.831304347826087e-06, "loss": 3.3164, "step": 1495 }, { "epoch": 13.0, "eval_loss": 3.0139570236206055, "eval_runtime": 5.7591, "eval_samples_per_second": 6.945, "eval_steps_per_second": 0.868, "step": 1495 }, { "epoch": 14.0, "learning_rate": 4.4313043478260875e-06, "loss": 3.2745, "step": 1610 }, { "epoch": 14.0, "eval_loss": 3.0666890144348145, "eval_runtime": 5.6397, "eval_samples_per_second": 7.093, "eval_steps_per_second": 0.887, "step": 1610 }, { "epoch": 15.0, "learning_rate": 4.031304347826087e-06, "loss": 3.2691, "step": 1725 }, { "epoch": 15.0, "eval_loss": 3.013432264328003, "eval_runtime": 5.7704, "eval_samples_per_second": 6.932, "eval_steps_per_second": 0.866, "step": 1725 }, { "epoch": 16.0, "learning_rate": 3.631304347826087e-06, "loss": 3.2735, "step": 1840 }, { "epoch": 16.0, "eval_loss": 3.020738124847412, "eval_runtime": 5.8757, "eval_samples_per_second": 6.808, "eval_steps_per_second": 0.851, "step": 1840 }, { "epoch": 17.0, "learning_rate": 3.2313043478260876e-06, "loss": 3.2718, "step": 1955 }, { "epoch": 17.0, "eval_loss": 3.0004284381866455, "eval_runtime": 5.6729, "eval_samples_per_second": 7.051, "eval_steps_per_second": 0.881, "step": 1955 }, { "epoch": 18.0, "learning_rate": 2.831304347826087e-06, "loss": 3.2504, "step": 2070 }, { "epoch": 18.0, "eval_loss": 3.1082119941711426, "eval_runtime": 5.6759, "eval_samples_per_second": 7.047, "eval_steps_per_second": 0.881, "step": 2070 }, { "epoch": 19.0, "learning_rate": 2.431304347826087e-06, "loss": 3.243, "step": 2185 }, { "epoch": 19.0, "eval_loss": 2.9369025230407715, "eval_runtime": 5.8335, "eval_samples_per_second": 6.857, "eval_steps_per_second": 0.857, "step": 2185 }, { "epoch": 20.0, "learning_rate": 2.0313043478260872e-06, "loss": 3.1669, "step": 2300 }, { "epoch": 20.0, "eval_loss": 2.9595999717712402, "eval_runtime": 5.8209, "eval_samples_per_second": 6.872, "eval_steps_per_second": 0.859, "step": 2300 }, { "epoch": 21.0, "learning_rate": 1.6347826086956523e-06, "loss": 3.1844, "step": 2415 }, { "epoch": 21.0, "eval_loss": 2.917006731033325, "eval_runtime": 5.8161, "eval_samples_per_second": 6.877, "eval_steps_per_second": 0.86, "step": 2415 }, { "epoch": 22.0, "learning_rate": 1.2347826086956523e-06, "loss": 3.1979, "step": 2530 }, { "epoch": 22.0, "eval_loss": 2.934359073638916, "eval_runtime": 5.7645, "eval_samples_per_second": 6.939, "eval_steps_per_second": 0.867, "step": 2530 }, { "epoch": 23.0, "learning_rate": 8.347826086956523e-07, "loss": 3.1702, "step": 2645 }, { "epoch": 23.0, "eval_loss": 2.9261698722839355, "eval_runtime": 5.8376, "eval_samples_per_second": 6.852, "eval_steps_per_second": 0.857, "step": 2645 }, { "epoch": 24.0, "learning_rate": 4.347826086956522e-07, "loss": 3.1738, "step": 2760 }, { "epoch": 24.0, "eval_loss": 2.925136089324951, "eval_runtime": 5.7559, "eval_samples_per_second": 6.949, "eval_steps_per_second": 0.869, "step": 2760 }, { "epoch": 25.0, "learning_rate": 3.478260869565218e-08, "loss": 3.1606, "step": 2875 }, { "epoch": 25.0, "eval_loss": 2.9274065494537354, "eval_runtime": 5.8001, "eval_samples_per_second": 6.896, "eval_steps_per_second": 0.862, "step": 2875 }, { "epoch": 25.0, "step": 2875, "total_flos": 4.7279979072e+18, "train_loss": 3.4060823072350543, "train_runtime": 2285.4543, "train_samples_per_second": 5.032, "train_steps_per_second": 1.258 } ], "logging_steps": 500, "max_steps": 2875, "num_train_epochs": 25, "save_steps": 500, "total_flos": 4.7279979072e+18, "trial_name": null, "trial_params": null }