{ "best_metric": 2.1030609607696533, "best_model_checkpoint": "detr-r50-mist1-bg-8ah-6l/checkpoint-2875", "epoch": 25.0, "eval_steps": 500, "global_step": 2875, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "learning_rate": 9.620869565217393e-06, "loss": 3.6794, "step": 115 }, { "epoch": 1.0, "eval_loss": 2.8221545219421387, "eval_runtime": 6.0762, "eval_samples_per_second": 6.583, "eval_steps_per_second": 0.823, "step": 115 }, { "epoch": 2.0, "learning_rate": 9.224347826086957e-06, "loss": 3.0269, "step": 230 }, { "epoch": 2.0, "eval_loss": 2.8120057582855225, "eval_runtime": 5.8393, "eval_samples_per_second": 6.85, "eval_steps_per_second": 0.856, "step": 230 }, { "epoch": 3.0, "learning_rate": 8.824347826086957e-06, "loss": 2.8681, "step": 345 }, { "epoch": 3.0, "eval_loss": 2.7979869842529297, "eval_runtime": 5.8717, "eval_samples_per_second": 6.812, "eval_steps_per_second": 0.852, "step": 345 }, { "epoch": 4.0, "learning_rate": 8.424347826086958e-06, "loss": 2.752, "step": 460 }, { "epoch": 4.0, "eval_loss": 2.485291004180908, "eval_runtime": 5.9082, "eval_samples_per_second": 6.77, "eval_steps_per_second": 0.846, "step": 460 }, { "epoch": 5.0, "learning_rate": 8.027826086956523e-06, "loss": 2.7715, "step": 575 }, { "epoch": 5.0, "eval_loss": 2.413987159729004, "eval_runtime": 5.8023, "eval_samples_per_second": 6.894, "eval_steps_per_second": 0.862, "step": 575 }, { "epoch": 6.0, "learning_rate": 7.627826086956522e-06, "loss": 2.6846, "step": 690 }, { "epoch": 6.0, "eval_loss": 2.4714808464050293, "eval_runtime": 5.8424, "eval_samples_per_second": 6.847, "eval_steps_per_second": 0.856, "step": 690 }, { "epoch": 7.0, "learning_rate": 7.231304347826088e-06, "loss": 2.6236, "step": 805 }, { "epoch": 7.0, "eval_loss": 2.461406946182251, "eval_runtime": 5.862, "eval_samples_per_second": 6.824, "eval_steps_per_second": 0.853, "step": 805 }, { "epoch": 8.0, "learning_rate": 6.8313043478260874e-06, "loss": 2.5318, "step": 920 }, { "epoch": 8.0, "eval_loss": 2.3440959453582764, "eval_runtime": 5.9348, "eval_samples_per_second": 6.74, "eval_steps_per_second": 0.842, "step": 920 }, { "epoch": 9.0, "learning_rate": 6.431304347826087e-06, "loss": 2.5224, "step": 1035 }, { "epoch": 9.0, "eval_loss": 2.283745765686035, "eval_runtime": 5.872, "eval_samples_per_second": 6.812, "eval_steps_per_second": 0.851, "step": 1035 }, { "epoch": 10.0, "learning_rate": 6.031304347826088e-06, "loss": 2.4661, "step": 1150 }, { "epoch": 10.0, "eval_loss": 2.250960111618042, "eval_runtime": 5.9135, "eval_samples_per_second": 6.764, "eval_steps_per_second": 0.846, "step": 1150 }, { "epoch": 11.0, "learning_rate": 5.631304347826088e-06, "loss": 2.4313, "step": 1265 }, { "epoch": 11.0, "eval_loss": 2.333876132965088, "eval_runtime": 5.8831, "eval_samples_per_second": 6.799, "eval_steps_per_second": 0.85, "step": 1265 }, { "epoch": 12.0, "learning_rate": 5.2313043478260875e-06, "loss": 2.4125, "step": 1380 }, { "epoch": 12.0, "eval_loss": 2.2956740856170654, "eval_runtime": 5.9965, "eval_samples_per_second": 6.671, "eval_steps_per_second": 0.834, "step": 1380 }, { "epoch": 13.0, "learning_rate": 4.831304347826087e-06, "loss": 2.4113, "step": 1495 }, { "epoch": 13.0, "eval_loss": 2.235807180404663, "eval_runtime": 5.8572, "eval_samples_per_second": 6.829, "eval_steps_per_second": 0.854, "step": 1495 }, { "epoch": 14.0, "learning_rate": 4.4313043478260875e-06, "loss": 2.3784, "step": 1610 }, { "epoch": 14.0, "eval_loss": 2.263479232788086, "eval_runtime": 5.9302, "eval_samples_per_second": 6.745, "eval_steps_per_second": 0.843, "step": 1610 }, { "epoch": 15.0, "learning_rate": 4.031304347826087e-06, "loss": 2.3199, "step": 1725 }, { "epoch": 15.0, "eval_loss": 2.232009172439575, "eval_runtime": 5.8956, "eval_samples_per_second": 6.785, "eval_steps_per_second": 0.848, "step": 1725 }, { "epoch": 16.0, "learning_rate": 3.631304347826087e-06, "loss": 2.3321, "step": 1840 }, { "epoch": 16.0, "eval_loss": 2.2249927520751953, "eval_runtime": 5.9501, "eval_samples_per_second": 6.723, "eval_steps_per_second": 0.84, "step": 1840 }, { "epoch": 17.0, "learning_rate": 3.2313043478260876e-06, "loss": 2.3305, "step": 1955 }, { "epoch": 17.0, "eval_loss": 2.202038288116455, "eval_runtime": 5.8864, "eval_samples_per_second": 6.795, "eval_steps_per_second": 0.849, "step": 1955 }, { "epoch": 18.0, "learning_rate": 2.831304347826087e-06, "loss": 2.2932, "step": 2070 }, { "epoch": 18.0, "eval_loss": 2.1825520992279053, "eval_runtime": 5.8462, "eval_samples_per_second": 6.842, "eval_steps_per_second": 0.855, "step": 2070 }, { "epoch": 19.0, "learning_rate": 2.431304347826087e-06, "loss": 2.2952, "step": 2185 }, { "epoch": 19.0, "eval_loss": 2.1626458168029785, "eval_runtime": 5.963, "eval_samples_per_second": 6.708, "eval_steps_per_second": 0.839, "step": 2185 }, { "epoch": 20.0, "learning_rate": 2.0313043478260872e-06, "loss": 2.2663, "step": 2300 }, { "epoch": 20.0, "eval_loss": 2.157285213470459, "eval_runtime": 5.9246, "eval_samples_per_second": 6.751, "eval_steps_per_second": 0.844, "step": 2300 }, { "epoch": 21.0, "learning_rate": 1.631304347826087e-06, "loss": 2.2916, "step": 2415 }, { "epoch": 21.0, "eval_loss": 2.1653225421905518, "eval_runtime": 5.8815, "eval_samples_per_second": 6.801, "eval_steps_per_second": 0.85, "step": 2415 }, { "epoch": 22.0, "learning_rate": 1.231304347826087e-06, "loss": 2.2703, "step": 2530 }, { "epoch": 22.0, "eval_loss": 2.1443889141082764, "eval_runtime": 5.8599, "eval_samples_per_second": 6.826, "eval_steps_per_second": 0.853, "step": 2530 }, { "epoch": 23.0, "learning_rate": 8.347826086956523e-07, "loss": 2.2431, "step": 2645 }, { "epoch": 23.0, "eval_loss": 2.1373696327209473, "eval_runtime": 5.8436, "eval_samples_per_second": 6.845, "eval_steps_per_second": 0.856, "step": 2645 }, { "epoch": 24.0, "learning_rate": 4.347826086956522e-07, "loss": 2.2243, "step": 2760 }, { "epoch": 24.0, "eval_loss": 2.1275973320007324, "eval_runtime": 5.9461, "eval_samples_per_second": 6.727, "eval_steps_per_second": 0.841, "step": 2760 }, { "epoch": 25.0, "learning_rate": 3.478260869565218e-08, "loss": 2.2413, "step": 2875 }, { "epoch": 25.0, "eval_loss": 2.1030609607696533, "eval_runtime": 5.9121, "eval_samples_per_second": 6.766, "eval_steps_per_second": 0.846, "step": 2875 }, { "epoch": 25.0, "step": 2875, "total_flos": 5.49474551424e+18, "train_loss": 2.50671312945822, "train_runtime": 2370.7956, "train_samples_per_second": 4.851, "train_steps_per_second": 1.213 } ], "logging_steps": 500, "max_steps": 2875, "num_train_epochs": 25, "save_steps": 500, "total_flos": 5.49474551424e+18, "trial_name": null, "trial_params": null }