{ "best_metric": 0.4006434977054596, "best_model_checkpoint": "food_beverages_japan_image_detection/checkpoint-2340", "epoch": 39.0, "eval_steps": 500, "global_step": 2340, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_accuracy": 0.6215644820295984, "eval_loss": 0.6740179657936096, "eval_runtime": 8.3101, "eval_samples_per_second": 56.919, "eval_steps_per_second": 7.22, "step": 60 }, { "epoch": 2.0, "eval_accuracy": 0.7019027484143763, "eval_loss": 0.6518784165382385, "eval_runtime": 8.3128, "eval_samples_per_second": 56.9, "eval_steps_per_second": 7.218, "step": 120 }, { "epoch": 3.0, "eval_accuracy": 0.7315010570824524, "eval_loss": 0.6313825249671936, "eval_runtime": 8.4056, "eval_samples_per_second": 56.272, "eval_steps_per_second": 7.138, "step": 180 }, { "epoch": 4.0, "eval_accuracy": 0.7378435517970402, "eval_loss": 0.6076480150222778, "eval_runtime": 8.3695, "eval_samples_per_second": 56.515, "eval_steps_per_second": 7.169, "step": 240 }, { "epoch": 5.0, "eval_accuracy": 0.7505285412262156, "eval_loss": 0.5873068571090698, "eval_runtime": 8.3314, "eval_samples_per_second": 56.773, "eval_steps_per_second": 7.202, "step": 300 }, { "epoch": 6.0, "eval_accuracy": 0.7758985200845666, "eval_loss": 0.5679311752319336, "eval_runtime": 8.239, "eval_samples_per_second": 57.41, "eval_steps_per_second": 7.282, "step": 360 }, { "epoch": 7.0, "eval_accuracy": 0.7780126849894292, "eval_loss": 0.5512701869010925, "eval_runtime": 7.9131, "eval_samples_per_second": 59.775, "eval_steps_per_second": 7.582, "step": 420 }, { "epoch": 8.0, "eval_accuracy": 0.7801268498942917, "eval_loss": 0.5363279581069946, "eval_runtime": 7.9214, "eval_samples_per_second": 59.712, "eval_steps_per_second": 7.574, "step": 480 }, { "epoch": 8.33, "learning_rate": 4.042553191489362e-06, "loss": 0.5935, "step": 500 }, { "epoch": 9.0, "eval_accuracy": 0.7843551797040169, "eval_loss": 0.5246909260749817, "eval_runtime": 7.9484, "eval_samples_per_second": 59.509, "eval_steps_per_second": 7.549, "step": 540 }, { "epoch": 10.0, "eval_accuracy": 0.7906976744186046, "eval_loss": 0.5121592283248901, "eval_runtime": 7.9961, "eval_samples_per_second": 59.154, "eval_steps_per_second": 7.504, "step": 600 }, { "epoch": 11.0, "eval_accuracy": 0.7991543340380549, "eval_loss": 0.4976297616958618, "eval_runtime": 7.9409, "eval_samples_per_second": 59.565, "eval_steps_per_second": 7.556, "step": 660 }, { "epoch": 12.0, "eval_accuracy": 0.8054968287526427, "eval_loss": 0.48714011907577515, "eval_runtime": 7.9777, "eval_samples_per_second": 59.29, "eval_steps_per_second": 7.521, "step": 720 }, { "epoch": 13.0, "eval_accuracy": 0.8033826638477801, "eval_loss": 0.47856396436691284, "eval_runtime": 8.0373, "eval_samples_per_second": 58.85, "eval_steps_per_second": 7.465, "step": 780 }, { "epoch": 14.0, "eval_accuracy": 0.8054968287526427, "eval_loss": 0.4685792028903961, "eval_runtime": 8.0022, "eval_samples_per_second": 59.109, "eval_steps_per_second": 7.498, "step": 840 }, { "epoch": 15.0, "eval_accuracy": 0.8076109936575053, "eval_loss": 0.4633488357067108, "eval_runtime": 7.897, "eval_samples_per_second": 59.896, "eval_steps_per_second": 7.598, "step": 900 }, { "epoch": 16.0, "eval_accuracy": 0.8097251585623678, "eval_loss": 0.4541207253932953, "eval_runtime": 7.9062, "eval_samples_per_second": 59.826, "eval_steps_per_second": 7.589, "step": 960 }, { "epoch": 16.67, "learning_rate": 2.978723404255319e-06, "loss": 0.3919, "step": 1000 }, { "epoch": 17.0, "eval_accuracy": 0.8181818181818182, "eval_loss": 0.44693174958229065, "eval_runtime": 7.9465, "eval_samples_per_second": 59.523, "eval_steps_per_second": 7.551, "step": 1020 }, { "epoch": 18.0, "eval_accuracy": 0.8202959830866807, "eval_loss": 0.4403076171875, "eval_runtime": 7.9729, "eval_samples_per_second": 59.326, "eval_steps_per_second": 7.526, "step": 1080 }, { "epoch": 19.0, "eval_accuracy": 0.8181818181818182, "eval_loss": 0.43559935688972473, "eval_runtime": 7.8143, "eval_samples_per_second": 60.53, "eval_steps_per_second": 7.678, "step": 1140 }, { "epoch": 20.0, "eval_accuracy": 0.8245243128964059, "eval_loss": 0.43019139766693115, "eval_runtime": 7.7993, "eval_samples_per_second": 60.646, "eval_steps_per_second": 7.693, "step": 1200 }, { "epoch": 21.0, "eval_accuracy": 0.8202959830866807, "eval_loss": 0.42576563358306885, "eval_runtime": 7.7862, "eval_samples_per_second": 60.749, "eval_steps_per_second": 7.706, "step": 1260 }, { "epoch": 22.0, "eval_accuracy": 0.8245243128964059, "eval_loss": 0.4226011633872986, "eval_runtime": 7.8089, "eval_samples_per_second": 60.572, "eval_steps_per_second": 7.684, "step": 1320 }, { "epoch": 23.0, "eval_accuracy": 0.8266384778012685, "eval_loss": 0.4196974039077759, "eval_runtime": 7.7453, "eval_samples_per_second": 61.069, "eval_steps_per_second": 7.747, "step": 1380 }, { "epoch": 24.0, "eval_accuracy": 0.8308668076109936, "eval_loss": 0.4153010845184326, "eval_runtime": 7.7967, "eval_samples_per_second": 60.667, "eval_steps_per_second": 7.696, "step": 1440 }, { "epoch": 25.0, "learning_rate": 1.9148936170212767e-06, "loss": 0.2598, "step": 1500 }, { "epoch": 25.0, "eval_accuracy": 0.8245243128964059, "eval_loss": 0.41346848011016846, "eval_runtime": 8.0165, "eval_samples_per_second": 59.003, "eval_steps_per_second": 7.485, "step": 1500 }, { "epoch": 26.0, "eval_accuracy": 0.828752642706131, "eval_loss": 0.41087058186531067, "eval_runtime": 8.2057, "eval_samples_per_second": 57.643, "eval_steps_per_second": 7.312, "step": 1560 }, { "epoch": 27.0, "eval_accuracy": 0.8350951374207188, "eval_loss": 0.410675048828125, "eval_runtime": 8.1905, "eval_samples_per_second": 57.75, "eval_steps_per_second": 7.326, "step": 1620 }, { "epoch": 28.0, "eval_accuracy": 0.8372093023255814, "eval_loss": 0.4087086319923401, "eval_runtime": 8.1633, "eval_samples_per_second": 57.942, "eval_steps_per_second": 7.35, "step": 1680 }, { "epoch": 29.0, "eval_accuracy": 0.8266384778012685, "eval_loss": 0.41004815697669983, "eval_runtime": 8.2033, "eval_samples_per_second": 57.66, "eval_steps_per_second": 7.314, "step": 1740 }, { "epoch": 30.0, "eval_accuracy": 0.8372093023255814, "eval_loss": 0.40502193570137024, "eval_runtime": 8.171, "eval_samples_per_second": 57.888, "eval_steps_per_second": 7.343, "step": 1800 }, { "epoch": 31.0, "eval_accuracy": 0.828752642706131, "eval_loss": 0.40703651309013367, "eval_runtime": 8.1556, "eval_samples_per_second": 57.997, "eval_steps_per_second": 7.357, "step": 1860 }, { "epoch": 32.0, "eval_accuracy": 0.8350951374207188, "eval_loss": 0.40481287240982056, "eval_runtime": 8.1436, "eval_samples_per_second": 58.083, "eval_steps_per_second": 7.368, "step": 1920 }, { "epoch": 33.0, "eval_accuracy": 0.8329809725158562, "eval_loss": 0.4047437608242035, "eval_runtime": 8.1259, "eval_samples_per_second": 58.209, "eval_steps_per_second": 7.384, "step": 1980 }, { "epoch": 33.33, "learning_rate": 8.510638297872341e-07, "loss": 0.1847, "step": 2000 }, { "epoch": 34.0, "eval_accuracy": 0.8329809725158562, "eval_loss": 0.4028582274913788, "eval_runtime": 8.1842, "eval_samples_per_second": 57.795, "eval_steps_per_second": 7.331, "step": 2040 }, { "epoch": 35.0, "eval_accuracy": 0.8329809725158562, "eval_loss": 0.4015713930130005, "eval_runtime": 8.1082, "eval_samples_per_second": 58.336, "eval_steps_per_second": 7.4, "step": 2100 }, { "epoch": 36.0, "eval_accuracy": 0.8329809725158562, "eval_loss": 0.4017912745475769, "eval_runtime": 8.0144, "eval_samples_per_second": 59.019, "eval_steps_per_second": 7.487, "step": 2160 }, { "epoch": 37.0, "eval_accuracy": 0.8372093023255814, "eval_loss": 0.401458203792572, "eval_runtime": 7.7426, "eval_samples_per_second": 61.091, "eval_steps_per_second": 7.749, "step": 2220 }, { "epoch": 38.0, "eval_accuracy": 0.8372093023255814, "eval_loss": 0.40120792388916016, "eval_runtime": 7.812, "eval_samples_per_second": 60.548, "eval_steps_per_second": 7.68, "step": 2280 }, { "epoch": 39.0, "eval_accuracy": 0.8372093023255814, "eval_loss": 0.4006434977054596, "eval_runtime": 7.8268, "eval_samples_per_second": 60.433, "eval_steps_per_second": 7.666, "step": 2340 } ], "logging_steps": 500, "max_steps": 2400, "num_train_epochs": 40, "save_steps": 500, "total_flos": 5.714956742086545e+18, "trial_name": null, "trial_params": null }