{ "best_metric": 0.8737166324435318, "best_model_checkpoint": "vc-bantai-vit-withoutAMBI-adunest-v1/checkpoint-1800", "epoch": 12.048192771084338, "global_step": 3000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.4, "eval_accuracy": 0.40811088295687886, "eval_loss": 1.2037091255187988, "eval_runtime": 11.1902, "eval_samples_per_second": 174.08, "eval_steps_per_second": 5.451, "step": 100 }, { "epoch": 0.8, "eval_accuracy": 0.44096509240246407, "eval_loss": 0.9935279488563538, "eval_runtime": 11.2125, "eval_samples_per_second": 173.734, "eval_steps_per_second": 5.44, "step": 200 }, { "epoch": 1.2, "eval_accuracy": 0.6914784394250514, "eval_loss": 0.6460596323013306, "eval_runtime": 11.4894, "eval_samples_per_second": 169.547, "eval_steps_per_second": 5.309, "step": 300 }, { "epoch": 1.61, "eval_accuracy": 0.7705338809034907, "eval_loss": 0.49376896023750305, "eval_runtime": 11.1511, "eval_samples_per_second": 174.691, "eval_steps_per_second": 5.47, "step": 400 }, { "epoch": 2.01, "learning_rate": 0.0004949799196787149, "loss": 0.357, "step": 500 }, { "epoch": 2.01, "eval_accuracy": 0.784394250513347, "eval_loss": 0.4601840376853943, "eval_runtime": 11.4476, "eval_samples_per_second": 170.167, "eval_steps_per_second": 5.329, "step": 500 }, { "epoch": 2.41, "eval_accuracy": 0.7294661190965093, "eval_loss": 0.5220066905021667, "eval_runtime": 11.1921, "eval_samples_per_second": 174.052, "eval_steps_per_second": 5.45, "step": 600 }, { "epoch": 2.81, "eval_accuracy": 0.7782340862422998, "eval_loss": 0.46649423241615295, "eval_runtime": 11.2377, "eval_samples_per_second": 173.346, "eval_steps_per_second": 5.428, "step": 700 }, { "epoch": 3.21, "eval_accuracy": 0.830082135523614, "eval_loss": 0.44400569796562195, "eval_runtime": 11.2183, "eval_samples_per_second": 173.645, "eval_steps_per_second": 5.438, "step": 800 }, { "epoch": 3.61, "eval_accuracy": 0.7176591375770021, "eval_loss": 0.5121513605117798, "eval_runtime": 11.196, "eval_samples_per_second": 173.991, "eval_steps_per_second": 5.448, "step": 900 }, { "epoch": 4.02, "learning_rate": 0.0004899598393574297, "loss": 0.2437, "step": 1000 }, { "epoch": 4.02, "eval_accuracy": 0.7320328542094456, "eval_loss": 0.6155115962028503, "eval_runtime": 11.2061, "eval_samples_per_second": 173.833, "eval_steps_per_second": 5.443, "step": 1000 }, { "epoch": 4.42, "eval_accuracy": 0.7684804928131417, "eval_loss": 0.5802133679389954, "eval_runtime": 11.2176, "eval_samples_per_second": 173.655, "eval_steps_per_second": 5.438, "step": 1100 }, { "epoch": 4.82, "eval_accuracy": 0.8028747433264887, "eval_loss": 0.47085943818092346, "eval_runtime": 11.2201, "eval_samples_per_second": 173.617, "eval_steps_per_second": 5.437, "step": 1200 }, { "epoch": 5.22, "eval_accuracy": 0.8352156057494866, "eval_loss": 0.4694225490093231, "eval_runtime": 11.2031, "eval_samples_per_second": 173.881, "eval_steps_per_second": 5.445, "step": 1300 }, { "epoch": 5.62, "eval_accuracy": 0.8203285420944558, "eval_loss": 0.46516597270965576, "eval_runtime": 11.1655, "eval_samples_per_second": 174.467, "eval_steps_per_second": 5.463, "step": 1400 }, { "epoch": 6.02, "learning_rate": 0.0004849397590361446, "loss": 0.1841, "step": 1500 }, { "epoch": 6.02, "eval_accuracy": 0.7648870636550308, "eval_loss": 0.5424289107322693, "eval_runtime": 11.2414, "eval_samples_per_second": 173.288, "eval_steps_per_second": 5.426, "step": 1500 }, { "epoch": 6.43, "eval_accuracy": 0.8059548254620124, "eval_loss": 0.46159353852272034, "eval_runtime": 11.1678, "eval_samples_per_second": 174.43, "eval_steps_per_second": 5.462, "step": 1600 }, { "epoch": 6.83, "eval_accuracy": 0.8547227926078029, "eval_loss": 0.35685229301452637, "eval_runtime": 11.2186, "eval_samples_per_second": 173.64, "eval_steps_per_second": 5.437, "step": 1700 }, { "epoch": 7.23, "eval_accuracy": 0.8737166324435318, "eval_loss": 0.36519739031791687, "eval_runtime": 11.1645, "eval_samples_per_second": 174.481, "eval_steps_per_second": 5.464, "step": 1800 }, { "epoch": 7.63, "eval_accuracy": 0.7438398357289527, "eval_loss": 0.7777961492538452, "eval_runtime": 11.2328, "eval_samples_per_second": 173.421, "eval_steps_per_second": 5.431, "step": 1900 }, { "epoch": 8.03, "learning_rate": 0.0004799196787148594, "loss": 0.1328, "step": 2000 }, { "epoch": 8.03, "eval_accuracy": 0.8162217659137577, "eval_loss": 0.546014666557312, "eval_runtime": 11.2154, "eval_samples_per_second": 173.689, "eval_steps_per_second": 5.439, "step": 2000 }, { "epoch": 8.43, "eval_accuracy": 0.776694045174538, "eval_loss": 0.8070306777954102, "eval_runtime": 11.1916, "eval_samples_per_second": 174.06, "eval_steps_per_second": 5.451, "step": 2100 }, { "epoch": 8.84, "eval_accuracy": 0.7797741273100616, "eval_loss": 0.6872759461402893, "eval_runtime": 11.206, "eval_samples_per_second": 173.835, "eval_steps_per_second": 5.444, "step": 2200 }, { "epoch": 9.24, "eval_accuracy": 0.7782340862422998, "eval_loss": 0.8942956328392029, "eval_runtime": 11.1451, "eval_samples_per_second": 174.785, "eval_steps_per_second": 5.473, "step": 2300 }, { "epoch": 9.64, "eval_accuracy": 0.8552361396303901, "eval_loss": 0.5378373265266418, "eval_runtime": 11.1452, "eval_samples_per_second": 174.784, "eval_steps_per_second": 5.473, "step": 2400 }, { "epoch": 10.04, "learning_rate": 0.0004748995983935743, "loss": 0.1059, "step": 2500 }, { "epoch": 10.04, "eval_accuracy": 0.8069815195071869, "eval_loss": 0.7080937623977661, "eval_runtime": 11.2065, "eval_samples_per_second": 173.828, "eval_steps_per_second": 5.443, "step": 2500 }, { "epoch": 10.44, "eval_accuracy": 0.7012320328542094, "eval_loss": 0.994149923324585, "eval_runtime": 11.1681, "eval_samples_per_second": 174.426, "eval_steps_per_second": 5.462, "step": 2600 }, { "epoch": 10.84, "eval_accuracy": 0.7900410677618069, "eval_loss": 0.9151853919029236, "eval_runtime": 11.2106, "eval_samples_per_second": 173.764, "eval_steps_per_second": 5.441, "step": 2700 }, { "epoch": 11.24, "eval_accuracy": 0.7736139630390144, "eval_loss": 0.7493842244148254, "eval_runtime": 11.1841, "eval_samples_per_second": 174.175, "eval_steps_per_second": 5.454, "step": 2800 }, { "epoch": 11.65, "eval_accuracy": 0.7869609856262834, "eval_loss": 0.7680638432502747, "eval_runtime": 11.2188, "eval_samples_per_second": 173.636, "eval_steps_per_second": 5.437, "step": 2900 }, { "epoch": 12.05, "learning_rate": 0.0004698795180722892, "loss": 0.081, "step": 3000 }, { "epoch": 12.05, "eval_accuracy": 0.8039014373716632, "eval_loss": 0.7735891342163086, "eval_runtime": 11.4086, "eval_samples_per_second": 170.748, "eval_steps_per_second": 5.347, "step": 3000 }, { "epoch": 12.05, "step": 3000, "total_flos": 7.416049873230029e+18, "train_loss": 0.18408180872599283, "train_runtime": 1888.403, "train_samples_per_second": 841.24, "train_steps_per_second": 26.371 } ], "max_steps": 49800, "num_train_epochs": 200, "total_flos": 7.416049873230029e+18, "trial_name": null, "trial_params": null }