{ "best_metric": 0.8653846153846154, "best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned-phones/checkpoint-135", "epoch": 28.0, "eval_steps": 500, "global_step": 210, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.9333333333333333, "eval_accuracy": 0.5673076923076923, "eval_loss": 0.6742563247680664, "eval_runtime": 1.0496, "eval_samples_per_second": 99.088, "eval_steps_per_second": 3.811, "step": 7 }, { "epoch": 1.3333333333333333, "grad_norm": 5.86643123626709, "learning_rate": 2.380952380952381e-05, "loss": 0.6763, "step": 10 }, { "epoch": 2.0, "eval_accuracy": 0.6923076923076923, "eval_loss": 0.6165803670883179, "eval_runtime": 0.6494, "eval_samples_per_second": 160.146, "eval_steps_per_second": 6.159, "step": 15 }, { "epoch": 2.6666666666666665, "grad_norm": 6.109733581542969, "learning_rate": 4.761904761904762e-05, "loss": 0.635, "step": 20 }, { "epoch": 2.9333333333333336, "eval_accuracy": 0.7403846153846154, "eval_loss": 0.5646082758903503, "eval_runtime": 0.7406, "eval_samples_per_second": 140.428, "eval_steps_per_second": 5.401, "step": 22 }, { "epoch": 4.0, "grad_norm": 14.055779457092285, "learning_rate": 4.761904761904762e-05, "loss": 0.5724, "step": 30 }, { "epoch": 4.0, "eval_accuracy": 0.7307692307692307, "eval_loss": 0.5073935985565186, "eval_runtime": 0.6701, "eval_samples_per_second": 155.19, "eval_steps_per_second": 5.969, "step": 30 }, { "epoch": 4.933333333333334, "eval_accuracy": 0.7692307692307693, "eval_loss": 0.48087915778160095, "eval_runtime": 0.6729, "eval_samples_per_second": 154.555, "eval_steps_per_second": 5.944, "step": 37 }, { "epoch": 5.333333333333333, "grad_norm": 8.836523056030273, "learning_rate": 4.4973544973544974e-05, "loss": 0.527, "step": 40 }, { "epoch": 6.0, "eval_accuracy": 0.7692307692307693, "eval_loss": 0.45965665578842163, "eval_runtime": 0.6926, "eval_samples_per_second": 150.153, "eval_steps_per_second": 5.775, "step": 45 }, { "epoch": 6.666666666666667, "grad_norm": 6.653749465942383, "learning_rate": 4.232804232804233e-05, "loss": 0.5304, "step": 50 }, { "epoch": 6.933333333333334, "eval_accuracy": 0.7596153846153846, "eval_loss": 0.47583022713661194, "eval_runtime": 0.681, "eval_samples_per_second": 152.716, "eval_steps_per_second": 5.874, "step": 52 }, { "epoch": 8.0, "grad_norm": 13.230646133422852, "learning_rate": 3.968253968253968e-05, "loss": 0.4597, "step": 60 }, { "epoch": 8.0, "eval_accuracy": 0.7884615384615384, "eval_loss": 0.43429186940193176, "eval_runtime": 0.7692, "eval_samples_per_second": 135.213, "eval_steps_per_second": 5.2, "step": 60 }, { "epoch": 8.933333333333334, "eval_accuracy": 0.7980769230769231, "eval_loss": 0.42488300800323486, "eval_runtime": 0.6816, "eval_samples_per_second": 152.578, "eval_steps_per_second": 5.868, "step": 67 }, { "epoch": 9.333333333333334, "grad_norm": 8.930418968200684, "learning_rate": 3.7037037037037037e-05, "loss": 0.4606, "step": 70 }, { "epoch": 10.0, "eval_accuracy": 0.7980769230769231, "eval_loss": 0.42358094453811646, "eval_runtime": 0.6708, "eval_samples_per_second": 155.044, "eval_steps_per_second": 5.963, "step": 75 }, { "epoch": 10.666666666666666, "grad_norm": 10.609027862548828, "learning_rate": 3.439153439153439e-05, "loss": 0.4286, "step": 80 }, { "epoch": 10.933333333333334, "eval_accuracy": 0.8461538461538461, "eval_loss": 0.4054819643497467, "eval_runtime": 0.6768, "eval_samples_per_second": 153.664, "eval_steps_per_second": 5.91, "step": 82 }, { "epoch": 12.0, "grad_norm": 5.532287120819092, "learning_rate": 3.1746031746031745e-05, "loss": 0.3857, "step": 90 }, { "epoch": 12.0, "eval_accuracy": 0.8269230769230769, "eval_loss": 0.4144248962402344, "eval_runtime": 0.7584, "eval_samples_per_second": 137.132, "eval_steps_per_second": 5.274, "step": 90 }, { "epoch": 12.933333333333334, "eval_accuracy": 0.7980769230769231, "eval_loss": 0.4293949007987976, "eval_runtime": 0.6743, "eval_samples_per_second": 154.239, "eval_steps_per_second": 5.932, "step": 97 }, { "epoch": 13.333333333333334, "grad_norm": 11.760865211486816, "learning_rate": 2.91005291005291e-05, "loss": 0.3801, "step": 100 }, { "epoch": 14.0, "eval_accuracy": 0.8461538461538461, "eval_loss": 0.40805691480636597, "eval_runtime": 0.6845, "eval_samples_per_second": 151.929, "eval_steps_per_second": 5.843, "step": 105 }, { "epoch": 14.666666666666666, "grad_norm": 11.491521835327148, "learning_rate": 2.6455026455026456e-05, "loss": 0.3538, "step": 110 }, { "epoch": 14.933333333333334, "eval_accuracy": 0.8461538461538461, "eval_loss": 0.4194793403148651, "eval_runtime": 0.674, "eval_samples_per_second": 154.298, "eval_steps_per_second": 5.935, "step": 112 }, { "epoch": 16.0, "grad_norm": 11.567109107971191, "learning_rate": 2.380952380952381e-05, "loss": 0.3585, "step": 120 }, { "epoch": 16.0, "eval_accuracy": 0.8557692307692307, "eval_loss": 0.4068710207939148, "eval_runtime": 0.7839, "eval_samples_per_second": 132.667, "eval_steps_per_second": 5.103, "step": 120 }, { "epoch": 16.933333333333334, "eval_accuracy": 0.8557692307692307, "eval_loss": 0.3970623016357422, "eval_runtime": 0.6669, "eval_samples_per_second": 155.948, "eval_steps_per_second": 5.998, "step": 127 }, { "epoch": 17.333333333333332, "grad_norm": 12.216808319091797, "learning_rate": 2.1164021164021164e-05, "loss": 0.3258, "step": 130 }, { "epoch": 18.0, "eval_accuracy": 0.8653846153846154, "eval_loss": 0.39384937286376953, "eval_runtime": 0.6899, "eval_samples_per_second": 150.747, "eval_steps_per_second": 5.798, "step": 135 }, { "epoch": 18.666666666666668, "grad_norm": 15.223637580871582, "learning_rate": 1.8518518518518518e-05, "loss": 0.3288, "step": 140 }, { "epoch": 18.933333333333334, "eval_accuracy": 0.8461538461538461, "eval_loss": 0.396359384059906, "eval_runtime": 0.6861, "eval_samples_per_second": 151.574, "eval_steps_per_second": 5.83, "step": 142 }, { "epoch": 20.0, "grad_norm": 25.446683883666992, "learning_rate": 1.5873015873015872e-05, "loss": 0.3276, "step": 150 }, { "epoch": 20.0, "eval_accuracy": 0.8557692307692307, "eval_loss": 0.44233372807502747, "eval_runtime": 0.6969, "eval_samples_per_second": 149.226, "eval_steps_per_second": 5.739, "step": 150 }, { "epoch": 20.933333333333334, "eval_accuracy": 0.8365384615384616, "eval_loss": 0.40670448541641235, "eval_runtime": 0.7625, "eval_samples_per_second": 136.392, "eval_steps_per_second": 5.246, "step": 157 }, { "epoch": 21.333333333333332, "grad_norm": 10.679701805114746, "learning_rate": 1.3227513227513228e-05, "loss": 0.317, "step": 160 }, { "epoch": 22.0, "eval_accuracy": 0.8653846153846154, "eval_loss": 0.4178958535194397, "eval_runtime": 0.6933, "eval_samples_per_second": 150.017, "eval_steps_per_second": 5.77, "step": 165 }, { "epoch": 22.666666666666668, "grad_norm": 12.451942443847656, "learning_rate": 1.0582010582010582e-05, "loss": 0.288, "step": 170 }, { "epoch": 22.933333333333334, "eval_accuracy": 0.8557692307692307, "eval_loss": 0.3881677985191345, "eval_runtime": 0.6592, "eval_samples_per_second": 157.766, "eval_steps_per_second": 6.068, "step": 172 }, { "epoch": 24.0, "grad_norm": 11.666213989257812, "learning_rate": 7.936507936507936e-06, "loss": 0.2735, "step": 180 }, { "epoch": 24.0, "eval_accuracy": 0.8557692307692307, "eval_loss": 0.42146697640419006, "eval_runtime": 0.6742, "eval_samples_per_second": 154.246, "eval_steps_per_second": 5.933, "step": 180 }, { "epoch": 24.933333333333334, "eval_accuracy": 0.8461538461538461, "eval_loss": 0.3971670866012573, "eval_runtime": 0.7934, "eval_samples_per_second": 131.085, "eval_steps_per_second": 5.042, "step": 187 }, { "epoch": 25.333333333333332, "grad_norm": 7.033930778503418, "learning_rate": 5.291005291005291e-06, "loss": 0.2805, "step": 190 }, { "epoch": 26.0, "eval_accuracy": 0.8557692307692307, "eval_loss": 0.3943334221839905, "eval_runtime": 0.6986, "eval_samples_per_second": 148.874, "eval_steps_per_second": 5.726, "step": 195 }, { "epoch": 26.666666666666668, "grad_norm": 5.698335647583008, "learning_rate": 2.6455026455026455e-06, "loss": 0.2961, "step": 200 }, { "epoch": 26.933333333333334, "eval_accuracy": 0.8557692307692307, "eval_loss": 0.39985355734825134, "eval_runtime": 0.691, "eval_samples_per_second": 150.514, "eval_steps_per_second": 5.789, "step": 202 }, { "epoch": 28.0, "grad_norm": 9.678221702575684, "learning_rate": 0.0, "loss": 0.2832, "step": 210 }, { "epoch": 28.0, "eval_accuracy": 0.8557692307692307, "eval_loss": 0.4042527377605438, "eval_runtime": 0.6919, "eval_samples_per_second": 150.307, "eval_steps_per_second": 5.781, "step": 210 }, { "epoch": 28.0, "step": 210, "total_flos": 6.51425759341314e+17, "train_loss": 0.4042152370725359, "train_runtime": 453.861, "train_samples_per_second": 61.869, "train_steps_per_second": 0.463 } ], "logging_steps": 10, "max_steps": 210, "num_input_tokens_seen": 0, "num_train_epochs": 30, "save_steps": 500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 6.51425759341314e+17, "train_batch_size": 32, "trial_name": null, "trial_params": null }