{ "best_metric": 0.8578052550231839, "best_model_checkpoint": "swin-base-patch4-window7-224-in22k-finetuned-memes/checkpoint-340", "epoch": 19.987654320987655, "global_step": 400, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.49, "learning_rate": 3e-05, "loss": 1.5528, "step": 10 }, { "epoch": 0.99, "learning_rate": 6e-05, "loss": 1.1655, "step": 20 }, { "epoch": 0.99, "eval_accuracy": 0.6955177743431221, "eval_f1": 0.6682587615239292, "eval_loss": 0.8572999835014343, "eval_precision": 0.6952978724784165, "eval_recall": 0.6955177743431221, "eval_runtime": 14.2645, "eval_samples_per_second": 90.715, "eval_steps_per_second": 1.472, "step": 20 }, { "epoch": 1.49, "learning_rate": 9e-05, "loss": 0.7275, "step": 30 }, { "epoch": 1.99, "learning_rate": 0.00012, "loss": 0.5506, "step": 40 }, { "epoch": 1.99, "eval_accuracy": 0.8083462132921174, "eval_f1": 0.7962870636686081, "eval_loss": 0.5326675176620483, "eval_precision": 0.8049703591765521, "eval_recall": 0.8083462132921174, "eval_runtime": 12.6486, "eval_samples_per_second": 102.304, "eval_steps_per_second": 1.66, "step": 40 }, { "epoch": 2.49, "learning_rate": 0.00011666666666666667, "loss": 0.3788, "step": 50 }, { "epoch": 2.99, "learning_rate": 0.00011333333333333333, "loss": 0.3573, "step": 60 }, { "epoch": 2.99, "eval_accuracy": 0.8338485316846986, "eval_f1": 0.831666163408815, "eval_loss": 0.4496992528438568, "eval_precision": 0.8339121233593048, "eval_recall": 0.8338485316846986, "eval_runtime": 12.8713, "eval_samples_per_second": 100.534, "eval_steps_per_second": 1.632, "step": 60 }, { "epoch": 3.49, "learning_rate": 0.00011, "loss": 0.2378, "step": 70 }, { "epoch": 3.99, "learning_rate": 0.00010666666666666667, "loss": 0.2083, "step": 80 }, { "epoch": 3.99, "eval_accuracy": 0.8353941267387944, "eval_f1": 0.8368249403721092, "eval_loss": 0.45606011152267456, "eval_precision": 0.84498910302744, "eval_recall": 0.8353941267387944, "eval_runtime": 12.8489, "eval_samples_per_second": 100.709, "eval_steps_per_second": 1.634, "step": 80 }, { "epoch": 4.49, "learning_rate": 0.00010333333333333334, "loss": 0.1314, "step": 90 }, { "epoch": 4.99, "learning_rate": 0.0001, "loss": 0.1545, "step": 100 }, { "epoch": 4.99, "eval_accuracy": 0.8423493044822257, "eval_f1": 0.8429773996176875, "eval_loss": 0.4605261981487274, "eval_precision": 0.8457880236763888, "eval_recall": 0.8423493044822257, "eval_runtime": 13.8028, "eval_samples_per_second": 93.749, "eval_steps_per_second": 1.521, "step": 100 }, { "epoch": 5.49, "learning_rate": 9.666666666666667e-05, "loss": 0.124, "step": 110 }, { "epoch": 5.99, "learning_rate": 9.333333333333334e-05, "loss": 0.1014, "step": 120 }, { "epoch": 5.99, "eval_accuracy": 0.8523956723338485, "eval_f1": 0.8538473676550408, "eval_loss": 0.4924044609069824, "eval_precision": 0.8570555975028126, "eval_recall": 0.8523956723338485, "eval_runtime": 13.153, "eval_samples_per_second": 98.381, "eval_steps_per_second": 1.597, "step": 120 }, { "epoch": 6.49, "learning_rate": 9e-05, "loss": 0.0886, "step": 130 }, { "epoch": 6.99, "learning_rate": 8.666666666666667e-05, "loss": 0.0854, "step": 140 }, { "epoch": 6.99, "eval_accuracy": 0.839258114374034, "eval_f1": 0.8399595295849303, "eval_loss": 0.575903594493866, "eval_precision": 0.8452221761378239, "eval_recall": 0.839258114374034, "eval_runtime": 12.9566, "eval_samples_per_second": 99.872, "eval_steps_per_second": 1.621, "step": 140 }, { "epoch": 7.49, "learning_rate": 8.333333333333333e-05, "loss": 0.0804, "step": 150 }, { "epoch": 7.99, "learning_rate": 7.999999999999999e-05, "loss": 0.1012, "step": 160 }, { "epoch": 7.99, "eval_accuracy": 0.8361669242658424, "eval_f1": 0.8361306593636055, "eval_loss": 0.5141878724098206, "eval_precision": 0.8378496563621973, "eval_recall": 0.8361669242658424, "eval_runtime": 12.9916, "eval_samples_per_second": 99.602, "eval_steps_per_second": 1.616, "step": 160 }, { "epoch": 8.49, "learning_rate": 7.666666666666667e-05, "loss": 0.0745, "step": 170 }, { "epoch": 8.99, "learning_rate": 7.333333333333334e-05, "loss": 0.077, "step": 180 }, { "epoch": 8.99, "eval_accuracy": 0.8330757341576507, "eval_f1": 0.8406946514001388, "eval_loss": 0.5646628141403198, "eval_precision": 0.8537522286474765, "eval_recall": 0.8330757341576507, "eval_runtime": 13.9321, "eval_samples_per_second": 92.879, "eval_steps_per_second": 1.507, "step": 180 }, { "epoch": 9.49, "learning_rate": 7.000000000000001e-05, "loss": 0.0587, "step": 190 }, { "epoch": 9.99, "learning_rate": 6.666666666666667e-05, "loss": 0.0667, "step": 200 }, { "epoch": 9.99, "eval_accuracy": 0.8462132921174652, "eval_f1": 0.8482978184490837, "eval_loss": 0.5293765068054199, "eval_precision": 0.8508576163797781, "eval_recall": 0.8462132921174652, "eval_runtime": 13.4474, "eval_samples_per_second": 96.227, "eval_steps_per_second": 1.562, "step": 200 }, { "epoch": 10.49, "learning_rate": 6.333333333333333e-05, "loss": 0.0452, "step": 210 }, { "epoch": 10.99, "learning_rate": 6e-05, "loss": 0.0666, "step": 220 }, { "epoch": 10.99, "eval_accuracy": 0.8384853168469861, "eval_f1": 0.839606513626033, "eval_loss": 0.6037518382072449, "eval_precision": 0.84149883116413, "eval_recall": 0.8384853168469861, "eval_runtime": 12.7726, "eval_samples_per_second": 101.311, "eval_steps_per_second": 1.644, "step": 220 }, { "epoch": 11.49, "learning_rate": 5.6666666666666664e-05, "loss": 0.0577, "step": 230 }, { "epoch": 11.99, "learning_rate": 5.333333333333333e-05, "loss": 0.0574, "step": 240 }, { "epoch": 11.99, "eval_accuracy": 0.8408037094281299, "eval_f1": 0.8411127335807149, "eval_loss": 0.6383613348007202, "eval_precision": 0.8431342855971845, "eval_recall": 0.8408037094281299, "eval_runtime": 13.1432, "eval_samples_per_second": 98.454, "eval_steps_per_second": 1.598, "step": 240 }, { "epoch": 12.49, "learning_rate": 5e-05, "loss": 0.0509, "step": 250 }, { "epoch": 12.99, "learning_rate": 4.666666666666667e-05, "loss": 0.0488, "step": 260 }, { "epoch": 12.99, "eval_accuracy": 0.8516228748068007, "eval_f1": 0.8532381219142173, "eval_loss": 0.6304579973220825, "eval_precision": 0.8561226939263563, "eval_recall": 0.8516228748068007, "eval_runtime": 13.6608, "eval_samples_per_second": 94.723, "eval_steps_per_second": 1.537, "step": 260 }, { "epoch": 13.49, "learning_rate": 4.3333333333333334e-05, "loss": 0.0517, "step": 270 }, { "epoch": 13.99, "learning_rate": 3.9999999999999996e-05, "loss": 0.0524, "step": 280 }, { "epoch": 13.99, "eval_accuracy": 0.8508500772797527, "eval_f1": 0.8510093409043722, "eval_loss": 0.6410980224609375, "eval_precision": 0.8526221088238606, "eval_recall": 0.8508500772797527, "eval_runtime": 12.8216, "eval_samples_per_second": 100.923, "eval_steps_per_second": 1.638, "step": 280 }, { "epoch": 14.49, "learning_rate": 3.666666666666667e-05, "loss": 0.0377, "step": 290 }, { "epoch": 14.99, "learning_rate": 3.3333333333333335e-05, "loss": 0.0511, "step": 300 }, { "epoch": 14.99, "eval_accuracy": 0.8547140649149922, "eval_f1": 0.8543059086099318, "eval_loss": 0.6461631655693054, "eval_precision": 0.8541819570387084, "eval_recall": 0.8547140649149922, "eval_runtime": 14.3489, "eval_samples_per_second": 90.181, "eval_steps_per_second": 1.464, "step": 300 }, { "epoch": 15.49, "learning_rate": 3e-05, "loss": 0.0446, "step": 310 }, { "epoch": 15.99, "learning_rate": 2.6666666666666667e-05, "loss": 0.0495, "step": 320 }, { "epoch": 15.99, "eval_accuracy": 0.8531684698608965, "eval_f1": 0.8527356330319577, "eval_loss": 0.6869231462478638, "eval_precision": 0.8533821751799587, "eval_recall": 0.8531684698608965, "eval_runtime": 12.6457, "eval_samples_per_second": 102.327, "eval_steps_per_second": 1.661, "step": 320 }, { "epoch": 16.49, "learning_rate": 2.3333333333333336e-05, "loss": 0.0489, "step": 330 }, { "epoch": 16.99, "learning_rate": 1.9999999999999998e-05, "loss": 0.0412, "step": 340 }, { "epoch": 16.99, "eval_accuracy": 0.8578052550231839, "eval_f1": 0.8563934506342421, "eval_loss": 0.6643078327178955, "eval_precision": 0.8553636638149845, "eval_recall": 0.8578052550231839, "eval_runtime": 13.1315, "eval_samples_per_second": 98.542, "eval_steps_per_second": 1.599, "step": 340 }, { "epoch": 17.49, "learning_rate": 1.6666666666666667e-05, "loss": 0.0447, "step": 350 }, { "epoch": 17.99, "learning_rate": 1.3333333333333333e-05, "loss": 0.0411, "step": 360 }, { "epoch": 17.99, "eval_accuracy": 0.857032457496136, "eval_f1": 0.8552106741098364, "eval_loss": 0.7213734984397888, "eval_precision": 0.8538988900347119, "eval_recall": 0.857032457496136, "eval_runtime": 12.729, "eval_samples_per_second": 101.658, "eval_steps_per_second": 1.65, "step": 360 }, { "epoch": 18.49, "learning_rate": 9.999999999999999e-06, "loss": 0.0411, "step": 370 }, { "epoch": 18.99, "learning_rate": 6.666666666666667e-06, "loss": 0.0434, "step": 380 }, { "epoch": 18.99, "eval_accuracy": 0.8523956723338485, "eval_f1": 0.8514088692604659, "eval_loss": 0.7037173509597778, "eval_precision": 0.850651377920994, "eval_recall": 0.8523956723338485, "eval_runtime": 13.5738, "eval_samples_per_second": 95.331, "eval_steps_per_second": 1.547, "step": 380 }, { "epoch": 19.49, "learning_rate": 3.3333333333333333e-06, "loss": 0.0445, "step": 390 }, { "epoch": 19.99, "learning_rate": 0.0, "loss": 0.0394, "step": 400 }, { "epoch": 19.99, "eval_accuracy": 0.8562596599690881, "eval_f1": 0.8552274649509984, "eval_loss": 0.7093907594680786, "eval_precision": 0.8545652818321074, "eval_recall": 0.8562596599690881, "eval_runtime": 12.9239, "eval_samples_per_second": 100.124, "eval_steps_per_second": 1.625, "step": 400 }, { "epoch": 19.99, "step": 400, "total_flos": 8.103254675374559e+18, "train_loss": 0.18201538026332856, "train_runtime": 1691.2716, "train_samples_per_second": 61.185, "train_steps_per_second": 0.237 } ], "max_steps": 400, "num_train_epochs": 20, "total_flos": 8.103254675374559e+18, "trial_name": null, "trial_params": null }