{ "best_metric": 0.6960989202368513, "best_model_checkpoint": "google-vit-base-patch16-224-face/checkpoint-712", "epoch": 7.991643454038997, "global_step": 712, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.11, "learning_rate": 1.6666666666666667e-05, "loss": 0.9691, "step": 10 }, { "epoch": 0.22, "learning_rate": 3.3333333333333335e-05, "loss": 0.9687, "step": 20 }, { "epoch": 0.33, "learning_rate": 5e-05, "loss": 0.9727, "step": 30 }, { "epoch": 0.45, "learning_rate": 6.666666666666667e-05, "loss": 0.9245, "step": 40 }, { "epoch": 0.56, "learning_rate": 8.333333333333333e-05, "loss": 0.8955, "step": 50 }, { "epoch": 0.67, "learning_rate": 0.0001, "loss": 0.8887, "step": 60 }, { "epoch": 0.78, "learning_rate": 0.00011666666666666667, "loss": 0.8827, "step": 70 }, { "epoch": 0.89, "learning_rate": 0.00011850000000000001, "loss": 0.8364, "step": 80 }, { "epoch": 0.99, "eval_accuracy": 0.648380355276907, "eval_f1": 0.6385482827611145, "eval_loss": 0.9452694654464722, "eval_precision": 0.6461904026185493, "eval_recall": 0.648380355276907, "eval_runtime": 32.7545, "eval_samples_per_second": 175.304, "eval_steps_per_second": 2.748, "step": 89 }, { "epoch": 1.01, "learning_rate": 0.000116625, "loss": 0.9165, "step": 90 }, { "epoch": 1.12, "learning_rate": 0.00011475000000000001, "loss": 0.765, "step": 100 }, { "epoch": 1.23, "learning_rate": 0.000112875, "loss": 0.7639, "step": 110 }, { "epoch": 1.35, "learning_rate": 0.00011100000000000001, "loss": 0.7557, "step": 120 }, { "epoch": 1.46, "learning_rate": 0.00010912500000000001, "loss": 0.7494, "step": 130 }, { "epoch": 1.57, "learning_rate": 0.00010725, "loss": 0.7363, "step": 140 }, { "epoch": 1.68, "learning_rate": 0.00010537500000000001, "loss": 0.7147, "step": 150 }, { "epoch": 1.79, "learning_rate": 0.00010350000000000001, "loss": 0.7283, "step": 160 }, { "epoch": 1.9, "learning_rate": 0.000101625, "loss": 0.7433, "step": 170 }, { "epoch": 1.99, "eval_accuracy": 0.6778126088470916, "eval_f1": 0.672969661980768, "eval_loss": 0.8876001834869385, "eval_precision": 0.679362397138447, "eval_recall": 0.6778126088470916, "eval_runtime": 37.9557, "eval_samples_per_second": 151.282, "eval_steps_per_second": 2.371, "step": 178 }, { "epoch": 2.02, "learning_rate": 9.975000000000001e-05, "loss": 0.7192, "step": 180 }, { "epoch": 2.13, "learning_rate": 9.787500000000001e-05, "loss": 0.5258, "step": 190 }, { "epoch": 2.25, "learning_rate": 9.6e-05, "loss": 0.5159, "step": 200 }, { "epoch": 2.36, "learning_rate": 9.412500000000001e-05, "loss": 0.5151, "step": 210 }, { "epoch": 2.47, "learning_rate": 9.225e-05, "loss": 0.5134, "step": 220 }, { "epoch": 2.58, "learning_rate": 9.0375e-05, "loss": 0.4776, "step": 230 }, { "epoch": 2.69, "learning_rate": 8.850000000000001e-05, "loss": 0.5188, "step": 240 }, { "epoch": 2.8, "learning_rate": 8.6625e-05, "loss": 0.5312, "step": 250 }, { "epoch": 2.91, "learning_rate": 8.475000000000001e-05, "loss": 0.4732, "step": 260 }, { "epoch": 2.99, "eval_accuracy": 0.6872169975618252, "eval_f1": 0.6840932939913709, "eval_loss": 0.9042980670928955, "eval_precision": 0.6906579200512205, "eval_recall": 0.6872169975618252, "eval_runtime": 32.8137, "eval_samples_per_second": 174.988, "eval_steps_per_second": 2.743, "step": 267 }, { "epoch": 3.03, "learning_rate": 8.287500000000001e-05, "loss": 0.4772, "step": 270 }, { "epoch": 3.14, "learning_rate": 8.1e-05, "loss": 0.299, "step": 280 }, { "epoch": 3.26, "learning_rate": 7.912500000000001e-05, "loss": 0.2614, "step": 290 }, { "epoch": 3.37, "learning_rate": 7.725000000000001e-05, "loss": 0.2679, "step": 300 }, { "epoch": 3.48, "learning_rate": 7.5375e-05, "loss": 0.2992, "step": 310 }, { "epoch": 3.59, "learning_rate": 7.350000000000001e-05, "loss": 0.2835, "step": 320 }, { "epoch": 3.7, "learning_rate": 7.1625e-05, "loss": 0.2752, "step": 330 }, { "epoch": 3.81, "learning_rate": 6.975e-05, "loss": 0.27, "step": 340 }, { "epoch": 3.92, "learning_rate": 6.787500000000001e-05, "loss": 0.2861, "step": 350 }, { "epoch": 3.99, "eval_accuracy": 0.6847788227098572, "eval_f1": 0.6813474424826861, "eval_loss": 0.9865238666534424, "eval_precision": 0.6808262458026351, "eval_recall": 0.6847788227098572, "eval_runtime": 34.0061, "eval_samples_per_second": 168.852, "eval_steps_per_second": 2.647, "step": 356 }, { "epoch": 4.04, "learning_rate": 6.6e-05, "loss": 0.2485, "step": 360 }, { "epoch": 4.16, "learning_rate": 6.412500000000001e-05, "loss": 0.1212, "step": 370 }, { "epoch": 4.27, "learning_rate": 6.225000000000001e-05, "loss": 0.121, "step": 380 }, { "epoch": 4.38, "learning_rate": 6.0375000000000004e-05, "loss": 0.131, "step": 390 }, { "epoch": 4.49, "learning_rate": 5.85e-05, "loss": 0.1192, "step": 400 }, { "epoch": 4.6, "learning_rate": 5.6625e-05, "loss": 0.1137, "step": 410 }, { "epoch": 4.71, "learning_rate": 5.475e-05, "loss": 0.1334, "step": 420 }, { "epoch": 4.82, "learning_rate": 5.2875e-05, "loss": 0.1285, "step": 430 }, { "epoch": 4.94, "learning_rate": 5.1e-05, "loss": 0.1234, "step": 440 }, { "epoch": 4.99, "eval_accuracy": 0.6853012887495646, "eval_f1": 0.6871627462072427, "eval_loss": 1.1047998666763306, "eval_precision": 0.6907009316583976, "eval_recall": 0.6853012887495646, "eval_runtime": 32.6937, "eval_samples_per_second": 175.63, "eval_steps_per_second": 2.753, "step": 445 }, { "epoch": 5.06, "learning_rate": 4.9125e-05, "loss": 0.1018, "step": 450 }, { "epoch": 5.17, "learning_rate": 4.7249999999999997e-05, "loss": 0.053, "step": 460 }, { "epoch": 5.28, "learning_rate": 4.5375e-05, "loss": 0.0495, "step": 470 }, { "epoch": 5.39, "learning_rate": 4.35e-05, "loss": 0.052, "step": 480 }, { "epoch": 5.5, "learning_rate": 4.1625e-05, "loss": 0.0597, "step": 490 }, { "epoch": 5.61, "learning_rate": 3.975e-05, "loss": 0.0548, "step": 500 }, { "epoch": 5.72, "learning_rate": 3.7875e-05, "loss": 0.0619, "step": 510 }, { "epoch": 5.84, "learning_rate": 3.6e-05, "loss": 0.0627, "step": 520 }, { "epoch": 5.95, "learning_rate": 3.4125e-05, "loss": 0.0599, "step": 530 }, { "epoch": 5.99, "eval_accuracy": 0.6889585510275166, "eval_f1": 0.6876003709723829, "eval_loss": 1.2361745834350586, "eval_precision": 0.6897347831759311, "eval_recall": 0.6889585510275166, "eval_runtime": 34.0898, "eval_samples_per_second": 168.437, "eval_steps_per_second": 2.64, "step": 534 }, { "epoch": 6.07, "learning_rate": 3.225e-05, "loss": 0.0431, "step": 540 }, { "epoch": 6.18, "learning_rate": 3.0375e-05, "loss": 0.033, "step": 550 }, { "epoch": 6.29, "learning_rate": 2.8499999999999998e-05, "loss": 0.0332, "step": 560 }, { "epoch": 6.4, "learning_rate": 2.6625e-05, "loss": 0.0315, "step": 570 }, { "epoch": 6.51, "learning_rate": 2.475e-05, "loss": 0.0305, "step": 580 }, { "epoch": 6.62, "learning_rate": 2.2875e-05, "loss": 0.0243, "step": 590 }, { "epoch": 6.74, "learning_rate": 2.1e-05, "loss": 0.0241, "step": 600 }, { "epoch": 6.85, "learning_rate": 1.9125e-05, "loss": 0.0206, "step": 610 }, { "epoch": 6.96, "learning_rate": 1.725e-05, "loss": 0.0289, "step": 620 }, { "epoch": 6.99, "eval_accuracy": 0.6931382793451759, "eval_f1": 0.6921150248707686, "eval_loss": 1.3140767812728882, "eval_precision": 0.6925717262836596, "eval_recall": 0.6931382793451759, "eval_runtime": 33.0395, "eval_samples_per_second": 173.792, "eval_steps_per_second": 2.724, "step": 623 }, { "epoch": 7.08, "learning_rate": 1.5374999999999998e-05, "loss": 0.0185, "step": 630 }, { "epoch": 7.19, "learning_rate": 1.3500000000000001e-05, "loss": 0.0132, "step": 640 }, { "epoch": 7.3, "learning_rate": 1.1625000000000001e-05, "loss": 0.014, "step": 650 }, { "epoch": 7.41, "learning_rate": 9.75e-06, "loss": 0.0121, "step": 660 }, { "epoch": 7.52, "learning_rate": 7.875e-06, "loss": 0.0203, "step": 670 }, { "epoch": 7.64, "learning_rate": 6e-06, "loss": 0.0103, "step": 680 }, { "epoch": 7.75, "learning_rate": 4.125e-06, "loss": 0.0178, "step": 690 }, { "epoch": 7.86, "learning_rate": 2.25e-06, "loss": 0.0126, "step": 700 }, { "epoch": 7.97, "learning_rate": 3.75e-07, "loss": 0.0134, "step": 710 }, { "epoch": 7.99, "eval_accuracy": 0.6960989202368513, "eval_f1": 0.6957934361657124, "eval_loss": 1.3257348537445068, "eval_precision": 0.6966334506335445, "eval_recall": 0.6960989202368513, "eval_runtime": 37.8195, "eval_samples_per_second": 151.827, "eval_steps_per_second": 2.38, "step": 712 }, { "epoch": 7.99, "step": 712, "total_flos": 1.4224524590735456e+19, "train_loss": 0.3359685759269371, "train_runtime": 2345.2254, "train_samples_per_second": 78.345, "train_steps_per_second": 0.304 } ], "max_steps": 712, "num_train_epochs": 8, "total_flos": 1.4224524590735456e+19, "trial_name": null, "trial_params": null }