{ "best_metric": 0.3408508457201435, "best_model_checkpoint": "videomae-base-finetuned-ucf_crime/checkpoint-640", "epoch": 15.0625, "global_step": 640, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.02, "learning_rate": 7.8125e-06, "loss": 2.0077, "step": 10 }, { "epoch": 0.03, "learning_rate": 1.5625e-05, "loss": 2.0023, "step": 20 }, { "epoch": 0.05, "learning_rate": 2.34375e-05, "loss": 1.9694, "step": 30 }, { "epoch": 0.06, "learning_rate": 3.125e-05, "loss": 1.9349, "step": 40 }, { "epoch": 0.06, "eval_accuracy": 0.23321373654536134, "eval_loss": 1.9845067262649536, "eval_runtime": 283.512, "eval_samples_per_second": 6.882, "eval_steps_per_second": 1.379, "step": 40 }, { "epoch": 1.02, "learning_rate": 3.90625e-05, "loss": 1.8948, "step": 50 }, { "epoch": 1.03, "learning_rate": 4.6875e-05, "loss": 1.9233, "step": 60 }, { "epoch": 1.05, "learning_rate": 4.947916666666667e-05, "loss": 1.8999, "step": 70 }, { "epoch": 1.06, "learning_rate": 4.8611111111111115e-05, "loss": 1.8834, "step": 80 }, { "epoch": 1.06, "eval_accuracy": 0.300871348026653, "eval_loss": 1.913393259048462, "eval_runtime": 275.0254, "eval_samples_per_second": 7.094, "eval_steps_per_second": 1.422, "step": 80 }, { "epoch": 2.02, "learning_rate": 4.774305555555556e-05, "loss": 1.7494, "step": 90 }, { "epoch": 2.03, "learning_rate": 4.6875e-05, "loss": 1.8734, "step": 100 }, { "epoch": 2.05, "learning_rate": 4.6006944444444444e-05, "loss": 1.7983, "step": 110 }, { "epoch": 2.06, "learning_rate": 4.5138888888888894e-05, "loss": 1.7506, "step": 120 }, { "epoch": 2.06, "eval_accuracy": 0.3080471553049718, "eval_loss": 1.8459901809692383, "eval_runtime": 276.2962, "eval_samples_per_second": 7.061, "eval_steps_per_second": 1.415, "step": 120 }, { "epoch": 3.02, "learning_rate": 4.4270833333333337e-05, "loss": 1.7095, "step": 130 }, { "epoch": 3.03, "learning_rate": 4.340277777777778e-05, "loss": 1.7728, "step": 140 }, { "epoch": 3.05, "learning_rate": 4.253472222222222e-05, "loss": 1.6405, "step": 150 }, { "epoch": 3.06, "learning_rate": 4.166666666666667e-05, "loss": 1.6494, "step": 160 }, { "epoch": 3.06, "eval_accuracy": 0.26242952332137365, "eval_loss": 1.7690991163253784, "eval_runtime": 273.7893, "eval_samples_per_second": 7.126, "eval_steps_per_second": 1.428, "step": 160 }, { "epoch": 4.02, "learning_rate": 4.0798611111111115e-05, "loss": 1.54, "step": 170 }, { "epoch": 4.03, "learning_rate": 3.993055555555556e-05, "loss": 1.7852, "step": 180 }, { "epoch": 4.05, "learning_rate": 3.90625e-05, "loss": 1.6099, "step": 190 }, { "epoch": 4.06, "learning_rate": 3.8194444444444444e-05, "loss": 1.6189, "step": 200 }, { "epoch": 4.06, "eval_accuracy": 0.2537160430548437, "eval_loss": 1.7939332723617554, "eval_runtime": 277.3167, "eval_samples_per_second": 7.035, "eval_steps_per_second": 1.41, "step": 200 }, { "epoch": 5.02, "learning_rate": 3.7326388888888893e-05, "loss": 1.6924, "step": 210 }, { "epoch": 5.03, "learning_rate": 3.6458333333333336e-05, "loss": 1.4859, "step": 220 }, { "epoch": 5.05, "learning_rate": 3.559027777777778e-05, "loss": 1.5968, "step": 230 }, { "epoch": 5.06, "learning_rate": 3.472222222222222e-05, "loss": 1.6895, "step": 240 }, { "epoch": 5.06, "eval_accuracy": 0.2706304459251666, "eval_loss": 1.7808924913406372, "eval_runtime": 273.0904, "eval_samples_per_second": 7.144, "eval_steps_per_second": 1.432, "step": 240 }, { "epoch": 6.02, "learning_rate": 3.385416666666667e-05, "loss": 1.4744, "step": 250 }, { "epoch": 6.03, "learning_rate": 3.2986111111111115e-05, "loss": 1.4511, "step": 260 }, { "epoch": 6.05, "learning_rate": 3.211805555555556e-05, "loss": 1.5508, "step": 270 }, { "epoch": 6.06, "learning_rate": 3.125e-05, "loss": 1.517, "step": 280 }, { "epoch": 6.06, "eval_accuracy": 0.32444900051255765, "eval_loss": 1.6772902011871338, "eval_runtime": 276.0493, "eval_samples_per_second": 7.068, "eval_steps_per_second": 1.416, "step": 280 }, { "epoch": 7.02, "learning_rate": 3.0381944444444444e-05, "loss": 1.4337, "step": 290 }, { "epoch": 7.03, "learning_rate": 2.951388888888889e-05, "loss": 1.3272, "step": 300 }, { "epoch": 7.05, "learning_rate": 2.8645833333333333e-05, "loss": 1.5492, "step": 310 }, { "epoch": 7.06, "learning_rate": 2.777777777777778e-05, "loss": 1.308, "step": 320 }, { "epoch": 7.06, "eval_accuracy": 0.31522296258329063, "eval_loss": 1.8363568782806396, "eval_runtime": 279.2835, "eval_samples_per_second": 6.986, "eval_steps_per_second": 1.4, "step": 320 }, { "epoch": 8.02, "learning_rate": 2.6909722222222222e-05, "loss": 1.3879, "step": 330 }, { "epoch": 8.03, "learning_rate": 2.604166666666667e-05, "loss": 1.275, "step": 340 }, { "epoch": 8.05, "learning_rate": 2.517361111111111e-05, "loss": 1.5059, "step": 350 }, { "epoch": 8.06, "learning_rate": 2.4305555555555558e-05, "loss": 1.2267, "step": 360 }, { "epoch": 8.06, "eval_accuracy": 0.24397744746283956, "eval_loss": 2.039224147796631, "eval_runtime": 274.0654, "eval_samples_per_second": 7.119, "eval_steps_per_second": 1.427, "step": 360 }, { "epoch": 9.02, "learning_rate": 2.34375e-05, "loss": 1.1202, "step": 370 }, { "epoch": 9.03, "learning_rate": 2.2569444444444447e-05, "loss": 1.2332, "step": 380 }, { "epoch": 9.05, "learning_rate": 2.170138888888889e-05, "loss": 1.202, "step": 390 }, { "epoch": 9.06, "learning_rate": 2.0833333333333336e-05, "loss": 1.4347, "step": 400 }, { "epoch": 9.06, "eval_accuracy": 0.2450025627883137, "eval_loss": 1.9110286235809326, "eval_runtime": 276.5587, "eval_samples_per_second": 7.055, "eval_steps_per_second": 1.414, "step": 400 }, { "epoch": 10.02, "learning_rate": 1.996527777777778e-05, "loss": 1.2234, "step": 410 }, { "epoch": 10.03, "learning_rate": 1.9097222222222222e-05, "loss": 1.1313, "step": 420 }, { "epoch": 10.05, "learning_rate": 1.8229166666666668e-05, "loss": 1.0577, "step": 430 }, { "epoch": 10.06, "learning_rate": 1.736111111111111e-05, "loss": 1.1567, "step": 440 }, { "epoch": 10.06, "eval_accuracy": 0.2839569451563301, "eval_loss": 1.7605599164962769, "eval_runtime": 272.6134, "eval_samples_per_second": 7.157, "eval_steps_per_second": 1.434, "step": 440 }, { "epoch": 11.02, "learning_rate": 1.6493055555555557e-05, "loss": 0.8971, "step": 450 }, { "epoch": 11.03, "learning_rate": 1.5625e-05, "loss": 0.9622, "step": 460 }, { "epoch": 11.05, "learning_rate": 1.4756944444444445e-05, "loss": 1.0249, "step": 470 }, { "epoch": 11.06, "learning_rate": 1.388888888888889e-05, "loss": 1.1937, "step": 480 }, { "epoch": 11.06, "eval_accuracy": 0.27370579190158895, "eval_loss": 1.9803204536437988, "eval_runtime": 276.1285, "eval_samples_per_second": 7.066, "eval_steps_per_second": 1.416, "step": 480 }, { "epoch": 12.02, "learning_rate": 1.3020833333333334e-05, "loss": 1.0393, "step": 490 }, { "epoch": 12.03, "learning_rate": 1.2152777777777779e-05, "loss": 1.0307, "step": 500 }, { "epoch": 12.05, "learning_rate": 1.1284722222222223e-05, "loss": 0.9968, "step": 510 }, { "epoch": 12.06, "learning_rate": 1.0416666666666668e-05, "loss": 1.0729, "step": 520 }, { "epoch": 12.06, "eval_accuracy": 0.3352127114300359, "eval_loss": 1.8354512453079224, "eval_runtime": 279.58, "eval_samples_per_second": 6.978, "eval_steps_per_second": 1.399, "step": 520 }, { "epoch": 13.02, "learning_rate": 9.548611111111111e-06, "loss": 0.8985, "step": 530 }, { "epoch": 13.03, "learning_rate": 8.680555555555556e-06, "loss": 0.8869, "step": 540 }, { "epoch": 13.05, "learning_rate": 7.8125e-06, "loss": 0.8955, "step": 550 }, { "epoch": 13.06, "learning_rate": 6.944444444444445e-06, "loss": 1.0721, "step": 560 }, { "epoch": 13.06, "eval_accuracy": 0.33111225012813944, "eval_loss": 1.780818223953247, "eval_runtime": 273.7447, "eval_samples_per_second": 7.127, "eval_steps_per_second": 1.428, "step": 560 }, { "epoch": 14.02, "learning_rate": 6.076388888888889e-06, "loss": 0.9399, "step": 570 }, { "epoch": 14.03, "learning_rate": 5.208333333333334e-06, "loss": 0.9936, "step": 580 }, { "epoch": 14.05, "learning_rate": 4.340277777777778e-06, "loss": 0.9332, "step": 590 }, { "epoch": 14.06, "learning_rate": 3.4722222222222224e-06, "loss": 0.6594, "step": 600 }, { "epoch": 14.06, "eval_accuracy": 0.30599692465402356, "eval_loss": 1.8175382614135742, "eval_runtime": 275.653, "eval_samples_per_second": 7.078, "eval_steps_per_second": 1.418, "step": 600 }, { "epoch": 15.02, "learning_rate": 2.604166666666667e-06, "loss": 0.9107, "step": 610 }, { "epoch": 15.03, "learning_rate": 1.7361111111111112e-06, "loss": 0.8448, "step": 620 }, { "epoch": 15.05, "learning_rate": 8.680555555555556e-07, "loss": 0.8649, "step": 630 }, { "epoch": 15.06, "learning_rate": 0.0, "loss": 0.7636, "step": 640 }, { "epoch": 15.06, "eval_accuracy": 0.3408508457201435, "eval_loss": 1.8408526182174683, "eval_runtime": 276.6561, "eval_samples_per_second": 7.052, "eval_steps_per_second": 1.413, "step": 640 }, { "epoch": 15.06, "step": 640, "total_flos": 6.380135180119572e+18, "train_loss": 1.3738294385373593, "train_runtime": 5964.0785, "train_samples_per_second": 0.858, "train_steps_per_second": 0.107 }, { "epoch": 15.06, "eval_accuracy": 0.3719715956558062, "eval_loss": 1.4775745868682861, "eval_runtime": 739.4258, "eval_samples_per_second": 6.475, "eval_steps_per_second": 1.296, "step": 640 }, { "epoch": 15.06, "eval_accuracy": 0.3719715956558062, "eval_loss": 1.4775745868682861, "eval_runtime": 711.1381, "eval_samples_per_second": 6.733, "eval_steps_per_second": 1.347, "step": 640 } ], "max_steps": 640, "num_train_epochs": 9223372036854775807, "total_flos": 6.380135180119572e+18, "trial_name": null, "trial_params": null }