{ "best_metric": 0.3229311406612396, "best_model_checkpoint": "deepfake_vs_real_image_detection/checkpoint-1008", "epoch": 63.0, "eval_steps": 500, "global_step": 1008, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_accuracy": 0.7091988130563798, "eval_loss": 1.3149911165237427, "eval_runtime": 4.5396, "eval_samples_per_second": 74.236, "eval_steps_per_second": 9.472, "step": 16 }, { "epoch": 2.0, "eval_accuracy": 0.7240356083086054, "eval_loss": 1.2351125478744507, "eval_runtime": 4.5534, "eval_samples_per_second": 74.011, "eval_steps_per_second": 9.443, "step": 32 }, { "epoch": 3.0, "eval_accuracy": 0.7477744807121661, "eval_loss": 1.1467523574829102, "eval_runtime": 4.5438, "eval_samples_per_second": 74.166, "eval_steps_per_second": 9.463, "step": 48 }, { "epoch": 4.0, "eval_accuracy": 0.7566765578635015, "eval_loss": 1.0724865198135376, "eval_runtime": 4.6718, "eval_samples_per_second": 72.136, "eval_steps_per_second": 9.204, "step": 64 }, { "epoch": 5.0, "eval_accuracy": 0.7744807121661721, "eval_loss": 1.0107314586639404, "eval_runtime": 4.63, "eval_samples_per_second": 72.787, "eval_steps_per_second": 9.287, "step": 80 }, { "epoch": 6.0, "eval_accuracy": 0.7804154302670623, "eval_loss": 0.9634671211242676, "eval_runtime": 4.5376, "eval_samples_per_second": 74.268, "eval_steps_per_second": 9.476, "step": 96 }, { "epoch": 7.0, "eval_accuracy": 0.7833827893175074, "eval_loss": 0.9228468537330627, "eval_runtime": 4.533, "eval_samples_per_second": 74.344, "eval_steps_per_second": 9.486, "step": 112 }, { "epoch": 8.0, "eval_accuracy": 0.7833827893175074, "eval_loss": 0.8867318034172058, "eval_runtime": 4.5995, "eval_samples_per_second": 73.269, "eval_steps_per_second": 9.349, "step": 128 }, { "epoch": 9.0, "eval_accuracy": 0.7893175074183977, "eval_loss": 0.8541847467422485, "eval_runtime": 4.5814, "eval_samples_per_second": 73.558, "eval_steps_per_second": 9.386, "step": 144 }, { "epoch": 10.0, "eval_accuracy": 0.7893175074183977, "eval_loss": 0.8184245824813843, "eval_runtime": 4.6031, "eval_samples_per_second": 73.211, "eval_steps_per_second": 9.341, "step": 160 }, { "epoch": 11.0, "eval_accuracy": 0.7804154302670623, "eval_loss": 0.7671003341674805, "eval_runtime": 4.5853, "eval_samples_per_second": 73.496, "eval_steps_per_second": 9.378, "step": 176 }, { "epoch": 12.0, "eval_accuracy": 0.7833827893175074, "eval_loss": 0.7202329039573669, "eval_runtime": 4.5949, "eval_samples_per_second": 73.342, "eval_steps_per_second": 9.358, "step": 192 }, { "epoch": 13.0, "eval_accuracy": 0.7833827893175074, "eval_loss": 0.6835761666297913, "eval_runtime": 4.5413, "eval_samples_per_second": 74.208, "eval_steps_per_second": 9.469, "step": 208 }, { "epoch": 14.0, "eval_accuracy": 0.7863501483679525, "eval_loss": 0.6513931155204773, "eval_runtime": 4.6483, "eval_samples_per_second": 72.5, "eval_steps_per_second": 9.251, "step": 224 }, { "epoch": 15.0, "eval_accuracy": 0.7952522255192879, "eval_loss": 0.6230782866477966, "eval_runtime": 4.5993, "eval_samples_per_second": 73.272, "eval_steps_per_second": 9.349, "step": 240 }, { "epoch": 16.0, "eval_accuracy": 0.8041543026706232, "eval_loss": 0.5948796272277832, "eval_runtime": 4.5704, "eval_samples_per_second": 73.735, "eval_steps_per_second": 9.408, "step": 256 }, { "epoch": 17.0, "eval_accuracy": 0.8071216617210683, "eval_loss": 0.5689114332199097, "eval_runtime": 4.5933, "eval_samples_per_second": 73.367, "eval_steps_per_second": 9.361, "step": 272 }, { "epoch": 18.0, "eval_accuracy": 0.8130563798219584, "eval_loss": 0.5446034669876099, "eval_runtime": 4.5362, "eval_samples_per_second": 74.291, "eval_steps_per_second": 9.479, "step": 288 }, { "epoch": 19.0, "eval_accuracy": 0.8130563798219584, "eval_loss": 0.5227214097976685, "eval_runtime": 4.5669, "eval_samples_per_second": 73.791, "eval_steps_per_second": 9.415, "step": 304 }, { "epoch": 20.0, "eval_accuracy": 0.8189910979228486, "eval_loss": 0.5031161308288574, "eval_runtime": 4.5479, "eval_samples_per_second": 74.1, "eval_steps_per_second": 9.455, "step": 320 }, { "epoch": 21.0, "eval_accuracy": 0.8160237388724035, "eval_loss": 0.48820197582244873, "eval_runtime": 4.5452, "eval_samples_per_second": 74.145, "eval_steps_per_second": 9.461, "step": 336 }, { "epoch": 22.0, "eval_accuracy": 0.8130563798219584, "eval_loss": 0.47535890340805054, "eval_runtime": 4.6769, "eval_samples_per_second": 72.057, "eval_steps_per_second": 9.194, "step": 352 }, { "epoch": 23.0, "eval_accuracy": 0.8130563798219584, "eval_loss": 0.4620312452316284, "eval_runtime": 4.5546, "eval_samples_per_second": 73.992, "eval_steps_per_second": 9.441, "step": 368 }, { "epoch": 24.0, "eval_accuracy": 0.8130563798219584, "eval_loss": 0.44609472155570984, "eval_runtime": 4.562, "eval_samples_per_second": 73.87, "eval_steps_per_second": 9.426, "step": 384 }, { "epoch": 25.0, "eval_accuracy": 0.8160237388724035, "eval_loss": 0.4364510774612427, "eval_runtime": 4.6256, "eval_samples_per_second": 72.855, "eval_steps_per_second": 9.296, "step": 400 }, { "epoch": 26.0, "eval_accuracy": 0.8249258160237388, "eval_loss": 0.42621392011642456, "eval_runtime": 4.5891, "eval_samples_per_second": 73.434, "eval_steps_per_second": 9.37, "step": 416 }, { "epoch": 27.0, "eval_accuracy": 0.827893175074184, "eval_loss": 0.4176171123981476, "eval_runtime": 4.7205, "eval_samples_per_second": 71.39, "eval_steps_per_second": 9.109, "step": 432 }, { "epoch": 28.0, "eval_accuracy": 0.8338278931750742, "eval_loss": 0.40912118554115295, "eval_runtime": 4.6413, "eval_samples_per_second": 72.609, "eval_steps_per_second": 9.265, "step": 448 }, { "epoch": 29.0, "eval_accuracy": 0.8397626112759644, "eval_loss": 0.40831413865089417, "eval_runtime": 4.5637, "eval_samples_per_second": 73.843, "eval_steps_per_second": 9.422, "step": 464 }, { "epoch": 30.0, "eval_accuracy": 0.8397626112759644, "eval_loss": 0.40189576148986816, "eval_runtime": 4.6019, "eval_samples_per_second": 73.23, "eval_steps_per_second": 9.344, "step": 480 }, { "epoch": 31.0, "eval_accuracy": 0.8427299703264095, "eval_loss": 0.39464861154556274, "eval_runtime": 4.5459, "eval_samples_per_second": 74.133, "eval_steps_per_second": 9.459, "step": 496 }, { "epoch": 31.25, "grad_norm": 2.8177223205566406, "learning_rate": 8.098055790363483e-07, "loss": 0.7287, "step": 500 }, { "epoch": 32.0, "eval_accuracy": 0.8427299703264095, "eval_loss": 0.38916730880737305, "eval_runtime": 4.6237, "eval_samples_per_second": 72.886, "eval_steps_per_second": 9.3, "step": 512 }, { "epoch": 33.0, "eval_accuracy": 0.8516320474777448, "eval_loss": 0.3844282031059265, "eval_runtime": 4.5824, "eval_samples_per_second": 73.542, "eval_steps_per_second": 9.384, "step": 528 }, { "epoch": 34.0, "eval_accuracy": 0.8516320474777448, "eval_loss": 0.37861311435699463, "eval_runtime": 4.5644, "eval_samples_per_second": 73.833, "eval_steps_per_second": 9.421, "step": 544 }, { "epoch": 35.0, "eval_accuracy": 0.8516320474777448, "eval_loss": 0.3732515275478363, "eval_runtime": 4.5962, "eval_samples_per_second": 73.322, "eval_steps_per_second": 9.356, "step": 560 }, { "epoch": 36.0, "eval_accuracy": 0.8516320474777448, "eval_loss": 0.37023723125457764, "eval_runtime": 4.5345, "eval_samples_per_second": 74.319, "eval_steps_per_second": 9.483, "step": 576 }, { "epoch": 37.0, "eval_accuracy": 0.8605341246290801, "eval_loss": 0.36356887221336365, "eval_runtime": 4.6253, "eval_samples_per_second": 72.86, "eval_steps_per_second": 9.297, "step": 592 }, { "epoch": 38.0, "eval_accuracy": 0.8635014836795252, "eval_loss": 0.35962143540382385, "eval_runtime": 4.5862, "eval_samples_per_second": 73.482, "eval_steps_per_second": 9.376, "step": 608 }, { "epoch": 39.0, "eval_accuracy": 0.8605341246290801, "eval_loss": 0.3568034768104553, "eval_runtime": 4.5393, "eval_samples_per_second": 74.241, "eval_steps_per_second": 9.473, "step": 624 }, { "epoch": 40.0, "eval_accuracy": 0.8516320474777448, "eval_loss": 0.35836362838745117, "eval_runtime": 4.5145, "eval_samples_per_second": 74.649, "eval_steps_per_second": 9.525, "step": 640 }, { "epoch": 41.0, "eval_accuracy": 0.857566765578635, "eval_loss": 0.35482144355773926, "eval_runtime": 4.5734, "eval_samples_per_second": 73.687, "eval_steps_per_second": 9.402, "step": 656 }, { "epoch": 42.0, "eval_accuracy": 0.857566765578635, "eval_loss": 0.3515448272228241, "eval_runtime": 4.5679, "eval_samples_per_second": 73.776, "eval_steps_per_second": 9.414, "step": 672 }, { "epoch": 43.0, "eval_accuracy": 0.8605341246290801, "eval_loss": 0.3470025658607483, "eval_runtime": 4.5874, "eval_samples_per_second": 73.462, "eval_steps_per_second": 9.374, "step": 688 }, { "epoch": 44.0, "eval_accuracy": 0.8664688427299704, "eval_loss": 0.3467743992805481, "eval_runtime": 4.6426, "eval_samples_per_second": 72.589, "eval_steps_per_second": 9.262, "step": 704 }, { "epoch": 45.0, "eval_accuracy": 0.8664688427299704, "eval_loss": 0.3463208079338074, "eval_runtime": 4.5833, "eval_samples_per_second": 73.528, "eval_steps_per_second": 9.382, "step": 720 }, { "epoch": 46.0, "eval_accuracy": 0.8664688427299704, "eval_loss": 0.3457556664943695, "eval_runtime": 4.6971, "eval_samples_per_second": 71.746, "eval_steps_per_second": 9.155, "step": 736 }, { "epoch": 47.0, "eval_accuracy": 0.8664688427299704, "eval_loss": 0.3446126878261566, "eval_runtime": 4.5645, "eval_samples_per_second": 73.831, "eval_steps_per_second": 9.421, "step": 752 }, { "epoch": 48.0, "eval_accuracy": 0.8664688427299704, "eval_loss": 0.34248268604278564, "eval_runtime": 4.5812, "eval_samples_per_second": 73.561, "eval_steps_per_second": 9.386, "step": 768 }, { "epoch": 49.0, "eval_accuracy": 0.8694362017804155, "eval_loss": 0.3440556824207306, "eval_runtime": 4.5663, "eval_samples_per_second": 73.802, "eval_steps_per_second": 9.417, "step": 784 }, { "epoch": 50.0, "eval_accuracy": 0.8664688427299704, "eval_loss": 0.3455652594566345, "eval_runtime": 4.5263, "eval_samples_per_second": 74.454, "eval_steps_per_second": 9.5, "step": 800 }, { "epoch": 51.0, "eval_accuracy": 0.8724035608308606, "eval_loss": 0.3401181697845459, "eval_runtime": 4.5842, "eval_samples_per_second": 73.513, "eval_steps_per_second": 9.38, "step": 816 }, { "epoch": 52.0, "eval_accuracy": 0.8724035608308606, "eval_loss": 0.33749544620513916, "eval_runtime": 4.5545, "eval_samples_per_second": 73.993, "eval_steps_per_second": 9.441, "step": 832 }, { "epoch": 53.0, "eval_accuracy": 0.8724035608308606, "eval_loss": 0.33886510133743286, "eval_runtime": 4.6181, "eval_samples_per_second": 72.974, "eval_steps_per_second": 9.311, "step": 848 }, { "epoch": 54.0, "eval_accuracy": 0.8724035608308606, "eval_loss": 0.33066779375076294, "eval_runtime": 4.6066, "eval_samples_per_second": 73.155, "eval_steps_per_second": 9.334, "step": 864 }, { "epoch": 55.0, "eval_accuracy": 0.8724035608308606, "eval_loss": 0.3285369575023651, "eval_runtime": 4.6615, "eval_samples_per_second": 72.294, "eval_steps_per_second": 9.224, "step": 880 }, { "epoch": 56.0, "eval_accuracy": 0.8724035608308606, "eval_loss": 0.3319447338581085, "eval_runtime": 4.6422, "eval_samples_per_second": 72.594, "eval_steps_per_second": 9.263, "step": 896 }, { "epoch": 57.0, "eval_accuracy": 0.8724035608308606, "eval_loss": 0.33194291591644287, "eval_runtime": 4.5847, "eval_samples_per_second": 73.506, "eval_steps_per_second": 9.379, "step": 912 }, { "epoch": 58.0, "eval_accuracy": 0.8724035608308606, "eval_loss": 0.33001473546028137, "eval_runtime": 4.546, "eval_samples_per_second": 74.131, "eval_steps_per_second": 9.459, "step": 928 }, { "epoch": 59.0, "eval_accuracy": 0.8753709198813057, "eval_loss": 0.32828956842422485, "eval_runtime": 4.5976, "eval_samples_per_second": 73.299, "eval_steps_per_second": 9.353, "step": 944 }, { "epoch": 60.0, "eval_accuracy": 0.8753709198813057, "eval_loss": 0.3273901641368866, "eval_runtime": 4.6205, "eval_samples_per_second": 72.936, "eval_steps_per_second": 9.306, "step": 960 }, { "epoch": 61.0, "eval_accuracy": 0.8753709198813057, "eval_loss": 0.32634109258651733, "eval_runtime": 4.5578, "eval_samples_per_second": 73.94, "eval_steps_per_second": 9.434, "step": 976 }, { "epoch": 62.0, "eval_accuracy": 0.8753709198813057, "eval_loss": 0.3289165496826172, "eval_runtime": 4.6025, "eval_samples_per_second": 73.22, "eval_steps_per_second": 9.343, "step": 992 }, { "epoch": 62.5, "grad_norm": 2.3223371505737305, "learning_rate": 5.984784446322908e-07, "loss": 0.2023, "step": 1000 }, { "epoch": 63.0, "eval_accuracy": 0.8783382789317508, "eval_loss": 0.3229311406612396, "eval_runtime": 4.5765, "eval_samples_per_second": 73.637, "eval_steps_per_second": 9.396, "step": 1008 } ], "logging_steps": 500, "max_steps": 2416, "num_input_tokens_seen": 0, "num_train_epochs": 151, "save_steps": 500, "total_flos": 2.4654076495882445e+18, "train_batch_size": 32, "trial_name": null, "trial_params": null }