|
{ |
|
"best_metric": 0.3229311406612396, |
|
"best_model_checkpoint": "deepfake_vs_real_image_detection/checkpoint-1008", |
|
"epoch": 63.0, |
|
"eval_steps": 500, |
|
"global_step": 1008, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.7091988130563798, |
|
"eval_loss": 1.3149911165237427, |
|
"eval_runtime": 4.5396, |
|
"eval_samples_per_second": 74.236, |
|
"eval_steps_per_second": 9.472, |
|
"step": 16 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.7240356083086054, |
|
"eval_loss": 1.2351125478744507, |
|
"eval_runtime": 4.5534, |
|
"eval_samples_per_second": 74.011, |
|
"eval_steps_per_second": 9.443, |
|
"step": 32 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.7477744807121661, |
|
"eval_loss": 1.1467523574829102, |
|
"eval_runtime": 4.5438, |
|
"eval_samples_per_second": 74.166, |
|
"eval_steps_per_second": 9.463, |
|
"step": 48 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.7566765578635015, |
|
"eval_loss": 1.0724865198135376, |
|
"eval_runtime": 4.6718, |
|
"eval_samples_per_second": 72.136, |
|
"eval_steps_per_second": 9.204, |
|
"step": 64 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.7744807121661721, |
|
"eval_loss": 1.0107314586639404, |
|
"eval_runtime": 4.63, |
|
"eval_samples_per_second": 72.787, |
|
"eval_steps_per_second": 9.287, |
|
"step": 80 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.7804154302670623, |
|
"eval_loss": 0.9634671211242676, |
|
"eval_runtime": 4.5376, |
|
"eval_samples_per_second": 74.268, |
|
"eval_steps_per_second": 9.476, |
|
"step": 96 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_accuracy": 0.7833827893175074, |
|
"eval_loss": 0.9228468537330627, |
|
"eval_runtime": 4.533, |
|
"eval_samples_per_second": 74.344, |
|
"eval_steps_per_second": 9.486, |
|
"step": 112 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.7833827893175074, |
|
"eval_loss": 0.8867318034172058, |
|
"eval_runtime": 4.5995, |
|
"eval_samples_per_second": 73.269, |
|
"eval_steps_per_second": 9.349, |
|
"step": 128 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_accuracy": 0.7893175074183977, |
|
"eval_loss": 0.8541847467422485, |
|
"eval_runtime": 4.5814, |
|
"eval_samples_per_second": 73.558, |
|
"eval_steps_per_second": 9.386, |
|
"step": 144 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_accuracy": 0.7893175074183977, |
|
"eval_loss": 0.8184245824813843, |
|
"eval_runtime": 4.6031, |
|
"eval_samples_per_second": 73.211, |
|
"eval_steps_per_second": 9.341, |
|
"step": 160 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_accuracy": 0.7804154302670623, |
|
"eval_loss": 0.7671003341674805, |
|
"eval_runtime": 4.5853, |
|
"eval_samples_per_second": 73.496, |
|
"eval_steps_per_second": 9.378, |
|
"step": 176 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_accuracy": 0.7833827893175074, |
|
"eval_loss": 0.7202329039573669, |
|
"eval_runtime": 4.5949, |
|
"eval_samples_per_second": 73.342, |
|
"eval_steps_per_second": 9.358, |
|
"step": 192 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_accuracy": 0.7833827893175074, |
|
"eval_loss": 0.6835761666297913, |
|
"eval_runtime": 4.5413, |
|
"eval_samples_per_second": 74.208, |
|
"eval_steps_per_second": 9.469, |
|
"step": 208 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_accuracy": 0.7863501483679525, |
|
"eval_loss": 0.6513931155204773, |
|
"eval_runtime": 4.6483, |
|
"eval_samples_per_second": 72.5, |
|
"eval_steps_per_second": 9.251, |
|
"step": 224 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_accuracy": 0.7952522255192879, |
|
"eval_loss": 0.6230782866477966, |
|
"eval_runtime": 4.5993, |
|
"eval_samples_per_second": 73.272, |
|
"eval_steps_per_second": 9.349, |
|
"step": 240 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_accuracy": 0.8041543026706232, |
|
"eval_loss": 0.5948796272277832, |
|
"eval_runtime": 4.5704, |
|
"eval_samples_per_second": 73.735, |
|
"eval_steps_per_second": 9.408, |
|
"step": 256 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_accuracy": 0.8071216617210683, |
|
"eval_loss": 0.5689114332199097, |
|
"eval_runtime": 4.5933, |
|
"eval_samples_per_second": 73.367, |
|
"eval_steps_per_second": 9.361, |
|
"step": 272 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_accuracy": 0.8130563798219584, |
|
"eval_loss": 0.5446034669876099, |
|
"eval_runtime": 4.5362, |
|
"eval_samples_per_second": 74.291, |
|
"eval_steps_per_second": 9.479, |
|
"step": 288 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_accuracy": 0.8130563798219584, |
|
"eval_loss": 0.5227214097976685, |
|
"eval_runtime": 4.5669, |
|
"eval_samples_per_second": 73.791, |
|
"eval_steps_per_second": 9.415, |
|
"step": 304 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_accuracy": 0.8189910979228486, |
|
"eval_loss": 0.5031161308288574, |
|
"eval_runtime": 4.5479, |
|
"eval_samples_per_second": 74.1, |
|
"eval_steps_per_second": 9.455, |
|
"step": 320 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"eval_accuracy": 0.8160237388724035, |
|
"eval_loss": 0.48820197582244873, |
|
"eval_runtime": 4.5452, |
|
"eval_samples_per_second": 74.145, |
|
"eval_steps_per_second": 9.461, |
|
"step": 336 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"eval_accuracy": 0.8130563798219584, |
|
"eval_loss": 0.47535890340805054, |
|
"eval_runtime": 4.6769, |
|
"eval_samples_per_second": 72.057, |
|
"eval_steps_per_second": 9.194, |
|
"step": 352 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"eval_accuracy": 0.8130563798219584, |
|
"eval_loss": 0.4620312452316284, |
|
"eval_runtime": 4.5546, |
|
"eval_samples_per_second": 73.992, |
|
"eval_steps_per_second": 9.441, |
|
"step": 368 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_accuracy": 0.8130563798219584, |
|
"eval_loss": 0.44609472155570984, |
|
"eval_runtime": 4.562, |
|
"eval_samples_per_second": 73.87, |
|
"eval_steps_per_second": 9.426, |
|
"step": 384 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_accuracy": 0.8160237388724035, |
|
"eval_loss": 0.4364510774612427, |
|
"eval_runtime": 4.6256, |
|
"eval_samples_per_second": 72.855, |
|
"eval_steps_per_second": 9.296, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"eval_accuracy": 0.8249258160237388, |
|
"eval_loss": 0.42621392011642456, |
|
"eval_runtime": 4.5891, |
|
"eval_samples_per_second": 73.434, |
|
"eval_steps_per_second": 9.37, |
|
"step": 416 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"eval_accuracy": 0.827893175074184, |
|
"eval_loss": 0.4176171123981476, |
|
"eval_runtime": 4.7205, |
|
"eval_samples_per_second": 71.39, |
|
"eval_steps_per_second": 9.109, |
|
"step": 432 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"eval_accuracy": 0.8338278931750742, |
|
"eval_loss": 0.40912118554115295, |
|
"eval_runtime": 4.6413, |
|
"eval_samples_per_second": 72.609, |
|
"eval_steps_per_second": 9.265, |
|
"step": 448 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"eval_accuracy": 0.8397626112759644, |
|
"eval_loss": 0.40831413865089417, |
|
"eval_runtime": 4.5637, |
|
"eval_samples_per_second": 73.843, |
|
"eval_steps_per_second": 9.422, |
|
"step": 464 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"eval_accuracy": 0.8397626112759644, |
|
"eval_loss": 0.40189576148986816, |
|
"eval_runtime": 4.6019, |
|
"eval_samples_per_second": 73.23, |
|
"eval_steps_per_second": 9.344, |
|
"step": 480 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"eval_accuracy": 0.8427299703264095, |
|
"eval_loss": 0.39464861154556274, |
|
"eval_runtime": 4.5459, |
|
"eval_samples_per_second": 74.133, |
|
"eval_steps_per_second": 9.459, |
|
"step": 496 |
|
}, |
|
{ |
|
"epoch": 31.25, |
|
"grad_norm": 2.8177223205566406, |
|
"learning_rate": 8.098055790363483e-07, |
|
"loss": 0.7287, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"eval_accuracy": 0.8427299703264095, |
|
"eval_loss": 0.38916730880737305, |
|
"eval_runtime": 4.6237, |
|
"eval_samples_per_second": 72.886, |
|
"eval_steps_per_second": 9.3, |
|
"step": 512 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"eval_accuracy": 0.8516320474777448, |
|
"eval_loss": 0.3844282031059265, |
|
"eval_runtime": 4.5824, |
|
"eval_samples_per_second": 73.542, |
|
"eval_steps_per_second": 9.384, |
|
"step": 528 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"eval_accuracy": 0.8516320474777448, |
|
"eval_loss": 0.37861311435699463, |
|
"eval_runtime": 4.5644, |
|
"eval_samples_per_second": 73.833, |
|
"eval_steps_per_second": 9.421, |
|
"step": 544 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"eval_accuracy": 0.8516320474777448, |
|
"eval_loss": 0.3732515275478363, |
|
"eval_runtime": 4.5962, |
|
"eval_samples_per_second": 73.322, |
|
"eval_steps_per_second": 9.356, |
|
"step": 560 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"eval_accuracy": 0.8516320474777448, |
|
"eval_loss": 0.37023723125457764, |
|
"eval_runtime": 4.5345, |
|
"eval_samples_per_second": 74.319, |
|
"eval_steps_per_second": 9.483, |
|
"step": 576 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"eval_accuracy": 0.8605341246290801, |
|
"eval_loss": 0.36356887221336365, |
|
"eval_runtime": 4.6253, |
|
"eval_samples_per_second": 72.86, |
|
"eval_steps_per_second": 9.297, |
|
"step": 592 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"eval_accuracy": 0.8635014836795252, |
|
"eval_loss": 0.35962143540382385, |
|
"eval_runtime": 4.5862, |
|
"eval_samples_per_second": 73.482, |
|
"eval_steps_per_second": 9.376, |
|
"step": 608 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"eval_accuracy": 0.8605341246290801, |
|
"eval_loss": 0.3568034768104553, |
|
"eval_runtime": 4.5393, |
|
"eval_samples_per_second": 74.241, |
|
"eval_steps_per_second": 9.473, |
|
"step": 624 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"eval_accuracy": 0.8516320474777448, |
|
"eval_loss": 0.35836362838745117, |
|
"eval_runtime": 4.5145, |
|
"eval_samples_per_second": 74.649, |
|
"eval_steps_per_second": 9.525, |
|
"step": 640 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"eval_accuracy": 0.857566765578635, |
|
"eval_loss": 0.35482144355773926, |
|
"eval_runtime": 4.5734, |
|
"eval_samples_per_second": 73.687, |
|
"eval_steps_per_second": 9.402, |
|
"step": 656 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"eval_accuracy": 0.857566765578635, |
|
"eval_loss": 0.3515448272228241, |
|
"eval_runtime": 4.5679, |
|
"eval_samples_per_second": 73.776, |
|
"eval_steps_per_second": 9.414, |
|
"step": 672 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"eval_accuracy": 0.8605341246290801, |
|
"eval_loss": 0.3470025658607483, |
|
"eval_runtime": 4.5874, |
|
"eval_samples_per_second": 73.462, |
|
"eval_steps_per_second": 9.374, |
|
"step": 688 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"eval_accuracy": 0.8664688427299704, |
|
"eval_loss": 0.3467743992805481, |
|
"eval_runtime": 4.6426, |
|
"eval_samples_per_second": 72.589, |
|
"eval_steps_per_second": 9.262, |
|
"step": 704 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"eval_accuracy": 0.8664688427299704, |
|
"eval_loss": 0.3463208079338074, |
|
"eval_runtime": 4.5833, |
|
"eval_samples_per_second": 73.528, |
|
"eval_steps_per_second": 9.382, |
|
"step": 720 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"eval_accuracy": 0.8664688427299704, |
|
"eval_loss": 0.3457556664943695, |
|
"eval_runtime": 4.6971, |
|
"eval_samples_per_second": 71.746, |
|
"eval_steps_per_second": 9.155, |
|
"step": 736 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"eval_accuracy": 0.8664688427299704, |
|
"eval_loss": 0.3446126878261566, |
|
"eval_runtime": 4.5645, |
|
"eval_samples_per_second": 73.831, |
|
"eval_steps_per_second": 9.421, |
|
"step": 752 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"eval_accuracy": 0.8664688427299704, |
|
"eval_loss": 0.34248268604278564, |
|
"eval_runtime": 4.5812, |
|
"eval_samples_per_second": 73.561, |
|
"eval_steps_per_second": 9.386, |
|
"step": 768 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"eval_accuracy": 0.8694362017804155, |
|
"eval_loss": 0.3440556824207306, |
|
"eval_runtime": 4.5663, |
|
"eval_samples_per_second": 73.802, |
|
"eval_steps_per_second": 9.417, |
|
"step": 784 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"eval_accuracy": 0.8664688427299704, |
|
"eval_loss": 0.3455652594566345, |
|
"eval_runtime": 4.5263, |
|
"eval_samples_per_second": 74.454, |
|
"eval_steps_per_second": 9.5, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"eval_accuracy": 0.8724035608308606, |
|
"eval_loss": 0.3401181697845459, |
|
"eval_runtime": 4.5842, |
|
"eval_samples_per_second": 73.513, |
|
"eval_steps_per_second": 9.38, |
|
"step": 816 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"eval_accuracy": 0.8724035608308606, |
|
"eval_loss": 0.33749544620513916, |
|
"eval_runtime": 4.5545, |
|
"eval_samples_per_second": 73.993, |
|
"eval_steps_per_second": 9.441, |
|
"step": 832 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"eval_accuracy": 0.8724035608308606, |
|
"eval_loss": 0.33886510133743286, |
|
"eval_runtime": 4.6181, |
|
"eval_samples_per_second": 72.974, |
|
"eval_steps_per_second": 9.311, |
|
"step": 848 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"eval_accuracy": 0.8724035608308606, |
|
"eval_loss": 0.33066779375076294, |
|
"eval_runtime": 4.6066, |
|
"eval_samples_per_second": 73.155, |
|
"eval_steps_per_second": 9.334, |
|
"step": 864 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"eval_accuracy": 0.8724035608308606, |
|
"eval_loss": 0.3285369575023651, |
|
"eval_runtime": 4.6615, |
|
"eval_samples_per_second": 72.294, |
|
"eval_steps_per_second": 9.224, |
|
"step": 880 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"eval_accuracy": 0.8724035608308606, |
|
"eval_loss": 0.3319447338581085, |
|
"eval_runtime": 4.6422, |
|
"eval_samples_per_second": 72.594, |
|
"eval_steps_per_second": 9.263, |
|
"step": 896 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"eval_accuracy": 0.8724035608308606, |
|
"eval_loss": 0.33194291591644287, |
|
"eval_runtime": 4.5847, |
|
"eval_samples_per_second": 73.506, |
|
"eval_steps_per_second": 9.379, |
|
"step": 912 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"eval_accuracy": 0.8724035608308606, |
|
"eval_loss": 0.33001473546028137, |
|
"eval_runtime": 4.546, |
|
"eval_samples_per_second": 74.131, |
|
"eval_steps_per_second": 9.459, |
|
"step": 928 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"eval_accuracy": 0.8753709198813057, |
|
"eval_loss": 0.32828956842422485, |
|
"eval_runtime": 4.5976, |
|
"eval_samples_per_second": 73.299, |
|
"eval_steps_per_second": 9.353, |
|
"step": 944 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"eval_accuracy": 0.8753709198813057, |
|
"eval_loss": 0.3273901641368866, |
|
"eval_runtime": 4.6205, |
|
"eval_samples_per_second": 72.936, |
|
"eval_steps_per_second": 9.306, |
|
"step": 960 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"eval_accuracy": 0.8753709198813057, |
|
"eval_loss": 0.32634109258651733, |
|
"eval_runtime": 4.5578, |
|
"eval_samples_per_second": 73.94, |
|
"eval_steps_per_second": 9.434, |
|
"step": 976 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"eval_accuracy": 0.8753709198813057, |
|
"eval_loss": 0.3289165496826172, |
|
"eval_runtime": 4.6025, |
|
"eval_samples_per_second": 73.22, |
|
"eval_steps_per_second": 9.343, |
|
"step": 992 |
|
}, |
|
{ |
|
"epoch": 62.5, |
|
"grad_norm": 2.3223371505737305, |
|
"learning_rate": 5.984784446322908e-07, |
|
"loss": 0.2023, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"eval_accuracy": 0.8783382789317508, |
|
"eval_loss": 0.3229311406612396, |
|
"eval_runtime": 4.5765, |
|
"eval_samples_per_second": 73.637, |
|
"eval_steps_per_second": 9.396, |
|
"step": 1008 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 2416, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 151, |
|
"save_steps": 500, |
|
"total_flos": 2.4654076495882445e+18, |
|
"train_batch_size": 32, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|