net_dfm_myimg / checkpoint-1392 /trainer_state.json
VINAYAK MODI
Upload folder using huggingface_hub
f871afb verified
raw
history blame
22 kB
{
"best_metric": 0.33774590492248535,
"best_model_checkpoint": "deepfake_vs_real_image_detection/checkpoint-1392",
"epoch": 87.0,
"eval_steps": 500,
"global_step": 1392,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_accuracy": 0.6765578635014837,
"eval_loss": 1.4959243535995483,
"eval_runtime": 4.5936,
"eval_samples_per_second": 73.362,
"eval_steps_per_second": 9.361,
"step": 16
},
{
"epoch": 2.0,
"eval_accuracy": 0.6913946587537092,
"eval_loss": 1.4148070812225342,
"eval_runtime": 5.1723,
"eval_samples_per_second": 65.154,
"eval_steps_per_second": 8.313,
"step": 32
},
{
"epoch": 3.0,
"eval_accuracy": 0.7091988130563798,
"eval_loss": 1.309860348701477,
"eval_runtime": 4.8265,
"eval_samples_per_second": 69.823,
"eval_steps_per_second": 8.909,
"step": 48
},
{
"epoch": 4.0,
"eval_accuracy": 0.7240356083086054,
"eval_loss": 1.2197798490524292,
"eval_runtime": 4.7427,
"eval_samples_per_second": 71.057,
"eval_steps_per_second": 9.067,
"step": 64
},
{
"epoch": 5.0,
"eval_accuracy": 0.7477744807121661,
"eval_loss": 1.1465003490447998,
"eval_runtime": 4.8571,
"eval_samples_per_second": 69.383,
"eval_steps_per_second": 8.853,
"step": 80
},
{
"epoch": 6.0,
"eval_accuracy": 0.7655786350148368,
"eval_loss": 1.0904771089553833,
"eval_runtime": 4.7162,
"eval_samples_per_second": 71.456,
"eval_steps_per_second": 9.118,
"step": 96
},
{
"epoch": 7.0,
"eval_accuracy": 0.7626112759643917,
"eval_loss": 1.0423768758773804,
"eval_runtime": 4.7414,
"eval_samples_per_second": 71.077,
"eval_steps_per_second": 9.069,
"step": 112
},
{
"epoch": 8.0,
"eval_accuracy": 0.7626112759643917,
"eval_loss": 0.9944449067115784,
"eval_runtime": 4.7288,
"eval_samples_per_second": 71.265,
"eval_steps_per_second": 9.093,
"step": 128
},
{
"epoch": 9.0,
"eval_accuracy": 0.7626112759643917,
"eval_loss": 0.9456853270530701,
"eval_runtime": 4.6848,
"eval_samples_per_second": 71.935,
"eval_steps_per_second": 9.179,
"step": 144
},
{
"epoch": 10.0,
"eval_accuracy": 0.7626112759643917,
"eval_loss": 0.8957338333129883,
"eval_runtime": 4.7194,
"eval_samples_per_second": 71.407,
"eval_steps_per_second": 9.111,
"step": 160
},
{
"epoch": 11.0,
"eval_accuracy": 0.7626112759643917,
"eval_loss": 0.852699875831604,
"eval_runtime": 4.7114,
"eval_samples_per_second": 71.529,
"eval_steps_per_second": 9.127,
"step": 176
},
{
"epoch": 12.0,
"eval_accuracy": 0.7626112759643917,
"eval_loss": 0.815643310546875,
"eval_runtime": 4.7006,
"eval_samples_per_second": 71.694,
"eval_steps_per_second": 9.148,
"step": 192
},
{
"epoch": 13.0,
"eval_accuracy": 0.771513353115727,
"eval_loss": 0.7831457853317261,
"eval_runtime": 4.7983,
"eval_samples_per_second": 70.233,
"eval_steps_per_second": 8.961,
"step": 208
},
{
"epoch": 14.0,
"eval_accuracy": 0.7744807121661721,
"eval_loss": 0.7558016180992126,
"eval_runtime": 4.7359,
"eval_samples_per_second": 71.159,
"eval_steps_per_second": 9.08,
"step": 224
},
{
"epoch": 15.0,
"eval_accuracy": 0.7744807121661721,
"eval_loss": 0.7284858226776123,
"eval_runtime": 4.6713,
"eval_samples_per_second": 72.143,
"eval_steps_per_second": 9.205,
"step": 240
},
{
"epoch": 16.0,
"eval_accuracy": 0.7744807121661721,
"eval_loss": 0.6914460062980652,
"eval_runtime": 4.7809,
"eval_samples_per_second": 70.489,
"eval_steps_per_second": 8.994,
"step": 256
},
{
"epoch": 17.0,
"eval_accuracy": 0.7774480712166172,
"eval_loss": 0.6581370830535889,
"eval_runtime": 4.7253,
"eval_samples_per_second": 71.318,
"eval_steps_per_second": 9.1,
"step": 272
},
{
"epoch": 18.0,
"eval_accuracy": 0.7804154302670623,
"eval_loss": 0.6323521733283997,
"eval_runtime": 4.7945,
"eval_samples_per_second": 70.289,
"eval_steps_per_second": 8.969,
"step": 288
},
{
"epoch": 19.0,
"eval_accuracy": 0.7774480712166172,
"eval_loss": 0.6072251796722412,
"eval_runtime": 4.8798,
"eval_samples_per_second": 69.06,
"eval_steps_per_second": 8.812,
"step": 304
},
{
"epoch": 20.0,
"eval_accuracy": 0.7804154302670623,
"eval_loss": 0.5835662484169006,
"eval_runtime": 4.6039,
"eval_samples_per_second": 73.199,
"eval_steps_per_second": 9.34,
"step": 320
},
{
"epoch": 21.0,
"eval_accuracy": 0.7922848664688428,
"eval_loss": 0.5593723654747009,
"eval_runtime": 4.7955,
"eval_samples_per_second": 70.274,
"eval_steps_per_second": 8.967,
"step": 336
},
{
"epoch": 22.0,
"eval_accuracy": 0.7922848664688428,
"eval_loss": 0.5364292860031128,
"eval_runtime": 4.8089,
"eval_samples_per_second": 70.078,
"eval_steps_per_second": 8.942,
"step": 352
},
{
"epoch": 23.0,
"eval_accuracy": 0.7952522255192879,
"eval_loss": 0.5182026028633118,
"eval_runtime": 4.6149,
"eval_samples_per_second": 73.024,
"eval_steps_per_second": 9.318,
"step": 368
},
{
"epoch": 24.0,
"eval_accuracy": 0.8041543026706232,
"eval_loss": 0.504047691822052,
"eval_runtime": 4.5605,
"eval_samples_per_second": 73.895,
"eval_steps_per_second": 9.429,
"step": 384
},
{
"epoch": 25.0,
"eval_accuracy": 0.8041543026706232,
"eval_loss": 0.4920850694179535,
"eval_runtime": 4.6821,
"eval_samples_per_second": 71.976,
"eval_steps_per_second": 9.184,
"step": 400
},
{
"epoch": 26.0,
"eval_accuracy": 0.8160237388724035,
"eval_loss": 0.48037412762641907,
"eval_runtime": 4.7178,
"eval_samples_per_second": 71.432,
"eval_steps_per_second": 9.114,
"step": 416
},
{
"epoch": 27.0,
"eval_accuracy": 0.8189910979228486,
"eval_loss": 0.4688655138015747,
"eval_runtime": 4.6086,
"eval_samples_per_second": 73.124,
"eval_steps_per_second": 9.33,
"step": 432
},
{
"epoch": 28.0,
"eval_accuracy": 0.8249258160237388,
"eval_loss": 0.4574899971485138,
"eval_runtime": 4.6369,
"eval_samples_per_second": 72.678,
"eval_steps_per_second": 9.273,
"step": 448
},
{
"epoch": 29.0,
"eval_accuracy": 0.827893175074184,
"eval_loss": 0.448953777551651,
"eval_runtime": 4.7138,
"eval_samples_per_second": 71.491,
"eval_steps_per_second": 9.122,
"step": 464
},
{
"epoch": 30.0,
"eval_accuracy": 0.827893175074184,
"eval_loss": 0.4414035379886627,
"eval_runtime": 4.7192,
"eval_samples_per_second": 71.41,
"eval_steps_per_second": 9.112,
"step": 480
},
{
"epoch": 31.0,
"eval_accuracy": 0.827893175074184,
"eval_loss": 0.4335722029209137,
"eval_runtime": 4.6675,
"eval_samples_per_second": 72.202,
"eval_steps_per_second": 9.213,
"step": 496
},
{
"epoch": 31.25,
"grad_norm": 2.672912120819092,
"learning_rate": 7.096774193548387e-07,
"loss": 0.6719,
"step": 500
},
{
"epoch": 32.0,
"eval_accuracy": 0.8219584569732937,
"eval_loss": 0.43041178584098816,
"eval_runtime": 4.7762,
"eval_samples_per_second": 70.559,
"eval_steps_per_second": 9.003,
"step": 512
},
{
"epoch": 33.0,
"eval_accuracy": 0.8249258160237388,
"eval_loss": 0.4242512881755829,
"eval_runtime": 4.6367,
"eval_samples_per_second": 72.681,
"eval_steps_per_second": 9.274,
"step": 528
},
{
"epoch": 34.0,
"eval_accuracy": 0.827893175074184,
"eval_loss": 0.421082079410553,
"eval_runtime": 4.733,
"eval_samples_per_second": 71.201,
"eval_steps_per_second": 9.085,
"step": 544
},
{
"epoch": 35.0,
"eval_accuracy": 0.8338278931750742,
"eval_loss": 0.41326144337654114,
"eval_runtime": 4.6282,
"eval_samples_per_second": 72.815,
"eval_steps_per_second": 9.291,
"step": 560
},
{
"epoch": 36.0,
"eval_accuracy": 0.8338278931750742,
"eval_loss": 0.41096124053001404,
"eval_runtime": 4.6107,
"eval_samples_per_second": 73.092,
"eval_steps_per_second": 9.326,
"step": 576
},
{
"epoch": 37.0,
"eval_accuracy": 0.8367952522255193,
"eval_loss": 0.404769629240036,
"eval_runtime": 4.6205,
"eval_samples_per_second": 72.936,
"eval_steps_per_second": 9.306,
"step": 592
},
{
"epoch": 38.0,
"eval_accuracy": 0.8427299703264095,
"eval_loss": 0.40141698718070984,
"eval_runtime": 4.6612,
"eval_samples_per_second": 72.298,
"eval_steps_per_second": 9.225,
"step": 608
},
{
"epoch": 39.0,
"eval_accuracy": 0.8456973293768546,
"eval_loss": 0.3952626883983612,
"eval_runtime": 4.6328,
"eval_samples_per_second": 72.742,
"eval_steps_per_second": 9.282,
"step": 624
},
{
"epoch": 40.0,
"eval_accuracy": 0.8456973293768546,
"eval_loss": 0.390024334192276,
"eval_runtime": 4.5638,
"eval_samples_per_second": 73.843,
"eval_steps_per_second": 9.422,
"step": 640
},
{
"epoch": 41.0,
"eval_accuracy": 0.8456973293768546,
"eval_loss": 0.3834027349948883,
"eval_runtime": 4.6261,
"eval_samples_per_second": 72.848,
"eval_steps_per_second": 9.295,
"step": 656
},
{
"epoch": 42.0,
"eval_accuracy": 0.8456973293768546,
"eval_loss": 0.3803389072418213,
"eval_runtime": 4.6158,
"eval_samples_per_second": 73.009,
"eval_steps_per_second": 9.316,
"step": 672
},
{
"epoch": 43.0,
"eval_accuracy": 0.8456973293768546,
"eval_loss": 0.37990784645080566,
"eval_runtime": 4.6288,
"eval_samples_per_second": 72.805,
"eval_steps_per_second": 9.29,
"step": 688
},
{
"epoch": 44.0,
"eval_accuracy": 0.8456973293768546,
"eval_loss": 0.3741393983364105,
"eval_runtime": 4.7575,
"eval_samples_per_second": 70.836,
"eval_steps_per_second": 9.038,
"step": 704
},
{
"epoch": 45.0,
"eval_accuracy": 0.8545994065281899,
"eval_loss": 0.36607253551483154,
"eval_runtime": 4.6476,
"eval_samples_per_second": 72.511,
"eval_steps_per_second": 9.252,
"step": 720
},
{
"epoch": 46.0,
"eval_accuracy": 0.8486646884272997,
"eval_loss": 0.3655509054660797,
"eval_runtime": 4.6664,
"eval_samples_per_second": 72.218,
"eval_steps_per_second": 9.215,
"step": 736
},
{
"epoch": 47.0,
"eval_accuracy": 0.8486646884272997,
"eval_loss": 0.36614400148391724,
"eval_runtime": 4.6792,
"eval_samples_per_second": 72.021,
"eval_steps_per_second": 9.19,
"step": 752
},
{
"epoch": 48.0,
"eval_accuracy": 0.8486646884272997,
"eval_loss": 0.3684944808483124,
"eval_runtime": 4.6175,
"eval_samples_per_second": 72.983,
"eval_steps_per_second": 9.312,
"step": 768
},
{
"epoch": 49.0,
"eval_accuracy": 0.8486646884272997,
"eval_loss": 0.36265119910240173,
"eval_runtime": 4.6573,
"eval_samples_per_second": 72.36,
"eval_steps_per_second": 9.233,
"step": 784
},
{
"epoch": 50.0,
"eval_accuracy": 0.8486646884272997,
"eval_loss": 0.359169065952301,
"eval_runtime": 4.7664,
"eval_samples_per_second": 70.703,
"eval_steps_per_second": 9.021,
"step": 800
},
{
"epoch": 51.0,
"eval_accuracy": 0.8486646884272997,
"eval_loss": 0.35570138692855835,
"eval_runtime": 4.7355,
"eval_samples_per_second": 71.165,
"eval_steps_per_second": 9.08,
"step": 816
},
{
"epoch": 52.0,
"eval_accuracy": 0.8456973293768546,
"eval_loss": 0.35541436076164246,
"eval_runtime": 4.7442,
"eval_samples_per_second": 71.035,
"eval_steps_per_second": 9.064,
"step": 832
},
{
"epoch": 53.0,
"eval_accuracy": 0.8486646884272997,
"eval_loss": 0.3521236479282379,
"eval_runtime": 4.6755,
"eval_samples_per_second": 72.078,
"eval_steps_per_second": 9.197,
"step": 848
},
{
"epoch": 54.0,
"eval_accuracy": 0.8486646884272997,
"eval_loss": 0.3523922264575958,
"eval_runtime": 4.6657,
"eval_samples_per_second": 72.23,
"eval_steps_per_second": 9.216,
"step": 864
},
{
"epoch": 55.0,
"eval_accuracy": 0.8516320474777448,
"eval_loss": 0.34878119826316833,
"eval_runtime": 4.6488,
"eval_samples_per_second": 72.491,
"eval_steps_per_second": 9.25,
"step": 880
},
{
"epoch": 56.0,
"eval_accuracy": 0.8516320474777448,
"eval_loss": 0.3482997715473175,
"eval_runtime": 4.683,
"eval_samples_per_second": 71.963,
"eval_steps_per_second": 9.182,
"step": 896
},
{
"epoch": 57.0,
"eval_accuracy": 0.8456973293768546,
"eval_loss": 0.348295122385025,
"eval_runtime": 4.8638,
"eval_samples_per_second": 69.287,
"eval_steps_per_second": 8.841,
"step": 912
},
{
"epoch": 58.0,
"eval_accuracy": 0.8456973293768546,
"eval_loss": 0.3468620479106903,
"eval_runtime": 4.8133,
"eval_samples_per_second": 70.014,
"eval_steps_per_second": 8.934,
"step": 928
},
{
"epoch": 59.0,
"eval_accuracy": 0.8486646884272997,
"eval_loss": 0.3429933488368988,
"eval_runtime": 4.7367,
"eval_samples_per_second": 71.146,
"eval_steps_per_second": 9.078,
"step": 944
},
{
"epoch": 60.0,
"eval_accuracy": 0.8516320474777448,
"eval_loss": 0.347034752368927,
"eval_runtime": 4.7735,
"eval_samples_per_second": 70.598,
"eval_steps_per_second": 9.008,
"step": 960
},
{
"epoch": 61.0,
"eval_accuracy": 0.8545994065281899,
"eval_loss": 0.34952038526535034,
"eval_runtime": 4.6627,
"eval_samples_per_second": 72.276,
"eval_steps_per_second": 9.222,
"step": 976
},
{
"epoch": 62.0,
"eval_accuracy": 0.857566765578635,
"eval_loss": 0.34523066878318787,
"eval_runtime": 4.761,
"eval_samples_per_second": 70.783,
"eval_steps_per_second": 9.032,
"step": 992
},
{
"epoch": 62.5,
"grad_norm": 4.032630920410156,
"learning_rate": 3.8709677419354837e-07,
"loss": 0.2134,
"step": 1000
},
{
"epoch": 63.0,
"eval_accuracy": 0.8605341246290801,
"eval_loss": 0.3458469808101654,
"eval_runtime": 4.7825,
"eval_samples_per_second": 70.465,
"eval_steps_per_second": 8.991,
"step": 1008
},
{
"epoch": 64.0,
"eval_accuracy": 0.8605341246290801,
"eval_loss": 0.3463592529296875,
"eval_runtime": 4.7675,
"eval_samples_per_second": 70.687,
"eval_steps_per_second": 9.019,
"step": 1024
},
{
"epoch": 65.0,
"eval_accuracy": 0.8605341246290801,
"eval_loss": 0.3484276831150055,
"eval_runtime": 4.7586,
"eval_samples_per_second": 70.82,
"eval_steps_per_second": 9.036,
"step": 1040
},
{
"epoch": 66.0,
"eval_accuracy": 0.8635014836795252,
"eval_loss": 0.34886136651039124,
"eval_runtime": 4.7061,
"eval_samples_per_second": 71.609,
"eval_steps_per_second": 9.137,
"step": 1056
},
{
"epoch": 67.0,
"eval_accuracy": 0.8635014836795252,
"eval_loss": 0.3485889434814453,
"eval_runtime": 4.6029,
"eval_samples_per_second": 73.215,
"eval_steps_per_second": 9.342,
"step": 1072
},
{
"epoch": 68.0,
"eval_accuracy": 0.8635014836795252,
"eval_loss": 0.3503687381744385,
"eval_runtime": 4.7013,
"eval_samples_per_second": 71.682,
"eval_steps_per_second": 9.146,
"step": 1088
},
{
"epoch": 69.0,
"eval_accuracy": 0.8635014836795252,
"eval_loss": 0.3495609164237976,
"eval_runtime": 4.7225,
"eval_samples_per_second": 71.36,
"eval_steps_per_second": 9.105,
"step": 1104
},
{
"epoch": 70.0,
"eval_accuracy": 0.8605341246290801,
"eval_loss": 0.3446400761604309,
"eval_runtime": 4.7445,
"eval_samples_per_second": 71.029,
"eval_steps_per_second": 9.063,
"step": 1120
},
{
"epoch": 71.0,
"eval_accuracy": 0.8635014836795252,
"eval_loss": 0.3452640175819397,
"eval_runtime": 4.6434,
"eval_samples_per_second": 72.577,
"eval_steps_per_second": 9.261,
"step": 1136
},
{
"epoch": 72.0,
"eval_accuracy": 0.8635014836795252,
"eval_loss": 0.34035128355026245,
"eval_runtime": 4.7053,
"eval_samples_per_second": 71.622,
"eval_steps_per_second": 9.139,
"step": 1152
},
{
"epoch": 73.0,
"eval_accuracy": 0.8635014836795252,
"eval_loss": 0.33860069513320923,
"eval_runtime": 4.6174,
"eval_samples_per_second": 72.985,
"eval_steps_per_second": 9.313,
"step": 1168
},
{
"epoch": 74.0,
"eval_accuracy": 0.8635014836795252,
"eval_loss": 0.3384004831314087,
"eval_runtime": 4.663,
"eval_samples_per_second": 72.271,
"eval_steps_per_second": 9.221,
"step": 1184
},
{
"epoch": 75.0,
"eval_accuracy": 0.8664688427299704,
"eval_loss": 0.33985474705696106,
"eval_runtime": 4.7211,
"eval_samples_per_second": 71.382,
"eval_steps_per_second": 9.108,
"step": 1200
},
{
"epoch": 76.0,
"eval_accuracy": 0.8664688427299704,
"eval_loss": 0.3414258062839508,
"eval_runtime": 4.7314,
"eval_samples_per_second": 71.226,
"eval_steps_per_second": 9.088,
"step": 1216
},
{
"epoch": 77.0,
"eval_accuracy": 0.8664688427299704,
"eval_loss": 0.3427448272705078,
"eval_runtime": 4.7038,
"eval_samples_per_second": 71.644,
"eval_steps_per_second": 9.141,
"step": 1232
},
{
"epoch": 78.0,
"eval_accuracy": 0.8635014836795252,
"eval_loss": 0.34361016750335693,
"eval_runtime": 4.8723,
"eval_samples_per_second": 69.167,
"eval_steps_per_second": 8.825,
"step": 1248
},
{
"epoch": 79.0,
"eval_accuracy": 0.8664688427299704,
"eval_loss": 0.34205198287963867,
"eval_runtime": 4.7564,
"eval_samples_per_second": 70.851,
"eval_steps_per_second": 9.04,
"step": 1264
},
{
"epoch": 80.0,
"eval_accuracy": 0.8664688427299704,
"eval_loss": 0.3414119780063629,
"eval_runtime": 4.7639,
"eval_samples_per_second": 70.74,
"eval_steps_per_second": 9.026,
"step": 1280
},
{
"epoch": 81.0,
"eval_accuracy": 0.8664688427299704,
"eval_loss": 0.3397296071052551,
"eval_runtime": 4.7085,
"eval_samples_per_second": 71.572,
"eval_steps_per_second": 9.132,
"step": 1296
},
{
"epoch": 82.0,
"eval_accuracy": 0.8664688427299704,
"eval_loss": 0.3387517035007477,
"eval_runtime": 4.764,
"eval_samples_per_second": 70.738,
"eval_steps_per_second": 9.026,
"step": 1312
},
{
"epoch": 83.0,
"eval_accuracy": 0.8664688427299704,
"eval_loss": 0.33925285935401917,
"eval_runtime": 4.8225,
"eval_samples_per_second": 69.88,
"eval_steps_per_second": 8.916,
"step": 1328
},
{
"epoch": 84.0,
"eval_accuracy": 0.8664688427299704,
"eval_loss": 0.3406101167201996,
"eval_runtime": 4.6734,
"eval_samples_per_second": 72.11,
"eval_steps_per_second": 9.201,
"step": 1344
},
{
"epoch": 85.0,
"eval_accuracy": 0.8664688427299704,
"eval_loss": 0.33851388096809387,
"eval_runtime": 4.7413,
"eval_samples_per_second": 71.077,
"eval_steps_per_second": 9.069,
"step": 1360
},
{
"epoch": 86.0,
"eval_accuracy": 0.8664688427299704,
"eval_loss": 0.3385758697986603,
"eval_runtime": 4.707,
"eval_samples_per_second": 71.596,
"eval_steps_per_second": 9.135,
"step": 1376
},
{
"epoch": 87.0,
"eval_accuracy": 0.8664688427299704,
"eval_loss": 0.33774590492248535,
"eval_runtime": 4.6381,
"eval_samples_per_second": 72.658,
"eval_steps_per_second": 9.271,
"step": 1392
}
],
"logging_steps": 500,
"max_steps": 1600,
"num_input_tokens_seen": 0,
"num_train_epochs": 100,
"save_steps": 500,
"total_flos": 3.4046105637170995e+18,
"train_batch_size": 32,
"trial_name": null,
"trial_params": null
}