dima806's picture
Upload folder using huggingface_hub
b5274ae
{
"best_metric": 1.3654530048370361,
"best_model_checkpoint": "75_butterfly_types_image_detection/checkpoint-6150",
"epoch": 50.0,
"eval_steps": 500,
"global_step": 6150,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_accuracy": 0.10483460559796437,
"eval_loss": 4.219280242919922,
"eval_runtime": 16.1158,
"eval_samples_per_second": 121.93,
"eval_steps_per_second": 3.847,
"step": 123
},
{
"epoch": 2.0,
"eval_accuracy": 0.416793893129771,
"eval_loss": 4.0515265464782715,
"eval_runtime": 16.031,
"eval_samples_per_second": 122.575,
"eval_steps_per_second": 3.868,
"step": 246
},
{
"epoch": 3.0,
"eval_accuracy": 0.6743002544529262,
"eval_loss": 3.868370532989502,
"eval_runtime": 16.1588,
"eval_samples_per_second": 121.605,
"eval_steps_per_second": 3.837,
"step": 369
},
{
"epoch": 4.0,
"eval_accuracy": 0.7791348600508906,
"eval_loss": 3.682469129562378,
"eval_runtime": 16.1954,
"eval_samples_per_second": 121.331,
"eval_steps_per_second": 3.828,
"step": 492
},
{
"epoch": 4.07,
"learning_rate": 4.631147540983607e-06,
"loss": 4.0027,
"step": 500
},
{
"epoch": 5.0,
"eval_accuracy": 0.8213740458015267,
"eval_loss": 3.506803035736084,
"eval_runtime": 16.0347,
"eval_samples_per_second": 122.546,
"eval_steps_per_second": 3.867,
"step": 615
},
{
"epoch": 6.0,
"eval_accuracy": 0.8396946564885496,
"eval_loss": 3.344095468521118,
"eval_runtime": 16.3499,
"eval_samples_per_second": 120.184,
"eval_steps_per_second": 3.792,
"step": 738
},
{
"epoch": 7.0,
"eval_accuracy": 0.8569974554707379,
"eval_loss": 3.1964809894561768,
"eval_runtime": 16.1751,
"eval_samples_per_second": 121.483,
"eval_steps_per_second": 3.833,
"step": 861
},
{
"epoch": 8.0,
"eval_accuracy": 0.8661577608142493,
"eval_loss": 3.0642857551574707,
"eval_runtime": 16.1962,
"eval_samples_per_second": 121.325,
"eval_steps_per_second": 3.828,
"step": 984
},
{
"epoch": 8.13,
"learning_rate": 4.221311475409837e-06,
"loss": 3.2743,
"step": 1000
},
{
"epoch": 9.0,
"eval_accuracy": 0.8743002544529263,
"eval_loss": 2.9428579807281494,
"eval_runtime": 16.3097,
"eval_samples_per_second": 120.48,
"eval_steps_per_second": 3.801,
"step": 1107
},
{
"epoch": 10.0,
"eval_accuracy": 0.8844783715012723,
"eval_loss": 2.832017183303833,
"eval_runtime": 16.1405,
"eval_samples_per_second": 121.743,
"eval_steps_per_second": 3.841,
"step": 1230
},
{
"epoch": 11.0,
"eval_accuracy": 0.8875318066157761,
"eval_loss": 2.7307262420654297,
"eval_runtime": 16.6796,
"eval_samples_per_second": 117.808,
"eval_steps_per_second": 3.717,
"step": 1353
},
{
"epoch": 12.0,
"eval_accuracy": 0.8941475826972011,
"eval_loss": 2.635011911392212,
"eval_runtime": 16.1864,
"eval_samples_per_second": 121.398,
"eval_steps_per_second": 3.83,
"step": 1476
},
{
"epoch": 12.2,
"learning_rate": 3.811475409836066e-06,
"loss": 2.7379,
"step": 1500
},
{
"epoch": 13.0,
"eval_accuracy": 0.9012722646310433,
"eval_loss": 2.54408597946167,
"eval_runtime": 16.1725,
"eval_samples_per_second": 121.503,
"eval_steps_per_second": 3.834,
"step": 1599
},
{
"epoch": 14.0,
"eval_accuracy": 0.9038167938931297,
"eval_loss": 2.461076259613037,
"eval_runtime": 16.188,
"eval_samples_per_second": 121.386,
"eval_steps_per_second": 3.83,
"step": 1722
},
{
"epoch": 15.0,
"eval_accuracy": 0.905852417302799,
"eval_loss": 2.3826189041137695,
"eval_runtime": 16.0942,
"eval_samples_per_second": 122.094,
"eval_steps_per_second": 3.852,
"step": 1845
},
{
"epoch": 16.0,
"eval_accuracy": 0.9104325699745547,
"eval_loss": 2.3125312328338623,
"eval_runtime": 16.0801,
"eval_samples_per_second": 122.201,
"eval_steps_per_second": 3.856,
"step": 1968
},
{
"epoch": 16.26,
"learning_rate": 3.4016393442622954e-06,
"loss": 2.3551,
"step": 2000
},
{
"epoch": 17.0,
"eval_accuracy": 0.9150127226463104,
"eval_loss": 2.2421457767486572,
"eval_runtime": 16.1647,
"eval_samples_per_second": 121.561,
"eval_steps_per_second": 3.836,
"step": 2091
},
{
"epoch": 18.0,
"eval_accuracy": 0.9180661577608142,
"eval_loss": 2.177084445953369,
"eval_runtime": 16.1219,
"eval_samples_per_second": 121.884,
"eval_steps_per_second": 3.846,
"step": 2214
},
{
"epoch": 19.0,
"eval_accuracy": 0.9185750636132316,
"eval_loss": 2.118427038192749,
"eval_runtime": 16.2975,
"eval_samples_per_second": 120.571,
"eval_steps_per_second": 3.804,
"step": 2337
},
{
"epoch": 20.0,
"eval_accuracy": 0.9206106870229007,
"eval_loss": 2.0600903034210205,
"eval_runtime": 16.1374,
"eval_samples_per_second": 121.767,
"eval_steps_per_second": 3.842,
"step": 2460
},
{
"epoch": 20.33,
"learning_rate": 2.991803278688525e-06,
"loss": 2.0646,
"step": 2500
},
{
"epoch": 21.0,
"eval_accuracy": 0.9231552162849873,
"eval_loss": 2.0077874660491943,
"eval_runtime": 16.1894,
"eval_samples_per_second": 121.376,
"eval_steps_per_second": 3.83,
"step": 2583
},
{
"epoch": 22.0,
"eval_accuracy": 0.9246819338422392,
"eval_loss": 1.9560858011245728,
"eval_runtime": 16.2039,
"eval_samples_per_second": 121.267,
"eval_steps_per_second": 3.826,
"step": 2706
},
{
"epoch": 23.0,
"eval_accuracy": 0.9246819338422392,
"eval_loss": 1.9086360931396484,
"eval_runtime": 16.1264,
"eval_samples_per_second": 121.85,
"eval_steps_per_second": 3.845,
"step": 2829
},
{
"epoch": 24.0,
"eval_accuracy": 0.9272264631043257,
"eval_loss": 1.8643087148666382,
"eval_runtime": 16.2238,
"eval_samples_per_second": 121.118,
"eval_steps_per_second": 3.822,
"step": 2952
},
{
"epoch": 24.39,
"learning_rate": 2.5819672131147543e-06,
"loss": 1.8362,
"step": 3000
},
{
"epoch": 25.0,
"eval_accuracy": 0.9292620865139949,
"eval_loss": 1.8223220109939575,
"eval_runtime": 16.1769,
"eval_samples_per_second": 121.47,
"eval_steps_per_second": 3.833,
"step": 3075
},
{
"epoch": 26.0,
"eval_accuracy": 0.9323155216284987,
"eval_loss": 1.781746745109558,
"eval_runtime": 16.1733,
"eval_samples_per_second": 121.496,
"eval_steps_per_second": 3.833,
"step": 3198
},
{
"epoch": 27.0,
"eval_accuracy": 0.932824427480916,
"eval_loss": 1.7436439990997314,
"eval_runtime": 16.25,
"eval_samples_per_second": 120.923,
"eval_steps_per_second": 3.815,
"step": 3321
},
{
"epoch": 28.0,
"eval_accuracy": 0.9333333333333333,
"eval_loss": 1.7096657752990723,
"eval_runtime": 16.2645,
"eval_samples_per_second": 120.815,
"eval_steps_per_second": 3.812,
"step": 3444
},
{
"epoch": 28.46,
"learning_rate": 2.1721311475409838e-06,
"loss": 1.6594,
"step": 3500
},
{
"epoch": 29.0,
"eval_accuracy": 0.934351145038168,
"eval_loss": 1.6767544746398926,
"eval_runtime": 16.0446,
"eval_samples_per_second": 122.471,
"eval_steps_per_second": 3.864,
"step": 3567
},
{
"epoch": 30.0,
"eval_accuracy": 0.9363867684478372,
"eval_loss": 1.6452341079711914,
"eval_runtime": 16.2929,
"eval_samples_per_second": 120.605,
"eval_steps_per_second": 3.805,
"step": 3690
},
{
"epoch": 31.0,
"eval_accuracy": 0.9368956743002544,
"eval_loss": 1.6171735525131226,
"eval_runtime": 16.1612,
"eval_samples_per_second": 121.587,
"eval_steps_per_second": 3.836,
"step": 3813
},
{
"epoch": 32.0,
"eval_accuracy": 0.9394402035623409,
"eval_loss": 1.5884838104248047,
"eval_runtime": 16.0285,
"eval_samples_per_second": 122.594,
"eval_steps_per_second": 3.868,
"step": 3936
},
{
"epoch": 32.52,
"learning_rate": 1.7622950819672133e-06,
"loss": 1.5202,
"step": 4000
},
{
"epoch": 33.0,
"eval_accuracy": 0.9399491094147583,
"eval_loss": 1.5642931461334229,
"eval_runtime": 16.0014,
"eval_samples_per_second": 122.801,
"eval_steps_per_second": 3.875,
"step": 4059
},
{
"epoch": 34.0,
"eval_accuracy": 0.9379134860050891,
"eval_loss": 1.5411930084228516,
"eval_runtime": 16.0783,
"eval_samples_per_second": 122.214,
"eval_steps_per_second": 3.856,
"step": 4182
},
{
"epoch": 35.0,
"eval_accuracy": 0.9409669211195929,
"eval_loss": 1.518629789352417,
"eval_runtime": 16.0126,
"eval_samples_per_second": 122.716,
"eval_steps_per_second": 3.872,
"step": 4305
},
{
"epoch": 36.0,
"eval_accuracy": 0.9419847328244275,
"eval_loss": 1.4979873895645142,
"eval_runtime": 16.1815,
"eval_samples_per_second": 121.435,
"eval_steps_per_second": 3.832,
"step": 4428
},
{
"epoch": 36.59,
"learning_rate": 1.352459016393443e-06,
"loss": 1.4134,
"step": 4500
},
{
"epoch": 37.0,
"eval_accuracy": 0.9424936386768448,
"eval_loss": 1.4799128770828247,
"eval_runtime": 16.1592,
"eval_samples_per_second": 121.603,
"eval_steps_per_second": 3.837,
"step": 4551
},
{
"epoch": 38.0,
"eval_accuracy": 0.944529262086514,
"eval_loss": 1.462226390838623,
"eval_runtime": 16.17,
"eval_samples_per_second": 121.522,
"eval_steps_per_second": 3.834,
"step": 4674
},
{
"epoch": 39.0,
"eval_accuracy": 0.9435114503816794,
"eval_loss": 1.4462333917617798,
"eval_runtime": 16.3661,
"eval_samples_per_second": 120.065,
"eval_steps_per_second": 3.788,
"step": 4797
},
{
"epoch": 40.0,
"eval_accuracy": 0.9435114503816794,
"eval_loss": 1.432714581489563,
"eval_runtime": 16.2167,
"eval_samples_per_second": 121.171,
"eval_steps_per_second": 3.823,
"step": 4920
},
{
"epoch": 40.65,
"learning_rate": 9.426229508196721e-07,
"loss": 1.3371,
"step": 5000
},
{
"epoch": 41.0,
"eval_accuracy": 0.9435114503816794,
"eval_loss": 1.4191633462905884,
"eval_runtime": 16.352,
"eval_samples_per_second": 120.169,
"eval_steps_per_second": 3.792,
"step": 5043
},
{
"epoch": 42.0,
"eval_accuracy": 0.944529262086514,
"eval_loss": 1.4076900482177734,
"eval_runtime": 16.453,
"eval_samples_per_second": 119.431,
"eval_steps_per_second": 3.768,
"step": 5166
},
{
"epoch": 43.0,
"eval_accuracy": 0.9450381679389313,
"eval_loss": 1.3978630304336548,
"eval_runtime": 16.2004,
"eval_samples_per_second": 121.293,
"eval_steps_per_second": 3.827,
"step": 5289
},
{
"epoch": 44.0,
"eval_accuracy": 0.9455470737913486,
"eval_loss": 1.3894777297973633,
"eval_runtime": 16.3005,
"eval_samples_per_second": 120.549,
"eval_steps_per_second": 3.804,
"step": 5412
},
{
"epoch": 44.72,
"learning_rate": 5.327868852459017e-07,
"loss": 1.2847,
"step": 5500
},
{
"epoch": 45.0,
"eval_accuracy": 0.9455470737913486,
"eval_loss": 1.3816895484924316,
"eval_runtime": 16.1887,
"eval_samples_per_second": 121.381,
"eval_steps_per_second": 3.83,
"step": 5535
},
{
"epoch": 46.0,
"eval_accuracy": 0.9455470737913486,
"eval_loss": 1.376446008682251,
"eval_runtime": 16.3897,
"eval_samples_per_second": 119.893,
"eval_steps_per_second": 3.783,
"step": 5658
},
{
"epoch": 47.0,
"eval_accuracy": 0.9455470737913486,
"eval_loss": 1.3714139461517334,
"eval_runtime": 16.2429,
"eval_samples_per_second": 120.976,
"eval_steps_per_second": 3.817,
"step": 5781
},
{
"epoch": 48.0,
"eval_accuracy": 0.9455470737913486,
"eval_loss": 1.3681418895721436,
"eval_runtime": 16.2361,
"eval_samples_per_second": 121.027,
"eval_steps_per_second": 3.819,
"step": 5904
},
{
"epoch": 48.78,
"learning_rate": 1.2295081967213116e-07,
"loss": 1.2536,
"step": 6000
},
{
"epoch": 49.0,
"eval_accuracy": 0.9455470737913486,
"eval_loss": 1.3659467697143555,
"eval_runtime": 16.2019,
"eval_samples_per_second": 121.282,
"eval_steps_per_second": 3.827,
"step": 6027
},
{
"epoch": 50.0,
"eval_accuracy": 0.9455470737913486,
"eval_loss": 1.3654530048370361,
"eval_runtime": 16.2047,
"eval_samples_per_second": 121.261,
"eval_steps_per_second": 3.826,
"step": 6150
}
],
"logging_steps": 500,
"max_steps": 6150,
"num_train_epochs": 50,
"save_steps": 500,
"total_flos": 3.0474277467346944e+19,
"trial_name": null,
"trial_params": null
}