resnet-18-feature-extraction / trainer_state.json
SiddharthaM's picture
End of training
5db9bb2
{
"best_metric": 0.95625,
"best_model_checkpoint": "resnet-18-feature-extraction/checkpoint-26",
"epoch": 49.8,
"global_step": 100,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.8,
"eval_accuracy": 0.75,
"eval_f1": 0.8412698412698413,
"eval_loss": 0.6231745481491089,
"eval_precision": 0.9636363636363636,
"eval_recall": 0.7464788732394366,
"eval_roc_auc": 0.7621283255086071,
"eval_runtime": 5.3474,
"eval_samples_per_second": 29.921,
"eval_steps_per_second": 0.561,
"step": 2
},
{
"epoch": 1.8,
"eval_accuracy": 0.4875,
"eval_f1": 0.5940594059405941,
"eval_loss": 0.6971184611320496,
"eval_precision": 1.0,
"eval_recall": 0.4225352112676056,
"eval_roc_auc": 0.7112676056338028,
"eval_runtime": 4.1245,
"eval_samples_per_second": 38.792,
"eval_steps_per_second": 0.727,
"step": 4
},
{
"epoch": 2.8,
"eval_accuracy": 0.2875,
"eval_f1": 0.32941176470588235,
"eval_loss": 0.7914562821388245,
"eval_precision": 1.0,
"eval_recall": 0.19718309859154928,
"eval_roc_auc": 0.5985915492957746,
"eval_runtime": 4.0788,
"eval_samples_per_second": 39.227,
"eval_steps_per_second": 0.736,
"step": 6
},
{
"epoch": 3.8,
"eval_accuracy": 0.2875,
"eval_f1": 0.32941176470588235,
"eval_loss": 0.8479948043823242,
"eval_precision": 1.0,
"eval_recall": 0.19718309859154928,
"eval_roc_auc": 0.5985915492957746,
"eval_runtime": 3.9544,
"eval_samples_per_second": 40.462,
"eval_steps_per_second": 0.759,
"step": 8
},
{
"epoch": 4.8,
"learning_rate": 2e-05,
"loss": 0.8651,
"step": 10
},
{
"epoch": 4.8,
"eval_accuracy": 0.25625,
"eval_f1": 0.2787878787878788,
"eval_loss": 0.9093517065048218,
"eval_precision": 1.0,
"eval_recall": 0.1619718309859155,
"eval_roc_auc": 0.5809859154929577,
"eval_runtime": 4.143,
"eval_samples_per_second": 38.62,
"eval_steps_per_second": 0.724,
"step": 10
},
{
"epoch": 5.8,
"eval_accuracy": 0.5625,
"eval_f1": 0.6728971962616822,
"eval_loss": 0.7470346689224243,
"eval_precision": 1.0,
"eval_recall": 0.5070422535211268,
"eval_roc_auc": 0.7535211267605634,
"eval_runtime": 3.9679,
"eval_samples_per_second": 40.323,
"eval_steps_per_second": 0.756,
"step": 12
},
{
"epoch": 6.8,
"eval_accuracy": 0.85,
"eval_f1": 0.9076923076923077,
"eval_loss": 0.5915343165397644,
"eval_precision": 1.0,
"eval_recall": 0.8309859154929577,
"eval_roc_auc": 0.9154929577464789,
"eval_runtime": 4.0338,
"eval_samples_per_second": 39.665,
"eval_steps_per_second": 0.744,
"step": 14
},
{
"epoch": 7.8,
"eval_accuracy": 0.8875,
"eval_f1": 0.9333333333333333,
"eval_loss": 0.4816938042640686,
"eval_precision": 0.984375,
"eval_recall": 0.8873239436619719,
"eval_roc_auc": 0.8881064162754304,
"eval_runtime": 4.0258,
"eval_samples_per_second": 39.743,
"eval_steps_per_second": 0.745,
"step": 16
},
{
"epoch": 8.8,
"eval_accuracy": 0.91875,
"eval_f1": 0.9530685920577617,
"eval_loss": 0.34547853469848633,
"eval_precision": 0.9777777777777777,
"eval_recall": 0.9295774647887324,
"eval_roc_auc": 0.881455399061033,
"eval_runtime": 3.9749,
"eval_samples_per_second": 40.253,
"eval_steps_per_second": 0.755,
"step": 18
},
{
"epoch": 9.8,
"learning_rate": 1.7777777777777777e-05,
"loss": 0.5349,
"step": 20
},
{
"epoch": 9.8,
"eval_accuracy": 0.91875,
"eval_f1": 0.9534050179211471,
"eval_loss": 0.29664501547813416,
"eval_precision": 0.9708029197080292,
"eval_recall": 0.9366197183098591,
"eval_roc_auc": 0.8571987480438183,
"eval_runtime": 4.2704,
"eval_samples_per_second": 37.467,
"eval_steps_per_second": 0.703,
"step": 20
},
{
"epoch": 10.8,
"eval_accuracy": 0.95,
"eval_f1": 0.972027972027972,
"eval_loss": 0.23471388220787048,
"eval_precision": 0.9652777777777778,
"eval_recall": 0.9788732394366197,
"eval_roc_auc": 0.850547730829421,
"eval_runtime": 3.9069,
"eval_samples_per_second": 40.953,
"eval_steps_per_second": 0.768,
"step": 22
},
{
"epoch": 11.8,
"eval_accuracy": 0.93125,
"eval_f1": 0.9611307420494699,
"eval_loss": 0.2467934787273407,
"eval_precision": 0.9645390070921985,
"eval_recall": 0.9577464788732394,
"eval_roc_auc": 0.8399843505477309,
"eval_runtime": 4.025,
"eval_samples_per_second": 39.751,
"eval_steps_per_second": 0.745,
"step": 24
},
{
"epoch": 12.8,
"eval_accuracy": 0.95625,
"eval_f1": 0.9754385964912281,
"eval_loss": 0.23101434111595154,
"eval_precision": 0.972027972027972,
"eval_recall": 0.9788732394366197,
"eval_roc_auc": 0.8783255086071988,
"eval_runtime": 4.0457,
"eval_samples_per_second": 39.548,
"eval_steps_per_second": 0.742,
"step": 26
},
{
"epoch": 13.8,
"eval_accuracy": 0.93125,
"eval_f1": 0.9614035087719298,
"eval_loss": 0.2082931101322174,
"eval_precision": 0.958041958041958,
"eval_recall": 0.9647887323943662,
"eval_roc_auc": 0.8157276995305165,
"eval_runtime": 4.0645,
"eval_samples_per_second": 39.366,
"eval_steps_per_second": 0.738,
"step": 28
},
{
"epoch": 14.8,
"learning_rate": 1.555555555555556e-05,
"loss": 0.3593,
"step": 30
},
{
"epoch": 14.8,
"eval_accuracy": 0.9375,
"eval_f1": 0.9652777777777778,
"eval_loss": 0.18395133316516876,
"eval_precision": 0.952054794520548,
"eval_recall": 0.9788732394366197,
"eval_roc_auc": 0.7949921752738655,
"eval_runtime": 3.8518,
"eval_samples_per_second": 41.539,
"eval_steps_per_second": 0.779,
"step": 30
},
{
"epoch": 15.8,
"eval_accuracy": 0.9375,
"eval_f1": 0.9647887323943662,
"eval_loss": 0.19472570717334747,
"eval_precision": 0.9647887323943662,
"eval_recall": 0.9647887323943662,
"eval_roc_auc": 0.8435054773082942,
"eval_runtime": 4.1431,
"eval_samples_per_second": 38.618,
"eval_steps_per_second": 0.724,
"step": 32
},
{
"epoch": 16.8,
"eval_accuracy": 0.93125,
"eval_f1": 0.9616724738675958,
"eval_loss": 0.1836571842432022,
"eval_precision": 0.9517241379310345,
"eval_recall": 0.971830985915493,
"eval_roc_auc": 0.7914710485133021,
"eval_runtime": 4.0848,
"eval_samples_per_second": 39.17,
"eval_steps_per_second": 0.734,
"step": 34
},
{
"epoch": 17.8,
"eval_accuracy": 0.94375,
"eval_f1": 0.9688581314878894,
"eval_loss": 0.1819494664669037,
"eval_precision": 0.9523809523809523,
"eval_recall": 0.9859154929577465,
"eval_roc_auc": 0.7985133020344288,
"eval_runtime": 3.9897,
"eval_samples_per_second": 40.104,
"eval_steps_per_second": 0.752,
"step": 36
},
{
"epoch": 18.8,
"eval_accuracy": 0.94375,
"eval_f1": 0.968421052631579,
"eval_loss": 0.19235201179981232,
"eval_precision": 0.965034965034965,
"eval_recall": 0.971830985915493,
"eval_roc_auc": 0.8470266040688575,
"eval_runtime": 4.041,
"eval_samples_per_second": 39.594,
"eval_steps_per_second": 0.742,
"step": 38
},
{
"epoch": 19.8,
"learning_rate": 1.3333333333333333e-05,
"loss": 0.2737,
"step": 40
},
{
"epoch": 19.8,
"eval_accuracy": 0.95,
"eval_f1": 0.972027972027972,
"eval_loss": 0.1990378201007843,
"eval_precision": 0.9652777777777778,
"eval_recall": 0.9788732394366197,
"eval_roc_auc": 0.850547730829421,
"eval_runtime": 4.1236,
"eval_samples_per_second": 38.801,
"eval_steps_per_second": 0.728,
"step": 40
},
{
"epoch": 20.8,
"eval_accuracy": 0.95,
"eval_f1": 0.971830985915493,
"eval_loss": 0.1758503019809723,
"eval_precision": 0.971830985915493,
"eval_recall": 0.971830985915493,
"eval_roc_auc": 0.8748043818466354,
"eval_runtime": 4.1193,
"eval_samples_per_second": 38.841,
"eval_steps_per_second": 0.728,
"step": 42
},
{
"epoch": 21.8,
"eval_accuracy": 0.93125,
"eval_f1": 0.9616724738675958,
"eval_loss": 0.18040268123149872,
"eval_precision": 0.9517241379310345,
"eval_recall": 0.971830985915493,
"eval_roc_auc": 0.7914710485133021,
"eval_runtime": 3.8662,
"eval_samples_per_second": 41.384,
"eval_steps_per_second": 0.776,
"step": 44
},
{
"epoch": 22.8,
"eval_accuracy": 0.93125,
"eval_f1": 0.9616724738675958,
"eval_loss": 0.16663400828838348,
"eval_precision": 0.9517241379310345,
"eval_recall": 0.971830985915493,
"eval_roc_auc": 0.7914710485133021,
"eval_runtime": 4.3016,
"eval_samples_per_second": 37.195,
"eval_steps_per_second": 0.697,
"step": 46
},
{
"epoch": 23.8,
"eval_accuracy": 0.94375,
"eval_f1": 0.9688581314878894,
"eval_loss": 0.15337304770946503,
"eval_precision": 0.9523809523809523,
"eval_recall": 0.9859154929577465,
"eval_roc_auc": 0.7985133020344288,
"eval_runtime": 4.0456,
"eval_samples_per_second": 39.549,
"eval_steps_per_second": 0.742,
"step": 48
},
{
"epoch": 24.8,
"learning_rate": 1.1111111111111113e-05,
"loss": 0.2278,
"step": 50
},
{
"epoch": 24.8,
"eval_accuracy": 0.9375,
"eval_f1": 0.9652777777777778,
"eval_loss": 0.16116251051425934,
"eval_precision": 0.952054794520548,
"eval_recall": 0.9788732394366197,
"eval_roc_auc": 0.7949921752738655,
"eval_runtime": 4.0452,
"eval_samples_per_second": 39.553,
"eval_steps_per_second": 0.742,
"step": 50
},
{
"epoch": 25.8,
"eval_accuracy": 0.94375,
"eval_f1": 0.9686411149825783,
"eval_loss": 0.15349864959716797,
"eval_precision": 0.9586206896551724,
"eval_recall": 0.9788732394366197,
"eval_roc_auc": 0.8227699530516432,
"eval_runtime": 6.0991,
"eval_samples_per_second": 26.233,
"eval_steps_per_second": 0.492,
"step": 52
},
{
"epoch": 26.8,
"eval_accuracy": 0.94375,
"eval_f1": 0.9681978798586572,
"eval_loss": 0.1568022519350052,
"eval_precision": 0.9716312056737588,
"eval_recall": 0.9647887323943662,
"eval_roc_auc": 0.871283255086072,
"eval_runtime": 4.0891,
"eval_samples_per_second": 39.128,
"eval_steps_per_second": 0.734,
"step": 54
},
{
"epoch": 27.8,
"eval_accuracy": 0.9375,
"eval_f1": 0.9645390070921985,
"eval_loss": 0.21069078147411346,
"eval_precision": 0.9714285714285714,
"eval_recall": 0.9577464788732394,
"eval_roc_auc": 0.8677621283255086,
"eval_runtime": 4.1257,
"eval_samples_per_second": 38.781,
"eval_steps_per_second": 0.727,
"step": 56
},
{
"epoch": 28.8,
"eval_accuracy": 0.93125,
"eval_f1": 0.9616724738675958,
"eval_loss": 0.15922358632087708,
"eval_precision": 0.9517241379310345,
"eval_recall": 0.971830985915493,
"eval_roc_auc": 0.7914710485133021,
"eval_runtime": 3.944,
"eval_samples_per_second": 40.568,
"eval_steps_per_second": 0.761,
"step": 58
},
{
"epoch": 29.8,
"learning_rate": 8.888888888888888e-06,
"loss": 0.2057,
"step": 60
},
{
"epoch": 29.8,
"eval_accuracy": 0.9375,
"eval_f1": 0.9647887323943662,
"eval_loss": 0.15567776560783386,
"eval_precision": 0.9647887323943662,
"eval_recall": 0.9647887323943662,
"eval_roc_auc": 0.8435054773082942,
"eval_runtime": 3.9386,
"eval_samples_per_second": 40.624,
"eval_steps_per_second": 0.762,
"step": 60
},
{
"epoch": 30.8,
"eval_accuracy": 0.94375,
"eval_f1": 0.968421052631579,
"eval_loss": 0.1714434176683426,
"eval_precision": 0.965034965034965,
"eval_recall": 0.971830985915493,
"eval_roc_auc": 0.8470266040688575,
"eval_runtime": 4.1925,
"eval_samples_per_second": 38.164,
"eval_steps_per_second": 0.716,
"step": 62
},
{
"epoch": 31.8,
"eval_accuracy": 0.95,
"eval_f1": 0.972027972027972,
"eval_loss": 0.15714499354362488,
"eval_precision": 0.9652777777777778,
"eval_recall": 0.9788732394366197,
"eval_roc_auc": 0.850547730829421,
"eval_runtime": 4.3684,
"eval_samples_per_second": 36.627,
"eval_steps_per_second": 0.687,
"step": 64
},
{
"epoch": 32.8,
"eval_accuracy": 0.9375,
"eval_f1": 0.965034965034965,
"eval_loss": 0.15739548206329346,
"eval_precision": 0.9583333333333334,
"eval_recall": 0.971830985915493,
"eval_roc_auc": 0.8192488262910799,
"eval_runtime": 3.9613,
"eval_samples_per_second": 40.39,
"eval_steps_per_second": 0.757,
"step": 66
},
{
"epoch": 33.8,
"eval_accuracy": 0.95625,
"eval_f1": 0.9754385964912281,
"eval_loss": 0.1422826498746872,
"eval_precision": 0.972027972027972,
"eval_recall": 0.9788732394366197,
"eval_roc_auc": 0.8783255086071988,
"eval_runtime": 3.9825,
"eval_samples_per_second": 40.175,
"eval_steps_per_second": 0.753,
"step": 68
},
{
"epoch": 34.8,
"learning_rate": 6.666666666666667e-06,
"loss": 0.2,
"step": 70
},
{
"epoch": 34.8,
"eval_accuracy": 0.94375,
"eval_f1": 0.968421052631579,
"eval_loss": 0.16770192980766296,
"eval_precision": 0.965034965034965,
"eval_recall": 0.971830985915493,
"eval_roc_auc": 0.8470266040688575,
"eval_runtime": 4.1697,
"eval_samples_per_second": 38.372,
"eval_steps_per_second": 0.719,
"step": 70
},
{
"epoch": 35.8,
"eval_accuracy": 0.9375,
"eval_f1": 0.965034965034965,
"eval_loss": 0.1559743881225586,
"eval_precision": 0.9583333333333334,
"eval_recall": 0.971830985915493,
"eval_roc_auc": 0.8192488262910799,
"eval_runtime": 4.0897,
"eval_samples_per_second": 39.123,
"eval_steps_per_second": 0.734,
"step": 72
},
{
"epoch": 36.8,
"eval_accuracy": 0.9375,
"eval_f1": 0.9652777777777778,
"eval_loss": 0.15941758453845978,
"eval_precision": 0.952054794520548,
"eval_recall": 0.9788732394366197,
"eval_roc_auc": 0.7949921752738655,
"eval_runtime": 4.0474,
"eval_samples_per_second": 39.531,
"eval_steps_per_second": 0.741,
"step": 74
},
{
"epoch": 37.8,
"eval_accuracy": 0.94375,
"eval_f1": 0.9686411149825783,
"eval_loss": 0.15121030807495117,
"eval_precision": 0.9586206896551724,
"eval_recall": 0.9788732394366197,
"eval_roc_auc": 0.8227699530516432,
"eval_runtime": 4.2667,
"eval_samples_per_second": 37.499,
"eval_steps_per_second": 0.703,
"step": 76
},
{
"epoch": 38.8,
"eval_accuracy": 0.95625,
"eval_f1": 0.975609756097561,
"eval_loss": 0.13959212601184845,
"eval_precision": 0.9655172413793104,
"eval_recall": 0.9859154929577465,
"eval_roc_auc": 0.8540688575899843,
"eval_runtime": 4.0576,
"eval_samples_per_second": 39.432,
"eval_steps_per_second": 0.739,
"step": 78
},
{
"epoch": 39.8,
"learning_rate": 4.444444444444444e-06,
"loss": 0.1838,
"step": 80
},
{
"epoch": 39.8,
"eval_accuracy": 0.9375,
"eval_f1": 0.965034965034965,
"eval_loss": 0.15085594356060028,
"eval_precision": 0.9583333333333334,
"eval_recall": 0.971830985915493,
"eval_roc_auc": 0.8192488262910799,
"eval_runtime": 3.9857,
"eval_samples_per_second": 40.144,
"eval_steps_per_second": 0.753,
"step": 80
},
{
"epoch": 40.8,
"eval_accuracy": 0.95,
"eval_f1": 0.971830985915493,
"eval_loss": 0.15287616848945618,
"eval_precision": 0.971830985915493,
"eval_recall": 0.971830985915493,
"eval_roc_auc": 0.8748043818466354,
"eval_runtime": 5.1236,
"eval_samples_per_second": 31.228,
"eval_steps_per_second": 0.586,
"step": 82
},
{
"epoch": 41.8,
"eval_accuracy": 0.95,
"eval_f1": 0.972027972027972,
"eval_loss": 0.1505597084760666,
"eval_precision": 0.9652777777777778,
"eval_recall": 0.9788732394366197,
"eval_roc_auc": 0.850547730829421,
"eval_runtime": 4.2192,
"eval_samples_per_second": 37.921,
"eval_steps_per_second": 0.711,
"step": 84
},
{
"epoch": 42.8,
"eval_accuracy": 0.95,
"eval_f1": 0.972027972027972,
"eval_loss": 0.1549244374036789,
"eval_precision": 0.9652777777777778,
"eval_recall": 0.9788732394366197,
"eval_roc_auc": 0.850547730829421,
"eval_runtime": 3.8602,
"eval_samples_per_second": 41.448,
"eval_steps_per_second": 0.777,
"step": 86
},
{
"epoch": 43.8,
"eval_accuracy": 0.95625,
"eval_f1": 0.975609756097561,
"eval_loss": 0.13305585086345673,
"eval_precision": 0.9655172413793104,
"eval_recall": 0.9859154929577465,
"eval_roc_auc": 0.8540688575899843,
"eval_runtime": 4.2919,
"eval_samples_per_second": 37.28,
"eval_steps_per_second": 0.699,
"step": 88
},
{
"epoch": 44.8,
"learning_rate": 2.222222222222222e-06,
"loss": 0.1872,
"step": 90
},
{
"epoch": 44.8,
"eval_accuracy": 0.94375,
"eval_f1": 0.9688581314878894,
"eval_loss": 0.14087018370628357,
"eval_precision": 0.9523809523809523,
"eval_recall": 0.9859154929577465,
"eval_roc_auc": 0.7985133020344288,
"eval_runtime": 4.0748,
"eval_samples_per_second": 39.266,
"eval_steps_per_second": 0.736,
"step": 90
},
{
"epoch": 45.8,
"eval_accuracy": 0.9375,
"eval_f1": 0.965034965034965,
"eval_loss": 0.1639305055141449,
"eval_precision": 0.9583333333333334,
"eval_recall": 0.971830985915493,
"eval_roc_auc": 0.8192488262910799,
"eval_runtime": 3.9376,
"eval_samples_per_second": 40.634,
"eval_steps_per_second": 0.762,
"step": 92
},
{
"epoch": 46.8,
"eval_accuracy": 0.95,
"eval_f1": 0.9722222222222222,
"eval_loss": 0.1390833854675293,
"eval_precision": 0.958904109589041,
"eval_recall": 0.9859154929577465,
"eval_roc_auc": 0.8262910798122067,
"eval_runtime": 3.9934,
"eval_samples_per_second": 40.066,
"eval_steps_per_second": 0.751,
"step": 94
},
{
"epoch": 47.8,
"eval_accuracy": 0.95625,
"eval_f1": 0.975609756097561,
"eval_loss": 0.14361494779586792,
"eval_precision": 0.9655172413793104,
"eval_recall": 0.9859154929577465,
"eval_roc_auc": 0.8540688575899843,
"eval_runtime": 4.2477,
"eval_samples_per_second": 37.667,
"eval_steps_per_second": 0.706,
"step": 96
},
{
"epoch": 48.8,
"eval_accuracy": 0.94375,
"eval_f1": 0.9686411149825783,
"eval_loss": 0.1442493200302124,
"eval_precision": 0.9586206896551724,
"eval_recall": 0.9788732394366197,
"eval_roc_auc": 0.8227699530516432,
"eval_runtime": 4.0963,
"eval_samples_per_second": 39.059,
"eval_steps_per_second": 0.732,
"step": 98
},
{
"epoch": 49.8,
"learning_rate": 0.0,
"loss": 0.185,
"step": 100
},
{
"epoch": 49.8,
"eval_accuracy": 0.95,
"eval_f1": 0.972027972027972,
"eval_loss": 0.1484707146883011,
"eval_precision": 0.9652777777777778,
"eval_recall": 0.9788732394366197,
"eval_roc_auc": 0.850547730829421,
"eval_runtime": 3.8936,
"eval_samples_per_second": 41.093,
"eval_steps_per_second": 0.77,
"step": 100
},
{
"epoch": 49.8,
"step": 100,
"total_flos": 3.197753854288036e+17,
"train_loss": 0.3222511351108551,
"train_runtime": 425.6784,
"train_samples_per_second": 74.704,
"train_steps_per_second": 0.235
}
],
"max_steps": 100,
"num_train_epochs": 50,
"total_flos": 3.197753854288036e+17,
"trial_name": null,
"trial_params": null
}