{ "best_metric": 0.95625, "best_model_checkpoint": "resnet-18-feature-extraction/checkpoint-26", "epoch": 49.8, "global_step": 100, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.8, "eval_accuracy": 0.75, "eval_f1": 0.8412698412698413, "eval_loss": 0.6231745481491089, "eval_precision": 0.9636363636363636, "eval_recall": 0.7464788732394366, "eval_roc_auc": 0.7621283255086071, "eval_runtime": 5.3474, "eval_samples_per_second": 29.921, "eval_steps_per_second": 0.561, "step": 2 }, { "epoch": 1.8, "eval_accuracy": 0.4875, "eval_f1": 0.5940594059405941, "eval_loss": 0.6971184611320496, "eval_precision": 1.0, "eval_recall": 0.4225352112676056, "eval_roc_auc": 0.7112676056338028, "eval_runtime": 4.1245, "eval_samples_per_second": 38.792, "eval_steps_per_second": 0.727, "step": 4 }, { "epoch": 2.8, "eval_accuracy": 0.2875, "eval_f1": 0.32941176470588235, "eval_loss": 0.7914562821388245, "eval_precision": 1.0, "eval_recall": 0.19718309859154928, "eval_roc_auc": 0.5985915492957746, "eval_runtime": 4.0788, "eval_samples_per_second": 39.227, "eval_steps_per_second": 0.736, "step": 6 }, { "epoch": 3.8, "eval_accuracy": 0.2875, "eval_f1": 0.32941176470588235, "eval_loss": 0.8479948043823242, "eval_precision": 1.0, "eval_recall": 0.19718309859154928, "eval_roc_auc": 0.5985915492957746, "eval_runtime": 3.9544, "eval_samples_per_second": 40.462, "eval_steps_per_second": 0.759, "step": 8 }, { "epoch": 4.8, "learning_rate": 2e-05, "loss": 0.8651, "step": 10 }, { "epoch": 4.8, "eval_accuracy": 0.25625, "eval_f1": 0.2787878787878788, "eval_loss": 0.9093517065048218, "eval_precision": 1.0, "eval_recall": 0.1619718309859155, "eval_roc_auc": 0.5809859154929577, "eval_runtime": 4.143, "eval_samples_per_second": 38.62, "eval_steps_per_second": 0.724, "step": 10 }, { "epoch": 5.8, "eval_accuracy": 0.5625, "eval_f1": 0.6728971962616822, "eval_loss": 0.7470346689224243, "eval_precision": 1.0, "eval_recall": 0.5070422535211268, "eval_roc_auc": 0.7535211267605634, "eval_runtime": 3.9679, "eval_samples_per_second": 40.323, "eval_steps_per_second": 0.756, "step": 12 }, { "epoch": 6.8, "eval_accuracy": 0.85, "eval_f1": 0.9076923076923077, "eval_loss": 0.5915343165397644, "eval_precision": 1.0, "eval_recall": 0.8309859154929577, "eval_roc_auc": 0.9154929577464789, "eval_runtime": 4.0338, "eval_samples_per_second": 39.665, "eval_steps_per_second": 0.744, "step": 14 }, { "epoch": 7.8, "eval_accuracy": 0.8875, "eval_f1": 0.9333333333333333, "eval_loss": 0.4816938042640686, "eval_precision": 0.984375, "eval_recall": 0.8873239436619719, "eval_roc_auc": 0.8881064162754304, "eval_runtime": 4.0258, "eval_samples_per_second": 39.743, "eval_steps_per_second": 0.745, "step": 16 }, { "epoch": 8.8, "eval_accuracy": 0.91875, "eval_f1": 0.9530685920577617, "eval_loss": 0.34547853469848633, "eval_precision": 0.9777777777777777, "eval_recall": 0.9295774647887324, "eval_roc_auc": 0.881455399061033, "eval_runtime": 3.9749, "eval_samples_per_second": 40.253, "eval_steps_per_second": 0.755, "step": 18 }, { "epoch": 9.8, "learning_rate": 1.7777777777777777e-05, "loss": 0.5349, "step": 20 }, { "epoch": 9.8, "eval_accuracy": 0.91875, "eval_f1": 0.9534050179211471, "eval_loss": 0.29664501547813416, "eval_precision": 0.9708029197080292, "eval_recall": 0.9366197183098591, "eval_roc_auc": 0.8571987480438183, "eval_runtime": 4.2704, "eval_samples_per_second": 37.467, "eval_steps_per_second": 0.703, "step": 20 }, { "epoch": 10.8, "eval_accuracy": 0.95, "eval_f1": 0.972027972027972, "eval_loss": 0.23471388220787048, "eval_precision": 0.9652777777777778, "eval_recall": 0.9788732394366197, "eval_roc_auc": 0.850547730829421, "eval_runtime": 3.9069, "eval_samples_per_second": 40.953, "eval_steps_per_second": 0.768, "step": 22 }, { "epoch": 11.8, "eval_accuracy": 0.93125, "eval_f1": 0.9611307420494699, "eval_loss": 0.2467934787273407, "eval_precision": 0.9645390070921985, "eval_recall": 0.9577464788732394, "eval_roc_auc": 0.8399843505477309, "eval_runtime": 4.025, "eval_samples_per_second": 39.751, "eval_steps_per_second": 0.745, "step": 24 }, { "epoch": 12.8, "eval_accuracy": 0.95625, "eval_f1": 0.9754385964912281, "eval_loss": 0.23101434111595154, "eval_precision": 0.972027972027972, "eval_recall": 0.9788732394366197, "eval_roc_auc": 0.8783255086071988, "eval_runtime": 4.0457, "eval_samples_per_second": 39.548, "eval_steps_per_second": 0.742, "step": 26 }, { "epoch": 13.8, "eval_accuracy": 0.93125, "eval_f1": 0.9614035087719298, "eval_loss": 0.2082931101322174, "eval_precision": 0.958041958041958, "eval_recall": 0.9647887323943662, "eval_roc_auc": 0.8157276995305165, "eval_runtime": 4.0645, "eval_samples_per_second": 39.366, "eval_steps_per_second": 0.738, "step": 28 }, { "epoch": 14.8, "learning_rate": 1.555555555555556e-05, "loss": 0.3593, "step": 30 }, { "epoch": 14.8, "eval_accuracy": 0.9375, "eval_f1": 0.9652777777777778, "eval_loss": 0.18395133316516876, "eval_precision": 0.952054794520548, "eval_recall": 0.9788732394366197, "eval_roc_auc": 0.7949921752738655, "eval_runtime": 3.8518, "eval_samples_per_second": 41.539, "eval_steps_per_second": 0.779, "step": 30 }, { "epoch": 15.8, "eval_accuracy": 0.9375, "eval_f1": 0.9647887323943662, "eval_loss": 0.19472570717334747, "eval_precision": 0.9647887323943662, "eval_recall": 0.9647887323943662, "eval_roc_auc": 0.8435054773082942, "eval_runtime": 4.1431, "eval_samples_per_second": 38.618, "eval_steps_per_second": 0.724, "step": 32 }, { "epoch": 16.8, "eval_accuracy": 0.93125, "eval_f1": 0.9616724738675958, "eval_loss": 0.1836571842432022, "eval_precision": 0.9517241379310345, "eval_recall": 0.971830985915493, "eval_roc_auc": 0.7914710485133021, "eval_runtime": 4.0848, "eval_samples_per_second": 39.17, "eval_steps_per_second": 0.734, "step": 34 }, { "epoch": 17.8, "eval_accuracy": 0.94375, "eval_f1": 0.9688581314878894, "eval_loss": 0.1819494664669037, "eval_precision": 0.9523809523809523, "eval_recall": 0.9859154929577465, "eval_roc_auc": 0.7985133020344288, "eval_runtime": 3.9897, "eval_samples_per_second": 40.104, "eval_steps_per_second": 0.752, "step": 36 }, { "epoch": 18.8, "eval_accuracy": 0.94375, "eval_f1": 0.968421052631579, "eval_loss": 0.19235201179981232, "eval_precision": 0.965034965034965, "eval_recall": 0.971830985915493, "eval_roc_auc": 0.8470266040688575, "eval_runtime": 4.041, "eval_samples_per_second": 39.594, "eval_steps_per_second": 0.742, "step": 38 }, { "epoch": 19.8, "learning_rate": 1.3333333333333333e-05, "loss": 0.2737, "step": 40 }, { "epoch": 19.8, "eval_accuracy": 0.95, "eval_f1": 0.972027972027972, "eval_loss": 0.1990378201007843, "eval_precision": 0.9652777777777778, "eval_recall": 0.9788732394366197, "eval_roc_auc": 0.850547730829421, "eval_runtime": 4.1236, "eval_samples_per_second": 38.801, "eval_steps_per_second": 0.728, "step": 40 }, { "epoch": 20.8, "eval_accuracy": 0.95, "eval_f1": 0.971830985915493, "eval_loss": 0.1758503019809723, "eval_precision": 0.971830985915493, "eval_recall": 0.971830985915493, "eval_roc_auc": 0.8748043818466354, "eval_runtime": 4.1193, "eval_samples_per_second": 38.841, "eval_steps_per_second": 0.728, "step": 42 }, { "epoch": 21.8, "eval_accuracy": 0.93125, "eval_f1": 0.9616724738675958, "eval_loss": 0.18040268123149872, "eval_precision": 0.9517241379310345, "eval_recall": 0.971830985915493, "eval_roc_auc": 0.7914710485133021, "eval_runtime": 3.8662, "eval_samples_per_second": 41.384, "eval_steps_per_second": 0.776, "step": 44 }, { "epoch": 22.8, "eval_accuracy": 0.93125, "eval_f1": 0.9616724738675958, "eval_loss": 0.16663400828838348, "eval_precision": 0.9517241379310345, "eval_recall": 0.971830985915493, "eval_roc_auc": 0.7914710485133021, "eval_runtime": 4.3016, "eval_samples_per_second": 37.195, "eval_steps_per_second": 0.697, "step": 46 }, { "epoch": 23.8, "eval_accuracy": 0.94375, "eval_f1": 0.9688581314878894, "eval_loss": 0.15337304770946503, "eval_precision": 0.9523809523809523, "eval_recall": 0.9859154929577465, "eval_roc_auc": 0.7985133020344288, "eval_runtime": 4.0456, "eval_samples_per_second": 39.549, "eval_steps_per_second": 0.742, "step": 48 }, { "epoch": 24.8, "learning_rate": 1.1111111111111113e-05, "loss": 0.2278, "step": 50 }, { "epoch": 24.8, "eval_accuracy": 0.9375, "eval_f1": 0.9652777777777778, "eval_loss": 0.16116251051425934, "eval_precision": 0.952054794520548, "eval_recall": 0.9788732394366197, "eval_roc_auc": 0.7949921752738655, "eval_runtime": 4.0452, "eval_samples_per_second": 39.553, "eval_steps_per_second": 0.742, "step": 50 }, { "epoch": 25.8, "eval_accuracy": 0.94375, "eval_f1": 0.9686411149825783, "eval_loss": 0.15349864959716797, "eval_precision": 0.9586206896551724, "eval_recall": 0.9788732394366197, "eval_roc_auc": 0.8227699530516432, "eval_runtime": 6.0991, "eval_samples_per_second": 26.233, "eval_steps_per_second": 0.492, "step": 52 }, { "epoch": 26.8, "eval_accuracy": 0.94375, "eval_f1": 0.9681978798586572, "eval_loss": 0.1568022519350052, "eval_precision": 0.9716312056737588, "eval_recall": 0.9647887323943662, "eval_roc_auc": 0.871283255086072, "eval_runtime": 4.0891, "eval_samples_per_second": 39.128, "eval_steps_per_second": 0.734, "step": 54 }, { "epoch": 27.8, "eval_accuracy": 0.9375, "eval_f1": 0.9645390070921985, "eval_loss": 0.21069078147411346, "eval_precision": 0.9714285714285714, "eval_recall": 0.9577464788732394, "eval_roc_auc": 0.8677621283255086, "eval_runtime": 4.1257, "eval_samples_per_second": 38.781, "eval_steps_per_second": 0.727, "step": 56 }, { "epoch": 28.8, "eval_accuracy": 0.93125, "eval_f1": 0.9616724738675958, "eval_loss": 0.15922358632087708, "eval_precision": 0.9517241379310345, "eval_recall": 0.971830985915493, "eval_roc_auc": 0.7914710485133021, "eval_runtime": 3.944, "eval_samples_per_second": 40.568, "eval_steps_per_second": 0.761, "step": 58 }, { "epoch": 29.8, "learning_rate": 8.888888888888888e-06, "loss": 0.2057, "step": 60 }, { "epoch": 29.8, "eval_accuracy": 0.9375, "eval_f1": 0.9647887323943662, "eval_loss": 0.15567776560783386, "eval_precision": 0.9647887323943662, "eval_recall": 0.9647887323943662, "eval_roc_auc": 0.8435054773082942, "eval_runtime": 3.9386, "eval_samples_per_second": 40.624, "eval_steps_per_second": 0.762, "step": 60 }, { "epoch": 30.8, "eval_accuracy": 0.94375, "eval_f1": 0.968421052631579, "eval_loss": 0.1714434176683426, "eval_precision": 0.965034965034965, "eval_recall": 0.971830985915493, "eval_roc_auc": 0.8470266040688575, "eval_runtime": 4.1925, "eval_samples_per_second": 38.164, "eval_steps_per_second": 0.716, "step": 62 }, { "epoch": 31.8, "eval_accuracy": 0.95, "eval_f1": 0.972027972027972, "eval_loss": 0.15714499354362488, "eval_precision": 0.9652777777777778, "eval_recall": 0.9788732394366197, "eval_roc_auc": 0.850547730829421, "eval_runtime": 4.3684, "eval_samples_per_second": 36.627, "eval_steps_per_second": 0.687, "step": 64 }, { "epoch": 32.8, "eval_accuracy": 0.9375, "eval_f1": 0.965034965034965, "eval_loss": 0.15739548206329346, "eval_precision": 0.9583333333333334, "eval_recall": 0.971830985915493, "eval_roc_auc": 0.8192488262910799, "eval_runtime": 3.9613, "eval_samples_per_second": 40.39, "eval_steps_per_second": 0.757, "step": 66 }, { "epoch": 33.8, "eval_accuracy": 0.95625, "eval_f1": 0.9754385964912281, "eval_loss": 0.1422826498746872, "eval_precision": 0.972027972027972, "eval_recall": 0.9788732394366197, "eval_roc_auc": 0.8783255086071988, "eval_runtime": 3.9825, "eval_samples_per_second": 40.175, "eval_steps_per_second": 0.753, "step": 68 }, { "epoch": 34.8, "learning_rate": 6.666666666666667e-06, "loss": 0.2, "step": 70 }, { "epoch": 34.8, "eval_accuracy": 0.94375, "eval_f1": 0.968421052631579, "eval_loss": 0.16770192980766296, "eval_precision": 0.965034965034965, "eval_recall": 0.971830985915493, "eval_roc_auc": 0.8470266040688575, "eval_runtime": 4.1697, "eval_samples_per_second": 38.372, "eval_steps_per_second": 0.719, "step": 70 }, { "epoch": 35.8, "eval_accuracy": 0.9375, "eval_f1": 0.965034965034965, "eval_loss": 0.1559743881225586, "eval_precision": 0.9583333333333334, "eval_recall": 0.971830985915493, "eval_roc_auc": 0.8192488262910799, "eval_runtime": 4.0897, "eval_samples_per_second": 39.123, "eval_steps_per_second": 0.734, "step": 72 }, { "epoch": 36.8, "eval_accuracy": 0.9375, "eval_f1": 0.9652777777777778, "eval_loss": 0.15941758453845978, "eval_precision": 0.952054794520548, "eval_recall": 0.9788732394366197, "eval_roc_auc": 0.7949921752738655, "eval_runtime": 4.0474, "eval_samples_per_second": 39.531, "eval_steps_per_second": 0.741, "step": 74 }, { "epoch": 37.8, "eval_accuracy": 0.94375, "eval_f1": 0.9686411149825783, "eval_loss": 0.15121030807495117, "eval_precision": 0.9586206896551724, "eval_recall": 0.9788732394366197, "eval_roc_auc": 0.8227699530516432, "eval_runtime": 4.2667, "eval_samples_per_second": 37.499, "eval_steps_per_second": 0.703, "step": 76 }, { "epoch": 38.8, "eval_accuracy": 0.95625, "eval_f1": 0.975609756097561, "eval_loss": 0.13959212601184845, "eval_precision": 0.9655172413793104, "eval_recall": 0.9859154929577465, "eval_roc_auc": 0.8540688575899843, "eval_runtime": 4.0576, "eval_samples_per_second": 39.432, "eval_steps_per_second": 0.739, "step": 78 }, { "epoch": 39.8, "learning_rate": 4.444444444444444e-06, "loss": 0.1838, "step": 80 }, { "epoch": 39.8, "eval_accuracy": 0.9375, "eval_f1": 0.965034965034965, "eval_loss": 0.15085594356060028, "eval_precision": 0.9583333333333334, "eval_recall": 0.971830985915493, "eval_roc_auc": 0.8192488262910799, "eval_runtime": 3.9857, "eval_samples_per_second": 40.144, "eval_steps_per_second": 0.753, "step": 80 }, { "epoch": 40.8, "eval_accuracy": 0.95, "eval_f1": 0.971830985915493, "eval_loss": 0.15287616848945618, "eval_precision": 0.971830985915493, "eval_recall": 0.971830985915493, "eval_roc_auc": 0.8748043818466354, "eval_runtime": 5.1236, "eval_samples_per_second": 31.228, "eval_steps_per_second": 0.586, "step": 82 }, { "epoch": 41.8, "eval_accuracy": 0.95, "eval_f1": 0.972027972027972, "eval_loss": 0.1505597084760666, "eval_precision": 0.9652777777777778, "eval_recall": 0.9788732394366197, "eval_roc_auc": 0.850547730829421, "eval_runtime": 4.2192, "eval_samples_per_second": 37.921, "eval_steps_per_second": 0.711, "step": 84 }, { "epoch": 42.8, "eval_accuracy": 0.95, "eval_f1": 0.972027972027972, "eval_loss": 0.1549244374036789, "eval_precision": 0.9652777777777778, "eval_recall": 0.9788732394366197, "eval_roc_auc": 0.850547730829421, "eval_runtime": 3.8602, "eval_samples_per_second": 41.448, "eval_steps_per_second": 0.777, "step": 86 }, { "epoch": 43.8, "eval_accuracy": 0.95625, "eval_f1": 0.975609756097561, "eval_loss": 0.13305585086345673, "eval_precision": 0.9655172413793104, "eval_recall": 0.9859154929577465, "eval_roc_auc": 0.8540688575899843, "eval_runtime": 4.2919, "eval_samples_per_second": 37.28, "eval_steps_per_second": 0.699, "step": 88 }, { "epoch": 44.8, "learning_rate": 2.222222222222222e-06, "loss": 0.1872, "step": 90 }, { "epoch": 44.8, "eval_accuracy": 0.94375, "eval_f1": 0.9688581314878894, "eval_loss": 0.14087018370628357, "eval_precision": 0.9523809523809523, "eval_recall": 0.9859154929577465, "eval_roc_auc": 0.7985133020344288, "eval_runtime": 4.0748, "eval_samples_per_second": 39.266, "eval_steps_per_second": 0.736, "step": 90 }, { "epoch": 45.8, "eval_accuracy": 0.9375, "eval_f1": 0.965034965034965, "eval_loss": 0.1639305055141449, "eval_precision": 0.9583333333333334, "eval_recall": 0.971830985915493, "eval_roc_auc": 0.8192488262910799, "eval_runtime": 3.9376, "eval_samples_per_second": 40.634, "eval_steps_per_second": 0.762, "step": 92 }, { "epoch": 46.8, "eval_accuracy": 0.95, "eval_f1": 0.9722222222222222, "eval_loss": 0.1390833854675293, "eval_precision": 0.958904109589041, "eval_recall": 0.9859154929577465, "eval_roc_auc": 0.8262910798122067, "eval_runtime": 3.9934, "eval_samples_per_second": 40.066, "eval_steps_per_second": 0.751, "step": 94 }, { "epoch": 47.8, "eval_accuracy": 0.95625, "eval_f1": 0.975609756097561, "eval_loss": 0.14361494779586792, "eval_precision": 0.9655172413793104, "eval_recall": 0.9859154929577465, "eval_roc_auc": 0.8540688575899843, "eval_runtime": 4.2477, "eval_samples_per_second": 37.667, "eval_steps_per_second": 0.706, "step": 96 }, { "epoch": 48.8, "eval_accuracy": 0.94375, "eval_f1": 0.9686411149825783, "eval_loss": 0.1442493200302124, "eval_precision": 0.9586206896551724, "eval_recall": 0.9788732394366197, "eval_roc_auc": 0.8227699530516432, "eval_runtime": 4.0963, "eval_samples_per_second": 39.059, "eval_steps_per_second": 0.732, "step": 98 }, { "epoch": 49.8, "learning_rate": 0.0, "loss": 0.185, "step": 100 }, { "epoch": 49.8, "eval_accuracy": 0.95, "eval_f1": 0.972027972027972, "eval_loss": 0.1484707146883011, "eval_precision": 0.9652777777777778, "eval_recall": 0.9788732394366197, "eval_roc_auc": 0.850547730829421, "eval_runtime": 3.8936, "eval_samples_per_second": 41.093, "eval_steps_per_second": 0.77, "step": 100 }, { "epoch": 49.8, "step": 100, "total_flos": 3.197753854288036e+17, "train_loss": 0.3222511351108551, "train_runtime": 425.6784, "train_samples_per_second": 74.704, "train_steps_per_second": 0.235 } ], "max_steps": 100, "num_train_epochs": 50, "total_flos": 3.197753854288036e+17, "trial_name": null, "trial_params": null }