{ "best_metric": 0.42085567116737366, "best_model_checkpoint": "google/vit-base-patch16-224-in21k_covid_19_ct_scans/checkpoint-2394", "epoch": 100.0, "eval_steps": 500, "global_step": 26600, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0037593984962406013, "grad_norm": 3.3277029991149902, "learning_rate": 0.00019999248120300753, "loss": 0.768, "step": 1 }, { "epoch": 1.0, "eval_AUC": 0.5, "eval_F1": 0.45505906522855677, "eval_Precision": 0.8350612629594723, "eval_Recall": 1.0, "eval_accuracy": 0.8350612629594723, "eval_loss": 0.45460373163223267, "eval_runtime": 23.809, "eval_samples_per_second": 44.563, "eval_steps_per_second": 2.814, "step": 266 }, { "epoch": 1.8796992481203008, "grad_norm": 0.9518311023712158, "learning_rate": 0.0001962406015037594, "loss": 0.4516, "step": 500 }, { "epoch": 2.0, "eval_AUC": 0.5, "eval_F1": 0.45505906522855677, "eval_Precision": 0.8350612629594723, "eval_Recall": 1.0, "eval_accuracy": 0.8350612629594723, "eval_loss": 0.449796199798584, "eval_runtime": 12.1544, "eval_samples_per_second": 87.293, "eval_steps_per_second": 5.512, "step": 532 }, { "epoch": 3.0, "eval_AUC": 0.5, "eval_F1": 0.45505906522855677, "eval_Precision": 0.8350612629594723, "eval_Recall": 1.0, "eval_accuracy": 0.8350612629594723, "eval_loss": 0.4491786062717438, "eval_runtime": 12.1586, "eval_samples_per_second": 87.263, "eval_steps_per_second": 5.51, "step": 798 }, { "epoch": 3.7593984962406015, "grad_norm": 0.6577199101448059, "learning_rate": 0.0001924812030075188, "loss": 0.4521, "step": 1000 }, { "epoch": 4.0, "eval_AUC": 0.5, "eval_F1": 0.45505906522855677, "eval_Precision": 0.8350612629594723, "eval_Recall": 1.0, "eval_accuracy": 0.8350612629594723, "eval_loss": 0.44855841994285583, "eval_runtime": 12.3395, "eval_samples_per_second": 85.984, "eval_steps_per_second": 5.43, "step": 1064 }, { "epoch": 5.0, "eval_AUC": 0.5, "eval_F1": 0.45505906522855677, "eval_Precision": 0.8350612629594723, "eval_Recall": 1.0, "eval_accuracy": 0.8350612629594723, "eval_loss": 0.44568774104118347, "eval_runtime": 12.3116, "eval_samples_per_second": 86.179, "eval_steps_per_second": 5.442, "step": 1330 }, { "epoch": 5.639097744360902, "grad_norm": 0.03062070906162262, "learning_rate": 0.00018872180451127822, "loss": 0.4415, "step": 1500 }, { "epoch": 6.0, "eval_AUC": 0.5, "eval_F1": 0.45505906522855677, "eval_Precision": 0.8350612629594723, "eval_Recall": 1.0, "eval_accuracy": 0.8350612629594723, "eval_loss": 0.4421917796134949, "eval_runtime": 11.8255, "eval_samples_per_second": 89.721, "eval_steps_per_second": 5.666, "step": 1596 }, { "epoch": 7.0, "eval_AUC": 0.5, "eval_F1": 0.45505906522855677, "eval_Precision": 0.8350612629594723, "eval_Recall": 1.0, "eval_accuracy": 0.8350612629594723, "eval_loss": 0.42494845390319824, "eval_runtime": 11.7622, "eval_samples_per_second": 90.204, "eval_steps_per_second": 5.696, "step": 1862 }, { "epoch": 7.518796992481203, "grad_norm": 0.4491100311279297, "learning_rate": 0.0001849624060150376, "loss": 0.4344, "step": 2000 }, { "epoch": 8.0, "eval_AUC": 0.5183424701709126, "eval_F1": 0.4965715075876916, "eval_Precision": 0.8401913875598086, "eval_Recall": 0.9909706546275395, "eval_accuracy": 0.8350612629594723, "eval_loss": 0.4643925130367279, "eval_runtime": 12.3543, "eval_samples_per_second": 85.881, "eval_steps_per_second": 5.423, "step": 2128 }, { "epoch": 9.0, "eval_AUC": 0.5354853273137697, "eval_F1": 0.5271698859516118, "eval_Precision": 0.8450433108758422, "eval_Recall": 0.9909706546275395, "eval_accuracy": 0.8407163053722903, "eval_loss": 0.42085567116737366, "eval_runtime": 12.5156, "eval_samples_per_second": 84.774, "eval_steps_per_second": 5.353, "step": 2394 }, { "epoch": 9.398496240601503, "grad_norm": 0.23315227031707764, "learning_rate": 0.000181203007518797, "loss": 0.3848, "step": 2500 }, { "epoch": 10.0, "eval_AUC": 0.6642373427926476, "eval_F1": 0.6571900744677727, "eval_Precision": 0.8904267589388697, "eval_Recall": 0.871331828442438, "eval_accuracy": 0.8030160226201697, "eval_loss": 0.4335523247718811, "eval_runtime": 12.0639, "eval_samples_per_second": 87.948, "eval_steps_per_second": 5.554, "step": 2660 }, { "epoch": 11.0, "eval_AUC": 0.6386617220251531, "eval_F1": 0.6595258665704602, "eval_Precision": 0.8777660695468915, "eval_Recall": 0.9401805869074492, "eval_accuracy": 0.8407163053722903, "eval_loss": 0.43072912096977234, "eval_runtime": 11.6338, "eval_samples_per_second": 91.2, "eval_steps_per_second": 5.759, "step": 2926 }, { "epoch": 11.278195488721805, "grad_norm": 0.8828286528587341, "learning_rate": 0.0001774436090225564, "loss": 0.2882, "step": 3000 }, { "epoch": 12.0, "eval_AUC": 0.7007449209932279, "eval_F1": 0.6913138583881986, "eval_Precision": 0.9028901734104047, "eval_Recall": 0.881489841986456, "eval_accuracy": 0.82186616399623, "eval_loss": 0.5094270706176758, "eval_runtime": 12.013, "eval_samples_per_second": 88.321, "eval_steps_per_second": 5.577, "step": 3192 }, { "epoch": 13.0, "eval_AUC": 0.6362624959690422, "eval_F1": 0.6636744500641045, "eval_Precision": 0.8761609907120743, "eval_Recall": 0.9582392776523702, "eval_accuracy": 0.8520263901979265, "eval_loss": 0.46198517084121704, "eval_runtime": 11.833, "eval_samples_per_second": 89.665, "eval_steps_per_second": 5.662, "step": 3458 }, { "epoch": 13.157894736842104, "grad_norm": 0.10690835863351822, "learning_rate": 0.0001736842105263158, "loss": 0.1654, "step": 3500 }, { "epoch": 14.0, "eval_AUC": 0.7246952595936795, "eval_F1": 0.7141794985075913, "eval_Precision": 0.9109826589595376, "eval_Recall": 0.8893905191873589, "eval_accuracy": 0.8350612629594723, "eval_loss": 0.58914715051651, "eval_runtime": 12.2166, "eval_samples_per_second": 86.849, "eval_steps_per_second": 5.484, "step": 3724 }, { "epoch": 15.0, "eval_AUC": 0.6827894227668494, "eval_F1": 0.6940221645449677, "eval_Precision": 0.893640350877193, "eval_Recall": 0.9198645598194131, "eval_accuracy": 0.8416588124410933, "eval_loss": 0.5601742267608643, "eval_runtime": 12.0344, "eval_samples_per_second": 88.164, "eval_steps_per_second": 5.567, "step": 3990 }, { "epoch": 15.037593984962406, "grad_norm": 0.1679229587316513, "learning_rate": 0.0001699248120300752, "loss": 0.0868, "step": 4000 }, { "epoch": 16.0, "eval_AUC": 0.6785198323121573, "eval_F1": 0.7114280962304207, "eval_Precision": 0.8894681960375391, "eval_Recall": 0.9627539503386005, "eval_accuracy": 0.8689915174363808, "eval_loss": 0.5927982926368713, "eval_runtime": 11.7748, "eval_samples_per_second": 90.107, "eval_steps_per_second": 5.69, "step": 4256 }, { "epoch": 16.917293233082706, "grad_norm": 0.02159872278571129, "learning_rate": 0.00016616541353383458, "loss": 0.045, "step": 4500 }, { "epoch": 17.0, "eval_AUC": 0.7072331505965818, "eval_F1": 0.7268478980719824, "eval_Precision": 0.9005405405405406, "eval_Recall": 0.9401805869074492, "eval_accuracy": 0.8633364750235627, "eval_loss": 0.6153913140296936, "eval_runtime": 11.9361, "eval_samples_per_second": 88.89, "eval_steps_per_second": 5.613, "step": 4522 }, { "epoch": 18.0, "eval_AUC": 0.7169332473395679, "eval_F1": 0.7369669924918544, "eval_Precision": 0.9036796536796536, "eval_Recall": 0.9424379232505643, "eval_accuracy": 0.8680490103675778, "eval_loss": 0.6357868909835815, "eval_runtime": 11.728, "eval_samples_per_second": 90.467, "eval_steps_per_second": 5.713, "step": 4788 }, { "epoch": 18.796992481203006, "grad_norm": 0.00539048295468092, "learning_rate": 0.00016240601503759398, "loss": 0.021, "step": 5000 }, { "epoch": 19.0, "eval_AUC": 0.7422960335375686, "eval_F1": 0.737905217953103, "eval_Precision": 0.9157175398633257, "eval_Recall": 0.90744920993228, "eval_accuracy": 0.8529688972667295, "eval_loss": 0.8246906399726868, "eval_runtime": 11.7691, "eval_samples_per_second": 90.151, "eval_steps_per_second": 5.693, "step": 5054 }, { "epoch": 20.0, "eval_AUC": 0.7228603676233473, "eval_F1": 0.7228603676233474, "eval_Precision": 0.9085778781038375, "eval_Recall": 0.9085778781038375, "eval_accuracy": 0.8473138548539114, "eval_loss": 0.9930059909820557, "eval_runtime": 11.643, "eval_samples_per_second": 91.128, "eval_steps_per_second": 5.755, "step": 5320 }, { "epoch": 20.67669172932331, "grad_norm": 1.4996395111083984, "learning_rate": 0.0001586466165413534, "loss": 0.0136, "step": 5500 }, { "epoch": 21.0, "eval_AUC": 0.7037762012254112, "eval_F1": 0.7262231926161842, "eval_Precision": 0.8990332975295381, "eval_Recall": 0.9446952595936795, "eval_accuracy": 0.8652214891611687, "eval_loss": 0.5600523352622986, "eval_runtime": 11.6192, "eval_samples_per_second": 91.315, "eval_steps_per_second": 5.766, "step": 5586 }, { "epoch": 22.0, "eval_AUC": 0.6561560786842955, "eval_F1": 0.6934912580385852, "eval_Precision": 0.8816326530612245, "eval_Recall": 0.9751693002257337, "eval_accuracy": 0.8699340245051838, "eval_loss": 0.64747554063797, "eval_runtime": 11.5363, "eval_samples_per_second": 91.971, "eval_steps_per_second": 5.808, "step": 5852 }, { "epoch": 22.55639097744361, "grad_norm": 0.029281923547387123, "learning_rate": 0.0001548872180451128, "loss": 0.0464, "step": 6000 }, { "epoch": 23.0, "eval_AUC": 0.7170396646243147, "eval_F1": 0.7272862554112554, "eval_Precision": 0.9050772626931567, "eval_Recall": 0.9255079006772009, "eval_accuracy": 0.8567389255419415, "eval_loss": 0.5766553282737732, "eval_runtime": 11.6613, "eval_samples_per_second": 90.984, "eval_steps_per_second": 5.745, "step": 6118 }, { "epoch": 24.0, "eval_AUC": 0.7451886488229603, "eval_F1": 0.736944199717763, "eval_Precision": 0.9173363949483353, "eval_Recall": 0.9018058690744921, "eval_accuracy": 0.8501413760603205, "eval_loss": 0.7393656373023987, "eval_runtime": 11.8414, "eval_samples_per_second": 89.601, "eval_steps_per_second": 5.658, "step": 6384 }, { "epoch": 24.43609022556391, "grad_norm": 0.0072451187297701836, "learning_rate": 0.00015112781954887218, "loss": 0.0438, "step": 6500 }, { "epoch": 25.0, "eval_AUC": 0.6412705578845533, "eval_F1": 0.6781337216357238, "eval_Precision": 0.8767676767676768, "eval_Recall": 0.9796839729119639, "eval_accuracy": 0.8680490103675778, "eval_loss": 0.762208878993988, "eval_runtime": 11.8755, "eval_samples_per_second": 89.344, "eval_steps_per_second": 5.642, "step": 6650 }, { "epoch": 26.0, "eval_AUC": 0.7167913576265721, "eval_F1": 0.7509163334545014, "eval_Precision": 0.9018987341772152, "eval_Recall": 0.9650112866817155, "eval_accuracy": 0.883129123468426, "eval_loss": 0.7616934180259705, "eval_runtime": 11.673, "eval_samples_per_second": 90.893, "eval_steps_per_second": 5.74, "step": 6916 }, { "epoch": 26.31578947368421, "grad_norm": 0.005205586086958647, "learning_rate": 0.00014736842105263158, "loss": 0.0126, "step": 7000 }, { "epoch": 27.0, "eval_AUC": 0.7227184779103515, "eval_F1": 0.7354277398991624, "eval_Precision": 0.9065934065934066, "eval_Recall": 0.9311512415349887, "eval_accuracy": 0.8623939679547596, "eval_loss": 0.8840720653533936, "eval_runtime": 12.2613, "eval_samples_per_second": 86.533, "eval_steps_per_second": 5.464, "step": 7182 }, { "epoch": 28.0, "eval_AUC": 0.7300193485972267, "eval_F1": 0.7543650900476486, "eval_Precision": 0.907427341227126, "eval_Recall": 0.9514672686230248, "eval_accuracy": 0.8784165881244109, "eval_loss": 0.7538221478462219, "eval_runtime": 11.7032, "eval_samples_per_second": 90.659, "eval_steps_per_second": 5.725, "step": 7448 }, { "epoch": 28.195488721804512, "grad_norm": 0.03350173309445381, "learning_rate": 0.000143609022556391, "loss": 0.016, "step": 7500 }, { "epoch": 29.0, "eval_AUC": 0.6320638503708481, "eval_F1": 0.6709177157453019, "eval_Precision": 0.8735059760956175, "eval_Recall": 0.989841986455982, "eval_accuracy": 0.8718190386427899, "eval_loss": 0.7105740308761597, "eval_runtime": 11.7867, "eval_samples_per_second": 90.017, "eval_steps_per_second": 5.684, "step": 7714 }, { "epoch": 30.0, "eval_AUC": 0.689348597226701, "eval_F1": 0.72511658580244, "eval_Precision": 0.8927083333333333, "eval_Recall": 0.9672686230248307, "eval_accuracy": 0.8755890669180019, "eval_loss": 0.6111597418785095, "eval_runtime": 11.7504, "eval_samples_per_second": 90.295, "eval_steps_per_second": 5.702, "step": 7980 }, { "epoch": 30.075187969924812, "grad_norm": 0.013551408424973488, "learning_rate": 0.0001398496240601504, "loss": 0.0384, "step": 8000 }, { "epoch": 31.0, "eval_AUC": 0.6887487907126733, "eval_F1": 0.7271465907527794, "eval_Precision": 0.8922279792746114, "eval_Recall": 0.9717832957110609, "eval_accuracy": 0.8784165881244109, "eval_loss": 0.5990052223205566, "eval_runtime": 11.854, "eval_samples_per_second": 89.506, "eval_steps_per_second": 5.652, "step": 8246 }, { "epoch": 31.954887218045112, "grad_norm": 0.10003461688756943, "learning_rate": 0.0001360902255639098, "loss": 0.0276, "step": 8500 }, { "epoch": 32.0, "eval_AUC": 0.699577555627217, "eval_F1": 0.741136709063275, "eval_Precision": 0.8954451345755694, "eval_Recall": 0.9762979683972912, "eval_accuracy": 0.8850141376060321, "eval_loss": 0.6617034673690796, "eval_runtime": 11.7353, "eval_samples_per_second": 90.411, "eval_steps_per_second": 5.709, "step": 8512 }, { "epoch": 33.0, "eval_AUC": 0.7190132215414382, "eval_F1": 0.7599135442188549, "eval_Precision": 0.9018789144050104, "eval_Recall": 0.9751693002257337, "eval_accuracy": 0.8906691800188501, "eval_loss": 0.7068904042243958, "eval_runtime": 11.6304, "eval_samples_per_second": 91.226, "eval_steps_per_second": 5.761, "step": 8778 }, { "epoch": 33.83458646616541, "grad_norm": 0.00604345602914691, "learning_rate": 0.00013233082706766918, "loss": 0.0109, "step": 9000 }, { "epoch": 34.0, "eval_AUC": 0.6566849403418252, "eval_F1": 0.6974271887335782, "eval_Precision": 0.8814589665653495, "eval_Recall": 0.981941309255079, "eval_accuracy": 0.8746465598491989, "eval_loss": 0.8042259812355042, "eval_runtime": 11.739, "eval_samples_per_second": 90.382, "eval_steps_per_second": 5.707, "step": 9044 }, { "epoch": 35.0, "eval_AUC": 0.6961560786842954, "eval_F1": 0.7368930485561156, "eval_Precision": 0.8944099378881988, "eval_Recall": 0.9751693002257337, "eval_accuracy": 0.883129123468426, "eval_loss": 0.7705923914909363, "eval_runtime": 11.6824, "eval_samples_per_second": 90.821, "eval_steps_per_second": 5.735, "step": 9310 }, { "epoch": 35.714285714285715, "grad_norm": 0.0020399852655828, "learning_rate": 0.00012857142857142858, "loss": 0.0028, "step": 9500 }, { "epoch": 36.0, "eval_AUC": 0.712170267655595, "eval_F1": 0.7516347009160568, "eval_Precision": 0.8997912317327766, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8868991517436381, "eval_loss": 0.8394030928611755, "eval_runtime": 11.8855, "eval_samples_per_second": 89.268, "eval_steps_per_second": 5.637, "step": 9576 }, { "epoch": 37.0, "eval_AUC": 0.7087487907126733, "eval_F1": 0.7474952792646576, "eval_Precision": 0.8987473903966597, "eval_Recall": 0.9717832957110609, "eval_accuracy": 0.8850141376060321, "eval_loss": 0.8953573107719421, "eval_runtime": 11.8186, "eval_samples_per_second": 89.774, "eval_steps_per_second": 5.669, "step": 9842 }, { "epoch": 37.59398496240601, "grad_norm": 0.0010929929558187723, "learning_rate": 0.00012481203007518797, "loss": 0.0076, "step": 10000 }, { "epoch": 38.0, "eval_AUC": 0.7087487907126733, "eval_F1": 0.7474952792646576, "eval_Precision": 0.8987473903966597, "eval_Recall": 0.9717832957110609, "eval_accuracy": 0.8850141376060321, "eval_loss": 0.9388997554779053, "eval_runtime": 11.6255, "eval_samples_per_second": 91.265, "eval_steps_per_second": 5.763, "step": 10108 }, { "epoch": 39.0, "eval_AUC": 0.7087487907126733, "eval_F1": 0.7474952792646576, "eval_Precision": 0.8987473903966597, "eval_Recall": 0.9717832957110609, "eval_accuracy": 0.8850141376060321, "eval_loss": 0.9697290062904358, "eval_runtime": 11.5778, "eval_samples_per_second": 91.641, "eval_steps_per_second": 5.787, "step": 10374 }, { "epoch": 39.473684210526315, "grad_norm": 0.0006237945053726435, "learning_rate": 0.00012105263157894738, "loss": 0.0001, "step": 10500 }, { "epoch": 40.0, "eval_AUC": 0.7087487907126733, "eval_F1": 0.7474952792646576, "eval_Precision": 0.8987473903966597, "eval_Recall": 0.9717832957110609, "eval_accuracy": 0.8850141376060321, "eval_loss": 0.9953697323799133, "eval_runtime": 11.7777, "eval_samples_per_second": 90.086, "eval_steps_per_second": 5.689, "step": 10640 }, { "epoch": 41.0, "eval_AUC": 0.7087487907126733, "eval_F1": 0.7474952792646576, "eval_Precision": 0.8987473903966597, "eval_Recall": 0.9717832957110609, "eval_accuracy": 0.8850141376060321, "eval_loss": 1.0168683528900146, "eval_runtime": 11.7874, "eval_samples_per_second": 90.011, "eval_steps_per_second": 5.684, "step": 10906 }, { "epoch": 41.35338345864662, "grad_norm": 0.000347771099768579, "learning_rate": 0.00011729323308270677, "loss": 0.0, "step": 11000 }, { "epoch": 42.0, "eval_AUC": 0.7093131247984521, "eval_F1": 0.7487971197401504, "eval_Precision": 0.8988529718456726, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.885956644674835, "eval_loss": 1.038093090057373, "eval_runtime": 11.6656, "eval_samples_per_second": 90.951, "eval_steps_per_second": 5.743, "step": 11172 }, { "epoch": 43.0, "eval_AUC": 0.7093131247984521, "eval_F1": 0.7487971197401504, "eval_Precision": 0.8988529718456726, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.885956644674835, "eval_loss": 1.0582064390182495, "eval_runtime": 11.7863, "eval_samples_per_second": 90.019, "eval_steps_per_second": 5.685, "step": 11438 }, { "epoch": 43.233082706766915, "grad_norm": 0.00026405107928439975, "learning_rate": 0.00011353383458646618, "loss": 0.0, "step": 11500 }, { "epoch": 44.0, "eval_AUC": 0.7093131247984521, "eval_F1": 0.7487971197401504, "eval_Precision": 0.8988529718456726, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.885956644674835, "eval_loss": 1.0762717723846436, "eval_runtime": 11.6351, "eval_samples_per_second": 91.189, "eval_steps_per_second": 5.758, "step": 11704 }, { "epoch": 45.0, "eval_AUC": 0.7093131247984521, "eval_F1": 0.7487971197401504, "eval_Precision": 0.8988529718456726, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.885956644674835, "eval_loss": 1.0936743021011353, "eval_runtime": 11.9085, "eval_samples_per_second": 89.096, "eval_steps_per_second": 5.626, "step": 11970 }, { "epoch": 45.11278195488722, "grad_norm": 0.00022154749603942037, "learning_rate": 0.00010977443609022557, "loss": 0.0, "step": 12000 }, { "epoch": 46.0, "eval_AUC": 0.7150274105127379, "eval_F1": 0.7544540322094451, "eval_Precision": 0.9007314524555904, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8878416588124411, "eval_loss": 1.1094835996627808, "eval_runtime": 11.7724, "eval_samples_per_second": 90.126, "eval_steps_per_second": 5.691, "step": 12236 }, { "epoch": 46.99248120300752, "grad_norm": 0.00019688473548740149, "learning_rate": 0.00010601503759398497, "loss": 0.0, "step": 12500 }, { "epoch": 47.0, "eval_AUC": 0.7150274105127379, "eval_F1": 0.7544540322094451, "eval_Precision": 0.9007314524555904, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8878416588124411, "eval_loss": 1.1262503862380981, "eval_runtime": 11.5453, "eval_samples_per_second": 91.899, "eval_steps_per_second": 5.803, "step": 12502 }, { "epoch": 48.0, "eval_AUC": 0.7150274105127379, "eval_F1": 0.7544540322094451, "eval_Precision": 0.9007314524555904, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8878416588124411, "eval_loss": 1.1426563262939453, "eval_runtime": 11.6837, "eval_samples_per_second": 90.81, "eval_steps_per_second": 5.734, "step": 12768 }, { "epoch": 48.87218045112782, "grad_norm": 0.0001134950143750757, "learning_rate": 0.00010225563909774436, "loss": 0.0, "step": 13000 }, { "epoch": 49.0, "eval_AUC": 0.7150274105127379, "eval_F1": 0.7544540322094451, "eval_Precision": 0.9007314524555904, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8878416588124411, "eval_loss": 1.1587177515029907, "eval_runtime": 11.7191, "eval_samples_per_second": 90.536, "eval_steps_per_second": 5.717, "step": 13034 }, { "epoch": 50.0, "eval_AUC": 0.7150274105127379, "eval_F1": 0.7544540322094451, "eval_Precision": 0.9007314524555904, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8878416588124411, "eval_loss": 1.174465537071228, "eval_runtime": 11.8222, "eval_samples_per_second": 89.747, "eval_steps_per_second": 5.667, "step": 13300 }, { "epoch": 50.75187969924812, "grad_norm": 9.584094368619844e-05, "learning_rate": 9.849624060150377e-05, "loss": 0.0, "step": 13500 }, { "epoch": 51.0, "eval_AUC": 0.7150274105127379, "eval_F1": 0.7544540322094451, "eval_Precision": 0.9007314524555904, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8878416588124411, "eval_loss": 1.1900520324707031, "eval_runtime": 11.7601, "eval_samples_per_second": 90.22, "eval_steps_per_second": 5.697, "step": 13566 }, { "epoch": 52.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.2051938772201538, "eval_runtime": 11.9347, "eval_samples_per_second": 88.901, "eval_steps_per_second": 5.614, "step": 13832 }, { "epoch": 52.63157894736842, "grad_norm": 7.240776903927326e-05, "learning_rate": 9.473684210526316e-05, "loss": 0.0, "step": 14000 }, { "epoch": 53.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.2201390266418457, "eval_runtime": 11.8013, "eval_samples_per_second": 89.905, "eval_steps_per_second": 5.677, "step": 14098 }, { "epoch": 54.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.2349706888198853, "eval_runtime": 11.8152, "eval_samples_per_second": 89.8, "eval_steps_per_second": 5.671, "step": 14364 }, { "epoch": 54.51127819548872, "grad_norm": 4.7142420953605324e-05, "learning_rate": 9.097744360902256e-05, "loss": 0.0, "step": 14500 }, { "epoch": 55.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.249691367149353, "eval_runtime": 11.9642, "eval_samples_per_second": 88.682, "eval_steps_per_second": 5.6, "step": 14630 }, { "epoch": 56.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.2640849351882935, "eval_runtime": 11.9363, "eval_samples_per_second": 88.889, "eval_steps_per_second": 5.613, "step": 14896 }, { "epoch": 56.390977443609025, "grad_norm": 4.406652442412451e-05, "learning_rate": 8.721804511278195e-05, "loss": 0.0, "step": 15000 }, { "epoch": 57.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.2785232067108154, "eval_runtime": 11.9798, "eval_samples_per_second": 88.566, "eval_steps_per_second": 5.593, "step": 15162 }, { "epoch": 58.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.2925220727920532, "eval_runtime": 11.9038, "eval_samples_per_second": 89.131, "eval_steps_per_second": 5.628, "step": 15428 }, { "epoch": 58.27067669172932, "grad_norm": 2.6122717827092856e-05, "learning_rate": 8.345864661654136e-05, "loss": 0.0, "step": 15500 }, { "epoch": 59.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.3067699670791626, "eval_runtime": 11.8267, "eval_samples_per_second": 89.713, "eval_steps_per_second": 5.665, "step": 15694 }, { "epoch": 60.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.3207120895385742, "eval_runtime": 11.6077, "eval_samples_per_second": 91.405, "eval_steps_per_second": 5.772, "step": 15960 }, { "epoch": 60.150375939849624, "grad_norm": 2.532277903810609e-05, "learning_rate": 7.969924812030075e-05, "loss": 0.0, "step": 16000 }, { "epoch": 61.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.3345941305160522, "eval_runtime": 11.8443, "eval_samples_per_second": 89.579, "eval_steps_per_second": 5.657, "step": 16226 }, { "epoch": 62.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.3484621047973633, "eval_runtime": 11.6458, "eval_samples_per_second": 91.106, "eval_steps_per_second": 5.753, "step": 16492 }, { "epoch": 62.03007518796993, "grad_norm": 1.7661703168414533e-05, "learning_rate": 7.593984962406016e-05, "loss": 0.0, "step": 16500 }, { "epoch": 63.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.3622149229049683, "eval_runtime": 11.7437, "eval_samples_per_second": 90.346, "eval_steps_per_second": 5.705, "step": 16758 }, { "epoch": 63.909774436090224, "grad_norm": 1.633859210414812e-05, "learning_rate": 7.218045112781955e-05, "loss": 0.0, "step": 17000 }, { "epoch": 64.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.3757728338241577, "eval_runtime": 11.6035, "eval_samples_per_second": 91.438, "eval_steps_per_second": 5.774, "step": 17024 }, { "epoch": 65.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.3893355131149292, "eval_runtime": 11.8424, "eval_samples_per_second": 89.593, "eval_steps_per_second": 5.658, "step": 17290 }, { "epoch": 65.78947368421052, "grad_norm": 1.2574956599564757e-05, "learning_rate": 6.842105263157895e-05, "loss": 0.0, "step": 17500 }, { "epoch": 66.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.40289306640625, "eval_runtime": 11.9699, "eval_samples_per_second": 88.639, "eval_steps_per_second": 5.597, "step": 17556 }, { "epoch": 67.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.4165505170822144, "eval_runtime": 11.6917, "eval_samples_per_second": 90.748, "eval_steps_per_second": 5.731, "step": 17822 }, { "epoch": 67.66917293233082, "grad_norm": 1.0964651664835401e-05, "learning_rate": 6.466165413533834e-05, "loss": 0.0, "step": 18000 }, { "epoch": 68.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.4297924041748047, "eval_runtime": 11.881, "eval_samples_per_second": 89.302, "eval_steps_per_second": 5.639, "step": 18088 }, { "epoch": 69.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.4431047439575195, "eval_runtime": 11.6298, "eval_samples_per_second": 91.231, "eval_steps_per_second": 5.761, "step": 18354 }, { "epoch": 69.54887218045113, "grad_norm": 8.276247172034346e-06, "learning_rate": 6.090225563909775e-05, "loss": 0.0, "step": 18500 }, { "epoch": 70.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.4565781354904175, "eval_runtime": 11.6654, "eval_samples_per_second": 90.952, "eval_steps_per_second": 5.743, "step": 18620 }, { "epoch": 71.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.4694792032241821, "eval_runtime": 12.0384, "eval_samples_per_second": 88.134, "eval_steps_per_second": 5.566, "step": 18886 }, { "epoch": 71.42857142857143, "grad_norm": 7.255929176608333e-06, "learning_rate": 5.714285714285714e-05, "loss": 0.0, "step": 19000 }, { "epoch": 72.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.482446551322937, "eval_runtime": 11.6854, "eval_samples_per_second": 90.797, "eval_steps_per_second": 5.734, "step": 19152 }, { "epoch": 73.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.4949710369110107, "eval_runtime": 11.7291, "eval_samples_per_second": 90.459, "eval_steps_per_second": 5.712, "step": 19418 }, { "epoch": 73.30827067669173, "grad_norm": 5.73582974539022e-06, "learning_rate": 5.338345864661655e-05, "loss": 0.0, "step": 19500 }, { "epoch": 74.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.50760817527771, "eval_runtime": 11.6937, "eval_samples_per_second": 90.732, "eval_steps_per_second": 5.73, "step": 19684 }, { "epoch": 75.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.5201044082641602, "eval_runtime": 11.779, "eval_samples_per_second": 90.075, "eval_steps_per_second": 5.688, "step": 19950 }, { "epoch": 75.18796992481202, "grad_norm": 3.381761189302779e-06, "learning_rate": 4.9624060150375936e-05, "loss": 0.0, "step": 20000 }, { "epoch": 76.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.5320940017700195, "eval_runtime": 11.7044, "eval_samples_per_second": 90.65, "eval_steps_per_second": 5.724, "step": 20216 }, { "epoch": 77.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.5440773963928223, "eval_runtime": 11.8766, "eval_samples_per_second": 89.335, "eval_steps_per_second": 5.641, "step": 20482 }, { "epoch": 77.06766917293233, "grad_norm": 4.261892627255293e-06, "learning_rate": 4.586466165413534e-05, "loss": 0.0, "step": 20500 }, { "epoch": 78.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.5564316511154175, "eval_runtime": 11.9626, "eval_samples_per_second": 88.693, "eval_steps_per_second": 5.601, "step": 20748 }, { "epoch": 78.94736842105263, "grad_norm": 2.5668264242995065e-06, "learning_rate": 4.210526315789474e-05, "loss": 0.0, "step": 21000 }, { "epoch": 79.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.5691113471984863, "eval_runtime": 11.9711, "eval_samples_per_second": 88.63, "eval_steps_per_second": 5.597, "step": 21014 }, { "epoch": 80.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.5799812078475952, "eval_runtime": 11.8905, "eval_samples_per_second": 89.231, "eval_steps_per_second": 5.635, "step": 21280 }, { "epoch": 80.82706766917293, "grad_norm": 1.7882749716591206e-06, "learning_rate": 3.834586466165413e-05, "loss": 0.0, "step": 21500 }, { "epoch": 81.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.5909699201583862, "eval_runtime": 11.8739, "eval_samples_per_second": 89.355, "eval_steps_per_second": 5.643, "step": 21546 }, { "epoch": 82.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.6020997762680054, "eval_runtime": 11.7593, "eval_samples_per_second": 90.226, "eval_steps_per_second": 5.698, "step": 21812 }, { "epoch": 82.70676691729324, "grad_norm": 3.307637371108285e-06, "learning_rate": 3.458646616541353e-05, "loss": 0.0, "step": 22000 }, { "epoch": 83.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.6133201122283936, "eval_runtime": 11.7049, "eval_samples_per_second": 90.645, "eval_steps_per_second": 5.724, "step": 22078 }, { "epoch": 84.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.6243833303451538, "eval_runtime": 11.7522, "eval_samples_per_second": 90.281, "eval_steps_per_second": 5.701, "step": 22344 }, { "epoch": 84.58646616541354, "grad_norm": 2.0808365661650896e-06, "learning_rate": 3.082706766917293e-05, "loss": 0.0, "step": 22500 }, { "epoch": 85.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.6356879472732544, "eval_runtime": 11.8494, "eval_samples_per_second": 89.54, "eval_steps_per_second": 5.654, "step": 22610 }, { "epoch": 86.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.646845817565918, "eval_runtime": 11.9457, "eval_samples_per_second": 88.819, "eval_steps_per_second": 5.609, "step": 22876 }, { "epoch": 86.46616541353383, "grad_norm": 1.6075608755272697e-06, "learning_rate": 2.706766917293233e-05, "loss": 0.0, "step": 23000 }, { "epoch": 87.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.6580337285995483, "eval_runtime": 11.988, "eval_samples_per_second": 88.505, "eval_steps_per_second": 5.589, "step": 23142 }, { "epoch": 88.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.6693716049194336, "eval_runtime": 11.563, "eval_samples_per_second": 91.758, "eval_steps_per_second": 5.794, "step": 23408 }, { "epoch": 88.34586466165413, "grad_norm": 1.4785607618250651e-06, "learning_rate": 2.3308270676691728e-05, "loss": 0.0, "step": 23500 }, { "epoch": 89.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.6805604696273804, "eval_runtime": 11.7292, "eval_samples_per_second": 90.458, "eval_steps_per_second": 5.712, "step": 23674 }, { "epoch": 90.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.6876078844070435, "eval_runtime": 11.6884, "eval_samples_per_second": 90.774, "eval_steps_per_second": 5.732, "step": 23940 }, { "epoch": 90.22556390977444, "grad_norm": 7.791019811520528e-07, "learning_rate": 1.954887218045113e-05, "loss": 0.0, "step": 24000 }, { "epoch": 91.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.6937507390975952, "eval_runtime": 11.7263, "eval_samples_per_second": 90.481, "eval_steps_per_second": 5.714, "step": 24206 }, { "epoch": 92.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.6996102333068848, "eval_runtime": 11.8252, "eval_samples_per_second": 89.723, "eval_steps_per_second": 5.666, "step": 24472 }, { "epoch": 92.10526315789474, "grad_norm": 8.590963034293964e-07, "learning_rate": 1.5789473684210526e-05, "loss": 0.0, "step": 24500 }, { "epoch": 93.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.705134630203247, "eval_runtime": 12.0159, "eval_samples_per_second": 88.3, "eval_steps_per_second": 5.576, "step": 24738 }, { "epoch": 93.98496240601504, "grad_norm": 1.100646727536514e-06, "learning_rate": 1.2030075187969925e-05, "loss": 0.0, "step": 25000 }, { "epoch": 94.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.7103519439697266, "eval_runtime": 11.7931, "eval_samples_per_second": 89.968, "eval_steps_per_second": 5.681, "step": 25004 }, { "epoch": 95.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.715171456336975, "eval_runtime": 11.6391, "eval_samples_per_second": 91.159, "eval_steps_per_second": 5.756, "step": 25270 }, { "epoch": 95.86466165413533, "grad_norm": 5.422148774414381e-07, "learning_rate": 8.270676691729324e-06, "loss": 0.0, "step": 25500 }, { "epoch": 96.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.7194596529006958, "eval_runtime": 11.8706, "eval_samples_per_second": 89.38, "eval_steps_per_second": 5.644, "step": 25536 }, { "epoch": 97.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.723157286643982, "eval_runtime": 12.0004, "eval_samples_per_second": 88.414, "eval_steps_per_second": 5.583, "step": 25802 }, { "epoch": 97.74436090225564, "grad_norm": 8.843226737553778e-07, "learning_rate": 4.511278195488722e-06, "loss": 0.0, "step": 26000 }, { "epoch": 98.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.7260410785675049, "eval_runtime": 11.8627, "eval_samples_per_second": 89.44, "eval_steps_per_second": 5.648, "step": 26068 }, { "epoch": 99.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.7279813289642334, "eval_runtime": 12.0306, "eval_samples_per_second": 88.192, "eval_steps_per_second": 5.569, "step": 26334 }, { "epoch": 99.62406015037594, "grad_norm": 6.334667546070705e-07, "learning_rate": 7.518796992481203e-07, "loss": 0.0, "step": 26500 }, { "epoch": 100.0, "eval_AUC": 0.7178845533698807, "eval_F1": 0.7572553125484722, "eval_Precision": 0.9016736401673641, "eval_Recall": 0.9729119638826185, "eval_accuracy": 0.8887841658812441, "eval_loss": 1.7286875247955322, "eval_runtime": 11.7137, "eval_samples_per_second": 90.578, "eval_steps_per_second": 5.72, "step": 26600 }, { "epoch": 100.0, "step": 26600, "total_flos": 3.2879851193471386e+19, "train_loss": 0.05622970362024654, "train_runtime": 7456.0224, "train_samples_per_second": 56.907, "train_steps_per_second": 3.568 } ], "logging_steps": 500, "max_steps": 26600, "num_input_tokens_seen": 0, "num_train_epochs": 100, "save_steps": 500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 3.2879851193471386e+19, "train_batch_size": 16, "trial_name": null, "trial_params": null }