{ "best_metric": 0.9181643400484828, "best_model_checkpoint": "hmBERT-CoNLL-cp3/checkpoint-1000", "epoch": 3.0, "global_step": 1317, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.06, "eval_accuracy": 0.9007242708617266, "eval_f1": 0.3684910996506405, "eval_loss": 0.4115295708179474, "eval_precision": 0.36430921052631576, "eval_recall": 0.37277011107371255, "eval_runtime": 21.3063, "eval_samples_per_second": 152.537, "eval_steps_per_second": 4.787, "step": 25 }, { "epoch": 0.11, "eval_accuracy": 0.9460301390132783, "eval_f1": 0.6640782981476988, "eval_loss": 0.22425369918346405, "eval_precision": 0.6393085189222862, "eval_recall": 0.6908448333894311, "eval_runtime": 21.4481, "eval_samples_per_second": 151.529, "eval_steps_per_second": 4.756, "step": 50 }, { "epoch": 0.17, "eval_accuracy": 0.958023441454772, "eval_f1": 0.7474880579805633, "eval_loss": 0.16170601546764374, "eval_precision": 0.7319354838709677, "eval_recall": 0.7637159205654662, "eval_runtime": 21.6197, "eval_samples_per_second": 150.326, "eval_steps_per_second": 4.718, "step": 75 }, { "epoch": 0.23, "eval_accuracy": 0.9585101826252872, "eval_f1": 0.7455232462625266, "eval_loss": 0.15437664091587067, "eval_precision": 0.7281771501925546, "eval_recall": 0.7637159205654662, "eval_runtime": 21.768, "eval_samples_per_second": 149.302, "eval_steps_per_second": 4.686, "step": 100 }, { "epoch": 0.28, "eval_accuracy": 0.964409485611931, "eval_f1": 0.784738041002278, "eval_loss": 0.13407838344573975, "eval_precision": 0.7595275590551182, "eval_recall": 0.81167956916863, "eval_runtime": 21.8222, "eval_samples_per_second": 148.931, "eval_steps_per_second": 4.674, "step": 125 }, { "epoch": 0.34, "eval_accuracy": 0.9692963669639033, "eval_f1": 0.811351977494622, "eval_loss": 0.12208627909421921, "eval_precision": 0.7980143229166666, "eval_recall": 0.8251430494782901, "eval_runtime": 21.2673, "eval_samples_per_second": 152.817, "eval_steps_per_second": 4.796, "step": 150 }, { "epoch": 0.4, "eval_accuracy": 0.9718663603442234, "eval_f1": 0.8151923709306149, "eval_loss": 0.10127394646406174, "eval_precision": 0.796849887495982, "eval_recall": 0.8343991921911814, "eval_runtime": 21.1083, "eval_samples_per_second": 153.968, "eval_steps_per_second": 4.832, "step": 175 }, { "epoch": 0.46, "eval_accuracy": 0.9731513570343834, "eval_f1": 0.8333472419260619, "eval_loss": 0.10758877545595169, "eval_precision": 0.8265187882800861, "eval_recall": 0.8402894648266577, "eval_runtime": 20.8538, "eval_samples_per_second": 155.847, "eval_steps_per_second": 4.891, "step": 200 }, { "epoch": 0.51, "eval_accuracy": 0.9762859701725011, "eval_f1": 0.8543123543123543, "eval_loss": 0.08832722157239914, "eval_precision": 0.8453047775947282, "eval_recall": 0.8635139683608213, "eval_runtime": 21.5789, "eval_samples_per_second": 150.61, "eval_steps_per_second": 4.727, "step": 225 }, { "epoch": 0.57, "eval_accuracy": 0.9762665005256804, "eval_f1": 0.8535063638632394, "eval_loss": 0.0972680076956749, "eval_precision": 0.8438887974995888, "eval_recall": 0.8633456748569506, "eval_runtime": 21.3825, "eval_samples_per_second": 151.993, "eval_steps_per_second": 4.77, "step": 250 }, { "epoch": 0.63, "eval_accuracy": 0.9765390755811689, "eval_f1": 0.8575239683201333, "eval_loss": 0.0882844626903534, "eval_precision": 0.8496613249628283, "eval_recall": 0.8655334904072702, "eval_runtime": 21.4561, "eval_samples_per_second": 151.472, "eval_steps_per_second": 4.754, "step": 275 }, { "epoch": 0.68, "eval_accuracy": 0.9766364238152719, "eval_f1": 0.8551207327227309, "eval_loss": 0.08785738795995712, "eval_precision": 0.8462425840474621, "eval_recall": 0.8641871423763042, "eval_runtime": 21.5171, "eval_samples_per_second": 151.043, "eval_steps_per_second": 4.74, "step": 300 }, { "epoch": 0.74, "eval_accuracy": 0.9786612670846151, "eval_f1": 0.8711310264708322, "eval_loss": 0.07805178314447403, "eval_precision": 0.8592240955966607, "eval_recall": 0.8833726018175698, "eval_runtime": 21.5676, "eval_samples_per_second": 150.689, "eval_steps_per_second": 4.729, "step": 325 }, { "epoch": 0.8, "eval_accuracy": 0.9803161870643666, "eval_f1": 0.8810828765985717, "eval_loss": 0.07252655178308487, "eval_precision": 0.8696721311475409, "eval_recall": 0.8927970380343319, "eval_runtime": 21.8654, "eval_samples_per_second": 148.637, "eval_steps_per_second": 4.665, "step": 350 }, { "epoch": 0.85, "eval_accuracy": 0.9807250496475994, "eval_f1": 0.881333443900821, "eval_loss": 0.07547631114721298, "eval_precision": 0.8687264999182606, "eval_recall": 0.8943116795691687, "eval_runtime": 21.5439, "eval_samples_per_second": 150.855, "eval_steps_per_second": 4.735, "step": 375 }, { "epoch": 0.91, "eval_accuracy": 0.9822242124527861, "eval_f1": 0.8890735355213959, "eval_loss": 0.06660941988229752, "eval_precision": 0.8780567864762843, "eval_recall": 0.9003702457085156, "eval_runtime": 21.2792, "eval_samples_per_second": 152.731, "eval_steps_per_second": 4.793, "step": 400 }, { "epoch": 0.97, "eval_accuracy": 0.982282621393248, "eval_f1": 0.8935885647412856, "eval_loss": 0.06582659482955933, "eval_precision": 0.8877262913137353, "eval_recall": 0.8995287781891619, "eval_runtime": 21.0258, "eval_samples_per_second": 154.572, "eval_steps_per_second": 4.851, "step": 425 }, { "epoch": 1.03, "eval_accuracy": 0.983664966317511, "eval_f1": 0.8993299832495812, "eval_loss": 0.0645442008972168, "eval_precision": 0.89513171057019, "eval_recall": 0.9035678222820599, "eval_runtime": 21.8717, "eval_samples_per_second": 148.594, "eval_steps_per_second": 4.664, "step": 450 }, { "epoch": 1.08, "eval_accuracy": 0.9831003465597135, "eval_f1": 0.8950920756603616, "eval_loss": 0.06972972303628922, "eval_precision": 0.8864499092259449, "eval_recall": 0.9039044092898014, "eval_runtime": 22.0283, "eval_samples_per_second": 147.537, "eval_steps_per_second": 4.63, "step": 475 }, { "epoch": 1.14, "learning_rate": 3.1017463933181475e-05, "loss": 0.1392, "step": 500 }, { "epoch": 1.14, "eval_accuracy": 0.9824189089209922, "eval_f1": 0.8908151358559759, "eval_loss": 0.06883182376623154, "eval_precision": 0.8824306472919419, "eval_recall": 0.8993604846852912, "eval_runtime": 21.1436, "eval_samples_per_second": 153.711, "eval_steps_per_second": 4.824, "step": 500 }, { "epoch": 1.2, "eval_accuracy": 0.9827498929169425, "eval_f1": 0.8999163179916319, "eval_loss": 0.06805375963449478, "eval_precision": 0.8949733688415447, "eval_recall": 0.9049141703130259, "eval_runtime": 21.618, "eval_samples_per_second": 150.337, "eval_steps_per_second": 4.718, "step": 525 }, { "epoch": 1.25, "eval_accuracy": 0.9823215606868891, "eval_f1": 0.8915259903058667, "eval_loss": 0.06759364902973175, "eval_precision": 0.8854581673306773, "eval_recall": 0.8976775496465836, "eval_runtime": 21.6174, "eval_samples_per_second": 150.342, "eval_steps_per_second": 4.718, "step": 550 }, { "epoch": 1.31, "eval_accuracy": 0.9841906467816673, "eval_f1": 0.9013520280420632, "eval_loss": 0.06176742911338806, "eval_precision": 0.8940397350993378, "eval_recall": 0.9087849209020532, "eval_runtime": 21.5727, "eval_samples_per_second": 150.653, "eval_steps_per_second": 4.728, "step": 575 }, { "epoch": 1.37, "eval_accuracy": 0.984015419960282, "eval_f1": 0.9010107760421018, "eval_loss": 0.0644294023513794, "eval_precision": 0.8945098689666612, "eval_recall": 0.9076068663749579, "eval_runtime": 22.0692, "eval_samples_per_second": 147.264, "eval_steps_per_second": 4.622, "step": 600 }, { "epoch": 1.42, "eval_accuracy": 0.9837233752579728, "eval_f1": 0.9010347129506008, "eval_loss": 0.0641368106007576, "eval_precision": 0.8935782853359815, "eval_recall": 0.9086166273981824, "eval_runtime": 21.6306, "eval_samples_per_second": 150.25, "eval_steps_per_second": 4.716, "step": 625 }, { "epoch": 1.48, "eval_accuracy": 0.9845800397180795, "eval_f1": 0.9043724966622163, "eval_loss": 0.06189671903848648, "eval_precision": 0.8968884475339292, "eval_recall": 0.9119824974755975, "eval_runtime": 20.932, "eval_samples_per_second": 155.265, "eval_steps_per_second": 4.873, "step": 650 }, { "epoch": 1.54, "eval_accuracy": 0.9848136754799268, "eval_f1": 0.9074897257401661, "eval_loss": 0.06076198071241379, "eval_precision": 0.9045310148804547, "eval_recall": 0.9104678559407607, "eval_runtime": 21.5144, "eval_samples_per_second": 151.062, "eval_steps_per_second": 4.741, "step": 675 }, { "epoch": 1.59, "eval_accuracy": 0.9851057201822359, "eval_f1": 0.9090604869070525, "eval_loss": 0.06238234415650368, "eval_precision": 0.903842954583264, "eval_recall": 0.9143386065297879, "eval_runtime": 21.3845, "eval_samples_per_second": 151.979, "eval_steps_per_second": 4.77, "step": 700 }, { "epoch": 1.65, "eval_accuracy": 0.9852420077099802, "eval_f1": 0.9115851108322878, "eval_loss": 0.05955210700631142, "eval_precision": 0.9062032263429237, "eval_recall": 0.9170313025917199, "eval_runtime": 21.1164, "eval_samples_per_second": 153.909, "eval_steps_per_second": 4.83, "step": 725 }, { "epoch": 1.71, "eval_accuracy": 0.9848331451267474, "eval_f1": 0.9068602904356534, "eval_loss": 0.0579909048974514, "eval_precision": 0.8995033112582781, "eval_recall": 0.9143386065297879, "eval_runtime": 21.1108, "eval_samples_per_second": 153.95, "eval_steps_per_second": 4.832, "step": 750 }, { "epoch": 1.77, "eval_accuracy": 0.9857676881741365, "eval_f1": 0.9126685087498954, "eval_loss": 0.05822019651532173, "eval_precision": 0.9081819696717214, "eval_recall": 0.9171995960955908, "eval_runtime": 22.2525, "eval_samples_per_second": 146.051, "eval_steps_per_second": 4.584, "step": 775 }, { "epoch": 1.82, "eval_accuracy": 0.9852420077099802, "eval_f1": 0.9100617386951443, "eval_loss": 0.0588374100625515, "eval_precision": 0.9023825281270682, "eval_recall": 0.9178727701110737, "eval_runtime": 21.7438, "eval_samples_per_second": 149.468, "eval_steps_per_second": 4.691, "step": 800 }, { "epoch": 1.88, "eval_accuracy": 0.9855535220591098, "eval_f1": 0.911860174781523, "eval_loss": 0.0592406764626503, "eval_precision": 0.9020253581425984, "eval_recall": 0.9219118142039717, "eval_runtime": 21.1485, "eval_samples_per_second": 153.675, "eval_steps_per_second": 4.823, "step": 825 }, { "epoch": 1.94, "eval_accuracy": 0.9852225380631595, "eval_f1": 0.911764705882353, "eval_loss": 0.06002892181277275, "eval_precision": 0.9054098904746101, "eval_recall": 0.9182093571188152, "eval_runtime": 22.0668, "eval_samples_per_second": 147.28, "eval_steps_per_second": 4.622, "step": 850 }, { "epoch": 1.99, "eval_accuracy": 0.9860792025232662, "eval_f1": 0.913464751085867, "eval_loss": 0.05682874843478203, "eval_precision": 0.9067993366500829, "eval_recall": 0.9202288791652642, "eval_runtime": 20.9827, "eval_samples_per_second": 154.89, "eval_steps_per_second": 4.861, "step": 875 }, { "epoch": 2.05, "eval_accuracy": 0.9860792025232662, "eval_f1": 0.9171483622350675, "eval_loss": 0.0570731945335865, "eval_precision": 0.9130942452043369, "eval_recall": 0.9212386401884888, "eval_runtime": 21.3364, "eval_samples_per_second": 152.322, "eval_steps_per_second": 4.781, "step": 900 }, { "epoch": 2.11, "eval_accuracy": 0.9857676881741365, "eval_f1": 0.9156969443281708, "eval_loss": 0.0577477402985096, "eval_precision": 0.9110444777611194, "eval_recall": 0.920397172669135, "eval_runtime": 21.9855, "eval_samples_per_second": 147.825, "eval_steps_per_second": 4.639, "step": 925 }, { "epoch": 2.16, "eval_accuracy": 0.986040263229625, "eval_f1": 0.9184714441006773, "eval_loss": 0.06048833578824997, "eval_precision": 0.912747216220708, "eval_recall": 0.9242679232581622, "eval_runtime": 21.8831, "eval_samples_per_second": 148.516, "eval_steps_per_second": 4.661, "step": 950 }, { "epoch": 2.22, "eval_accuracy": 0.986682761574705, "eval_f1": 0.9166318254034618, "eval_loss": 0.05745207890868187, "eval_precision": 0.9109190626558086, "eval_recall": 0.922416694715584, "eval_runtime": 21.8724, "eval_samples_per_second": 148.589, "eval_steps_per_second": 4.663, "step": 975 }, { "epoch": 2.28, "learning_rate": 1.2034927866362947e-05, "loss": 0.0392, "step": 1000 }, { "epoch": 2.28, "eval_accuracy": 0.9862154900510105, "eval_f1": 0.9181643400484828, "eval_loss": 0.0572221502661705, "eval_precision": 0.9121408403919614, "eval_recall": 0.9242679232581622, "eval_runtime": 21.5878, "eval_samples_per_second": 150.548, "eval_steps_per_second": 4.725, "step": 1000 }, { "epoch": 2.33, "eval_accuracy": 0.9869748062770142, "eval_f1": 0.9211694730669348, "eval_loss": 0.056650131940841675, "eval_precision": 0.9170975813177648, "eval_recall": 0.9252776842813868, "eval_runtime": 21.5295, "eval_samples_per_second": 150.956, "eval_steps_per_second": 4.738, "step": 1025 }, { "epoch": 2.39, "eval_accuracy": 0.9870916241579378, "eval_f1": 0.9243514644351465, "eval_loss": 0.0570232979953289, "eval_precision": 0.9192743009320905, "eval_recall": 0.9294850218781555, "eval_runtime": 21.5481, "eval_samples_per_second": 150.825, "eval_steps_per_second": 4.734, "step": 1050 }, { "epoch": 2.45, "eval_accuracy": 0.986682761574705, "eval_f1": 0.9215079829474212, "eval_loss": 0.05837239325046539, "eval_precision": 0.9154625477495433, "eval_recall": 0.9276337933355773, "eval_runtime": 21.2288, "eval_samples_per_second": 153.094, "eval_steps_per_second": 4.805, "step": 1075 }, { "epoch": 2.51, "eval_accuracy": 0.9867022312215257, "eval_f1": 0.9226653289858708, "eval_loss": 0.059072330594062805, "eval_precision": 0.9167635819903639, "eval_recall": 0.9286435543588017, "eval_runtime": 22.3224, "eval_samples_per_second": 145.594, "eval_steps_per_second": 4.569, "step": 1100 }, { "epoch": 2.56, "eval_accuracy": 0.9874031385070675, "eval_f1": 0.9246323529411764, "eval_loss": 0.057747144252061844, "eval_precision": 0.9181878526385662, "eval_recall": 0.931167956916863, "eval_runtime": 21.9739, "eval_samples_per_second": 147.903, "eval_steps_per_second": 4.642, "step": 1125 }, { "epoch": 2.62, "eval_accuracy": 0.987033215217476, "eval_f1": 0.9233344492802142, "eval_loss": 0.057037804275751114, "eval_precision": 0.9184149184149184, "eval_recall": 0.9283069673510602, "eval_runtime": 21.3838, "eval_samples_per_second": 151.984, "eval_steps_per_second": 4.77, "step": 1150 }, { "epoch": 2.68, "eval_accuracy": 0.987227911685682, "eval_f1": 0.9244541119384256, "eval_loss": 0.05629764869809151, "eval_precision": 0.9191482282482116, "eval_recall": 0.929821608885897, "eval_runtime": 21.8946, "eval_samples_per_second": 148.438, "eval_steps_per_second": 4.659, "step": 1175 }, { "epoch": 2.73, "eval_accuracy": 0.9871500330983995, "eval_f1": 0.9246449456975774, "eval_loss": 0.05648628994822502, "eval_precision": 0.918049104180491, "eval_recall": 0.9313362504207338, "eval_runtime": 21.2748, "eval_samples_per_second": 152.763, "eval_steps_per_second": 4.794, "step": 1200 }, { "epoch": 2.79, "eval_accuracy": 0.9873447295666057, "eval_f1": 0.9243767776476494, "eval_loss": 0.055928729474544525, "eval_precision": 0.9189953426480373, "eval_recall": 0.929821608885897, "eval_runtime": 21.5883, "eval_samples_per_second": 150.545, "eval_steps_per_second": 4.725, "step": 1225 }, { "epoch": 2.85, "eval_accuracy": 0.9873057902729645, "eval_f1": 0.9238748536054878, "eval_loss": 0.05620228126645088, "eval_precision": 0.9184963406520292, "eval_recall": 0.9293167283742848, "eval_runtime": 21.3558, "eval_samples_per_second": 152.184, "eval_steps_per_second": 4.776, "step": 1250 }, { "epoch": 2.9, "eval_accuracy": 0.9871500330983995, "eval_f1": 0.922961104140527, "eval_loss": 0.05639491230249405, "eval_precision": 0.9175120572093797, "eval_recall": 0.928475260854931, "eval_runtime": 21.3856, "eval_samples_per_second": 151.972, "eval_steps_per_second": 4.77, "step": 1275 }, { "epoch": 2.96, "eval_accuracy": 0.9873057902729645, "eval_f1": 0.9237330657300552, "eval_loss": 0.05629625543951988, "eval_precision": 0.9180518617021277, "eval_recall": 0.9294850218781555, "eval_runtime": 21.6582, "eval_samples_per_second": 150.059, "eval_steps_per_second": 4.71, "step": 1300 }, { "epoch": 3.0, "step": 1317, "total_flos": 1368370122693444.0, "train_loss": 0.07309725869308391, "train_runtime": 1743.2547, "train_samples_per_second": 24.163, "train_steps_per_second": 0.755 } ], "max_steps": 1317, "num_train_epochs": 3, "total_flos": 1368370122693444.0, "trial_name": null, "trial_params": null }