|
{ |
|
"best_metric": 0.6788413098236775, |
|
"best_model_checkpoint": "trained_models/wnut_17/checkpoint-9000", |
|
"epoch": 21.176470588235293, |
|
"global_step": 9000, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.24, |
|
"eval_accuracy_score": 0.9205491641772071, |
|
"eval_f1": 0.0, |
|
"eval_loss": 0.5049907565116882, |
|
"eval_precision": 0.0, |
|
"eval_recall": 0.0, |
|
"eval_runtime": 6.761, |
|
"eval_samples_per_second": 149.239, |
|
"eval_steps_per_second": 18.784, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 0.47, |
|
"eval_accuracy_score": 0.9205491641772071, |
|
"eval_f1": 0.0, |
|
"eval_loss": 0.48477333784103394, |
|
"eval_precision": 0.0, |
|
"eval_recall": 0.0, |
|
"eval_runtime": 6.7798, |
|
"eval_samples_per_second": 148.825, |
|
"eval_steps_per_second": 18.732, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 0.71, |
|
"eval_accuracy_score": 0.9205491641772071, |
|
"eval_f1": 0.0, |
|
"eval_loss": 0.3834511935710907, |
|
"eval_precision": 0.0, |
|
"eval_recall": 0.0, |
|
"eval_runtime": 6.7494, |
|
"eval_samples_per_second": 149.494, |
|
"eval_steps_per_second": 18.816, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 0.94, |
|
"eval_accuracy_score": 0.9218203775503718, |
|
"eval_f1": 0.016241299303944315, |
|
"eval_loss": 0.3428375720977783, |
|
"eval_precision": 0.2692307692307692, |
|
"eval_recall": 0.008373205741626795, |
|
"eval_runtime": 6.7397, |
|
"eval_samples_per_second": 149.711, |
|
"eval_steps_per_second": 18.844, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 1.18, |
|
"learning_rate": 4.803921568627452e-06, |
|
"loss": 0.4388, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 1.18, |
|
"eval_accuracy_score": 0.9387275154134621, |
|
"eval_f1": 0.3550877192982456, |
|
"eval_loss": 0.31836700439453125, |
|
"eval_precision": 0.4295415959252971, |
|
"eval_recall": 0.3026315789473684, |
|
"eval_runtime": 6.749, |
|
"eval_samples_per_second": 149.504, |
|
"eval_steps_per_second": 18.818, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 1.41, |
|
"eval_accuracy_score": 0.9413335028284497, |
|
"eval_f1": 0.40223463687150846, |
|
"eval_loss": 0.3077085316181183, |
|
"eval_precision": 0.48322147651006714, |
|
"eval_recall": 0.3444976076555024, |
|
"eval_runtime": 7.2416, |
|
"eval_samples_per_second": 139.333, |
|
"eval_steps_per_second": 17.537, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 1.65, |
|
"eval_accuracy_score": 0.9449564609419691, |
|
"eval_f1": 0.46935933147632314, |
|
"eval_loss": 0.29629671573638916, |
|
"eval_precision": 0.5616666666666666, |
|
"eval_recall": 0.40311004784689, |
|
"eval_runtime": 6.7314, |
|
"eval_samples_per_second": 149.895, |
|
"eval_steps_per_second": 18.867, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 1.88, |
|
"eval_accuracy_score": 0.9471810843450074, |
|
"eval_f1": 0.5139186295503213, |
|
"eval_loss": 0.2875679135322571, |
|
"eval_precision": 0.6371681415929203, |
|
"eval_recall": 0.430622009569378, |
|
"eval_runtime": 6.7537, |
|
"eval_samples_per_second": 149.401, |
|
"eval_steps_per_second": 18.805, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 2.12, |
|
"eval_accuracy_score": 0.949278586410729, |
|
"eval_f1": 0.5329849771391247, |
|
"eval_loss": 0.27145618200302124, |
|
"eval_precision": 0.5870503597122302, |
|
"eval_recall": 0.4880382775119617, |
|
"eval_runtime": 6.7363, |
|
"eval_samples_per_second": 149.786, |
|
"eval_steps_per_second": 18.853, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 2.35, |
|
"learning_rate": 4.607843137254902e-06, |
|
"loss": 0.1974, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 2.35, |
|
"eval_accuracy_score": 0.9492150257420708, |
|
"eval_f1": 0.5209424083769634, |
|
"eval_loss": 0.2602783441543579, |
|
"eval_precision": 0.5751445086705202, |
|
"eval_recall": 0.47607655502392343, |
|
"eval_runtime": 6.736, |
|
"eval_samples_per_second": 149.792, |
|
"eval_steps_per_second": 18.854, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 2.59, |
|
"eval_accuracy_score": 0.9504862391152354, |
|
"eval_f1": 0.5558510638297872, |
|
"eval_loss": 0.24513839185237885, |
|
"eval_precision": 0.625748502994012, |
|
"eval_recall": 0.5, |
|
"eval_runtime": 7.332, |
|
"eval_samples_per_second": 137.616, |
|
"eval_steps_per_second": 17.321, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 2.82, |
|
"eval_accuracy_score": 0.9520116951630331, |
|
"eval_f1": 0.5626566416040101, |
|
"eval_loss": 0.23386946320533752, |
|
"eval_precision": 0.5907894736842105, |
|
"eval_recall": 0.5370813397129187, |
|
"eval_runtime": 6.737, |
|
"eval_samples_per_second": 149.771, |
|
"eval_steps_per_second": 18.851, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 3.06, |
|
"eval_accuracy_score": 0.9529651051929067, |
|
"eval_f1": 0.5635782747603835, |
|
"eval_loss": 0.23247480392456055, |
|
"eval_precision": 0.6049382716049383, |
|
"eval_recall": 0.527511961722488, |
|
"eval_runtime": 6.7326, |
|
"eval_samples_per_second": 149.868, |
|
"eval_steps_per_second": 18.864, |
|
"step": 1300 |
|
}, |
|
{ |
|
"epoch": 3.29, |
|
"eval_accuracy_score": 0.9557617746138689, |
|
"eval_f1": 0.5892526250772081, |
|
"eval_loss": 0.2185893952846527, |
|
"eval_precision": 0.6091954022988506, |
|
"eval_recall": 0.5705741626794258, |
|
"eval_runtime": 6.7427, |
|
"eval_samples_per_second": 149.643, |
|
"eval_steps_per_second": 18.835, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 3.53, |
|
"learning_rate": 4.411764705882353e-06, |
|
"loss": 0.1395, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 3.53, |
|
"eval_accuracy_score": 0.9572236699930083, |
|
"eval_f1": 0.6000000000000001, |
|
"eval_loss": 0.2226746827363968, |
|
"eval_precision": 0.6464088397790055, |
|
"eval_recall": 0.5598086124401914, |
|
"eval_runtime": 6.7181, |
|
"eval_samples_per_second": 150.191, |
|
"eval_steps_per_second": 18.904, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 3.76, |
|
"eval_accuracy_score": 0.9590033687154389, |
|
"eval_f1": 0.598405885959534, |
|
"eval_loss": 0.21203213930130005, |
|
"eval_precision": 0.6138364779874214, |
|
"eval_recall": 0.583732057416268, |
|
"eval_runtime": 6.7595, |
|
"eval_samples_per_second": 149.27, |
|
"eval_steps_per_second": 18.788, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy_score": 0.9586855653721477, |
|
"eval_f1": 0.618421052631579, |
|
"eval_loss": 0.22468985617160797, |
|
"eval_precision": 0.6871345029239766, |
|
"eval_recall": 0.562200956937799, |
|
"eval_runtime": 6.7215, |
|
"eval_samples_per_second": 150.115, |
|
"eval_steps_per_second": 18.895, |
|
"step": 1700 |
|
}, |
|
{ |
|
"epoch": 4.24, |
|
"eval_accuracy_score": 0.9599567787453124, |
|
"eval_f1": 0.6330749354005167, |
|
"eval_loss": 0.2214759886264801, |
|
"eval_precision": 0.6882022471910112, |
|
"eval_recall": 0.5861244019138756, |
|
"eval_runtime": 6.7281, |
|
"eval_samples_per_second": 149.969, |
|
"eval_steps_per_second": 18.876, |
|
"step": 1800 |
|
}, |
|
{ |
|
"epoch": 4.47, |
|
"eval_accuracy_score": 0.96148223479311, |
|
"eval_f1": 0.6507115135834413, |
|
"eval_loss": 0.21751971542835236, |
|
"eval_precision": 0.7084507042253522, |
|
"eval_recall": 0.6016746411483254, |
|
"eval_runtime": 6.7505, |
|
"eval_samples_per_second": 149.471, |
|
"eval_steps_per_second": 18.813, |
|
"step": 1900 |
|
}, |
|
{ |
|
"epoch": 4.71, |
|
"learning_rate": 4.215686274509805e-06, |
|
"loss": 0.1057, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 4.71, |
|
"eval_accuracy_score": 0.9605923854318947, |
|
"eval_f1": 0.6401062416998671, |
|
"eval_loss": 0.22828274965286255, |
|
"eval_precision": 0.7194029850746269, |
|
"eval_recall": 0.5765550239234449, |
|
"eval_runtime": 6.7552, |
|
"eval_samples_per_second": 149.366, |
|
"eval_steps_per_second": 18.8, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 4.94, |
|
"eval_accuracy_score": 0.9621814021483506, |
|
"eval_f1": 0.6484424666242848, |
|
"eval_loss": 0.2120533287525177, |
|
"eval_precision": 0.6919945725915875, |
|
"eval_recall": 0.6100478468899522, |
|
"eval_runtime": 6.7607, |
|
"eval_samples_per_second": 149.245, |
|
"eval_steps_per_second": 18.785, |
|
"step": 2100 |
|
}, |
|
{ |
|
"epoch": 5.18, |
|
"eval_accuracy_score": 0.9617364774677429, |
|
"eval_f1": 0.6427196921103272, |
|
"eval_loss": 0.21272720396518707, |
|
"eval_precision": 0.6929460580912863, |
|
"eval_recall": 0.5992822966507177, |
|
"eval_runtime": 6.823, |
|
"eval_samples_per_second": 147.882, |
|
"eval_steps_per_second": 18.613, |
|
"step": 2200 |
|
}, |
|
{ |
|
"epoch": 5.41, |
|
"eval_accuracy_score": 0.9614186741244518, |
|
"eval_f1": 0.6440460947503202, |
|
"eval_loss": 0.21506403386592865, |
|
"eval_precision": 0.6928374655647382, |
|
"eval_recall": 0.6016746411483254, |
|
"eval_runtime": 6.7509, |
|
"eval_samples_per_second": 149.462, |
|
"eval_steps_per_second": 18.812, |
|
"step": 2300 |
|
}, |
|
{ |
|
"epoch": 5.65, |
|
"eval_accuracy_score": 0.9625627661603, |
|
"eval_f1": 0.6498740554156172, |
|
"eval_loss": 0.20958468317985535, |
|
"eval_precision": 0.6861702127659575, |
|
"eval_recall": 0.6172248803827751, |
|
"eval_runtime": 6.7421, |
|
"eval_samples_per_second": 149.656, |
|
"eval_steps_per_second": 18.837, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 5.88, |
|
"learning_rate": 4.019607843137255e-06, |
|
"loss": 0.0811, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 5.88, |
|
"eval_accuracy_score": 0.9624356448229835, |
|
"eval_f1": 0.6591337099811676, |
|
"eval_loss": 0.2008962631225586, |
|
"eval_precision": 0.6935270805812418, |
|
"eval_recall": 0.6279904306220095, |
|
"eval_runtime": 6.7089, |
|
"eval_samples_per_second": 150.397, |
|
"eval_steps_per_second": 18.93, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 6.12, |
|
"eval_accuracy_score": 0.9621178414796924, |
|
"eval_f1": 0.6448717948717948, |
|
"eval_loss": 0.21091684699058533, |
|
"eval_precision": 0.6947513812154696, |
|
"eval_recall": 0.6016746411483254, |
|
"eval_runtime": 6.7609, |
|
"eval_samples_per_second": 149.241, |
|
"eval_steps_per_second": 18.785, |
|
"step": 2600 |
|
}, |
|
{ |
|
"epoch": 6.35, |
|
"eval_accuracy_score": 0.9621178414796924, |
|
"eval_f1": 0.6499057196731616, |
|
"eval_loss": 0.21349507570266724, |
|
"eval_precision": 0.6847682119205298, |
|
"eval_recall": 0.618421052631579, |
|
"eval_runtime": 6.7376, |
|
"eval_samples_per_second": 149.757, |
|
"eval_steps_per_second": 18.849, |
|
"step": 2700 |
|
}, |
|
{ |
|
"epoch": 6.59, |
|
"eval_accuracy_score": 0.9620542808110342, |
|
"eval_f1": 0.6467218332272437, |
|
"eval_loss": 0.2102096974849701, |
|
"eval_precision": 0.691156462585034, |
|
"eval_recall": 0.6076555023923444, |
|
"eval_runtime": 6.7394, |
|
"eval_samples_per_second": 149.717, |
|
"eval_steps_per_second": 18.844, |
|
"step": 2800 |
|
}, |
|
{ |
|
"epoch": 6.82, |
|
"eval_accuracy_score": 0.9630076908409076, |
|
"eval_f1": 0.6658385093167701, |
|
"eval_loss": 0.2015107125043869, |
|
"eval_precision": 0.6925064599483204, |
|
"eval_recall": 0.6411483253588517, |
|
"eval_runtime": 6.7773, |
|
"eval_samples_per_second": 148.879, |
|
"eval_steps_per_second": 18.739, |
|
"step": 2900 |
|
}, |
|
{ |
|
"epoch": 7.06, |
|
"learning_rate": 3.8235294117647055e-06, |
|
"loss": 0.0674, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 7.06, |
|
"eval_accuracy_score": 0.96364329752749, |
|
"eval_f1": 0.6624921728240452, |
|
"eval_loss": 0.20179474353790283, |
|
"eval_precision": 0.695137976346912, |
|
"eval_recall": 0.6327751196172249, |
|
"eval_runtime": 6.8013, |
|
"eval_samples_per_second": 148.354, |
|
"eval_steps_per_second": 18.673, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 7.29, |
|
"eval_accuracy_score": 0.9629441301722494, |
|
"eval_f1": 0.6454431960049937, |
|
"eval_loss": 0.20865464210510254, |
|
"eval_precision": 0.674934725848564, |
|
"eval_recall": 0.618421052631579, |
|
"eval_runtime": 6.7901, |
|
"eval_samples_per_second": 148.599, |
|
"eval_steps_per_second": 18.704, |
|
"step": 3100 |
|
}, |
|
{ |
|
"epoch": 7.53, |
|
"eval_accuracy_score": 0.9631983728468824, |
|
"eval_f1": 0.6507237256135934, |
|
"eval_loss": 0.2077988088130951, |
|
"eval_precision": 0.6865869853917662, |
|
"eval_recall": 0.618421052631579, |
|
"eval_runtime": 6.7566, |
|
"eval_samples_per_second": 149.335, |
|
"eval_steps_per_second": 18.796, |
|
"step": 3200 |
|
}, |
|
{ |
|
"epoch": 7.76, |
|
"eval_accuracy_score": 0.9626898874976165, |
|
"eval_f1": 0.6499678869621066, |
|
"eval_loss": 0.2155311405658722, |
|
"eval_precision": 0.7018030513176144, |
|
"eval_recall": 0.6052631578947368, |
|
"eval_runtime": 6.7572, |
|
"eval_samples_per_second": 149.321, |
|
"eval_steps_per_second": 18.795, |
|
"step": 3300 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy_score": 0.9624356448229835, |
|
"eval_f1": 0.6524271844660194, |
|
"eval_loss": 0.21822784841060638, |
|
"eval_precision": 0.7108603667136812, |
|
"eval_recall": 0.6028708133971292, |
|
"eval_runtime": 6.7807, |
|
"eval_samples_per_second": 148.804, |
|
"eval_steps_per_second": 18.73, |
|
"step": 3400 |
|
}, |
|
{ |
|
"epoch": 8.24, |
|
"learning_rate": 3.6274509803921573e-06, |
|
"loss": 0.0559, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 8.24, |
|
"eval_accuracy_score": 0.9631348121782242, |
|
"eval_f1": 0.659062103929024, |
|
"eval_loss": 0.21273677051067352, |
|
"eval_precision": 0.7008086253369272, |
|
"eval_recall": 0.6220095693779905, |
|
"eval_runtime": 6.7444, |
|
"eval_samples_per_second": 149.606, |
|
"eval_steps_per_second": 18.831, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 8.47, |
|
"eval_accuracy_score": 0.9634526155215153, |
|
"eval_f1": 0.6608478802992518, |
|
"eval_loss": 0.20193149149417877, |
|
"eval_precision": 0.6901041666666666, |
|
"eval_recall": 0.6339712918660287, |
|
"eval_runtime": 8.1777, |
|
"eval_samples_per_second": 123.384, |
|
"eval_steps_per_second": 15.53, |
|
"step": 3600 |
|
}, |
|
{ |
|
"epoch": 8.71, |
|
"eval_accuracy_score": 0.9634526155215153, |
|
"eval_f1": 0.6587942821628341, |
|
"eval_loss": 0.20160645246505737, |
|
"eval_precision": 0.685640362225097, |
|
"eval_recall": 0.6339712918660287, |
|
"eval_runtime": 6.7668, |
|
"eval_samples_per_second": 149.11, |
|
"eval_steps_per_second": 18.768, |
|
"step": 3700 |
|
}, |
|
{ |
|
"epoch": 8.94, |
|
"eval_accuracy_score": 0.9634526155215153, |
|
"eval_f1": 0.662553979025293, |
|
"eval_loss": 0.20665320754051208, |
|
"eval_precision": 0.6840764331210191, |
|
"eval_recall": 0.6423444976076556, |
|
"eval_runtime": 6.7328, |
|
"eval_samples_per_second": 149.863, |
|
"eval_steps_per_second": 18.863, |
|
"step": 3800 |
|
}, |
|
{ |
|
"epoch": 9.18, |
|
"eval_accuracy_score": 0.9629441301722494, |
|
"eval_f1": 0.6566775244299674, |
|
"eval_loss": 0.22287048399448395, |
|
"eval_precision": 0.721030042918455, |
|
"eval_recall": 0.6028708133971292, |
|
"eval_runtime": 6.7851, |
|
"eval_samples_per_second": 148.709, |
|
"eval_steps_per_second": 18.718, |
|
"step": 3900 |
|
}, |
|
{ |
|
"epoch": 9.41, |
|
"learning_rate": 3.431372549019608e-06, |
|
"loss": 0.0459, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 9.41, |
|
"eval_accuracy_score": 0.9635797368588318, |
|
"eval_f1": 0.6574827802128992, |
|
"eval_loss": 0.20987075567245483, |
|
"eval_precision": 0.6898817345597897, |
|
"eval_recall": 0.6279904306220095, |
|
"eval_runtime": 6.7469, |
|
"eval_samples_per_second": 149.549, |
|
"eval_steps_per_second": 18.823, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 9.65, |
|
"eval_accuracy_score": 0.9628805695035911, |
|
"eval_f1": 0.6568690095846645, |
|
"eval_loss": 0.22190582752227783, |
|
"eval_precision": 0.7050754458161865, |
|
"eval_recall": 0.6148325358851675, |
|
"eval_runtime": 6.7586, |
|
"eval_samples_per_second": 149.292, |
|
"eval_steps_per_second": 18.791, |
|
"step": 4100 |
|
}, |
|
{ |
|
"epoch": 9.88, |
|
"eval_accuracy_score": 0.9632619335155406, |
|
"eval_f1": 0.6525265127885215, |
|
"eval_loss": 0.21028834581375122, |
|
"eval_precision": 0.681877444589309, |
|
"eval_recall": 0.6255980861244019, |
|
"eval_runtime": 6.7583, |
|
"eval_samples_per_second": 149.298, |
|
"eval_steps_per_second": 18.792, |
|
"step": 4200 |
|
}, |
|
{ |
|
"epoch": 10.12, |
|
"eval_accuracy_score": 0.9640882222080976, |
|
"eval_f1": 0.6692111959287532, |
|
"eval_loss": 0.2170829027891159, |
|
"eval_precision": 0.7146739130434783, |
|
"eval_recall": 0.6291866028708134, |
|
"eval_runtime": 6.7544, |
|
"eval_samples_per_second": 149.383, |
|
"eval_steps_per_second": 18.802, |
|
"step": 4300 |
|
}, |
|
{ |
|
"epoch": 10.35, |
|
"eval_accuracy_score": 0.9630712515095659, |
|
"eval_f1": 0.6495619524405507, |
|
"eval_loss": 0.2193835973739624, |
|
"eval_precision": 0.6811023622047244, |
|
"eval_recall": 0.6208133971291866, |
|
"eval_runtime": 6.7362, |
|
"eval_samples_per_second": 149.787, |
|
"eval_steps_per_second": 18.853, |
|
"step": 4400 |
|
}, |
|
{ |
|
"epoch": 10.59, |
|
"learning_rate": 3.2352941176470594e-06, |
|
"loss": 0.0399, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 10.59, |
|
"eval_accuracy_score": 0.9634526155215153, |
|
"eval_f1": 0.6556543837357053, |
|
"eval_loss": 0.21863853931427002, |
|
"eval_precision": 0.6991869918699187, |
|
"eval_recall": 0.6172248803827751, |
|
"eval_runtime": 6.769, |
|
"eval_samples_per_second": 149.062, |
|
"eval_steps_per_second": 18.762, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 10.82, |
|
"eval_accuracy_score": 0.9637068581961482, |
|
"eval_f1": 0.6624685138539044, |
|
"eval_loss": 0.21445031464099884, |
|
"eval_precision": 0.699468085106383, |
|
"eval_recall": 0.6291866028708134, |
|
"eval_runtime": 6.7298, |
|
"eval_samples_per_second": 149.93, |
|
"eval_steps_per_second": 18.871, |
|
"step": 4600 |
|
}, |
|
{ |
|
"epoch": 11.06, |
|
"eval_accuracy_score": 0.9644695862200471, |
|
"eval_f1": 0.6759142496847416, |
|
"eval_loss": 0.20991285145282745, |
|
"eval_precision": 0.7146666666666667, |
|
"eval_recall": 0.6411483253588517, |
|
"eval_runtime": 6.734, |
|
"eval_samples_per_second": 149.837, |
|
"eval_steps_per_second": 18.86, |
|
"step": 4700 |
|
}, |
|
{ |
|
"epoch": 11.29, |
|
"eval_accuracy_score": 0.96364329752749, |
|
"eval_f1": 0.6649778340721977, |
|
"eval_loss": 0.22495105862617493, |
|
"eval_precision": 0.7065948855989233, |
|
"eval_recall": 0.6279904306220095, |
|
"eval_runtime": 6.7408, |
|
"eval_samples_per_second": 149.687, |
|
"eval_steps_per_second": 18.841, |
|
"step": 4800 |
|
}, |
|
{ |
|
"epoch": 11.53, |
|
"eval_accuracy_score": 0.9639611008707811, |
|
"eval_f1": 0.6670894102726697, |
|
"eval_loss": 0.22267203032970428, |
|
"eval_precision": 0.7098515519568152, |
|
"eval_recall": 0.6291866028708134, |
|
"eval_runtime": 6.7689, |
|
"eval_samples_per_second": 149.064, |
|
"eval_steps_per_second": 18.762, |
|
"step": 4900 |
|
}, |
|
{ |
|
"epoch": 11.76, |
|
"learning_rate": 3.03921568627451e-06, |
|
"loss": 0.0368, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 11.76, |
|
"eval_accuracy_score": 0.9637068581961482, |
|
"eval_f1": 0.6588235294117647, |
|
"eval_loss": 0.21161217987537384, |
|
"eval_precision": 0.6829268292682927, |
|
"eval_recall": 0.6363636363636364, |
|
"eval_runtime": 6.7536, |
|
"eval_samples_per_second": 149.402, |
|
"eval_steps_per_second": 18.805, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_accuracy_score": 0.9625627661603, |
|
"eval_f1": 0.6593830334190232, |
|
"eval_loss": 0.227540984749794, |
|
"eval_precision": 0.7125, |
|
"eval_recall": 0.6136363636363636, |
|
"eval_runtime": 6.7584, |
|
"eval_samples_per_second": 149.295, |
|
"eval_steps_per_second": 18.791, |
|
"step": 5100 |
|
}, |
|
{ |
|
"epoch": 12.24, |
|
"eval_accuracy_score": 0.9628805695035911, |
|
"eval_f1": 0.6640471512770137, |
|
"eval_loss": 0.23519518971443176, |
|
"eval_precision": 0.7337192474674384, |
|
"eval_recall": 0.6064593301435407, |
|
"eval_runtime": 6.7729, |
|
"eval_samples_per_second": 148.976, |
|
"eval_steps_per_second": 18.751, |
|
"step": 5200 |
|
}, |
|
{ |
|
"epoch": 12.47, |
|
"eval_accuracy_score": 0.9628170088349329, |
|
"eval_f1": 0.6679462571976967, |
|
"eval_loss": 0.2271033227443695, |
|
"eval_precision": 0.7180192572214581, |
|
"eval_recall": 0.6244019138755981, |
|
"eval_runtime": 6.7726, |
|
"eval_samples_per_second": 148.983, |
|
"eval_steps_per_second": 18.752, |
|
"step": 5300 |
|
}, |
|
{ |
|
"epoch": 12.71, |
|
"eval_accuracy_score": 0.9630076908409076, |
|
"eval_f1": 0.6628643852978454, |
|
"eval_loss": 0.22853700816631317, |
|
"eval_precision": 0.7048517520215634, |
|
"eval_recall": 0.6255980861244019, |
|
"eval_runtime": 6.7535, |
|
"eval_samples_per_second": 149.405, |
|
"eval_steps_per_second": 18.805, |
|
"step": 5400 |
|
}, |
|
{ |
|
"epoch": 12.94, |
|
"learning_rate": 2.843137254901961e-06, |
|
"loss": 0.0321, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 12.94, |
|
"eval_accuracy_score": 0.9631348121782242, |
|
"eval_f1": 0.664548919949174, |
|
"eval_loss": 0.22333784401416779, |
|
"eval_precision": 0.7086720867208672, |
|
"eval_recall": 0.6255980861244019, |
|
"eval_runtime": 6.7401, |
|
"eval_samples_per_second": 149.702, |
|
"eval_steps_per_second": 18.843, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 13.18, |
|
"eval_accuracy_score": 0.9637068581961482, |
|
"eval_f1": 0.6705054382597568, |
|
"eval_loss": 0.222885861992836, |
|
"eval_precision": 0.7207702888583218, |
|
"eval_recall": 0.6267942583732058, |
|
"eval_runtime": 6.7486, |
|
"eval_samples_per_second": 149.513, |
|
"eval_steps_per_second": 18.819, |
|
"step": 5600 |
|
}, |
|
{ |
|
"epoch": 13.41, |
|
"eval_accuracy_score": 0.9633254941841988, |
|
"eval_f1": 0.6619718309859155, |
|
"eval_loss": 0.2285127490758896, |
|
"eval_precision": 0.7121212121212122, |
|
"eval_recall": 0.618421052631579, |
|
"eval_runtime": 6.8129, |
|
"eval_samples_per_second": 148.102, |
|
"eval_steps_per_second": 18.641, |
|
"step": 5700 |
|
}, |
|
{ |
|
"epoch": 13.65, |
|
"eval_accuracy_score": 0.9644695862200471, |
|
"eval_f1": 0.6734177215189874, |
|
"eval_loss": 0.22083869576454163, |
|
"eval_precision": 0.7150537634408602, |
|
"eval_recall": 0.6363636363636364, |
|
"eval_runtime": 6.7283, |
|
"eval_samples_per_second": 149.964, |
|
"eval_steps_per_second": 18.876, |
|
"step": 5800 |
|
}, |
|
{ |
|
"epoch": 13.88, |
|
"eval_accuracy_score": 0.9635161761901735, |
|
"eval_f1": 0.6684005201560469, |
|
"eval_loss": 0.2334665209054947, |
|
"eval_precision": 0.7321937321937322, |
|
"eval_recall": 0.6148325358851675, |
|
"eval_runtime": 6.7215, |
|
"eval_samples_per_second": 150.116, |
|
"eval_steps_per_second": 18.895, |
|
"step": 5900 |
|
}, |
|
{ |
|
"epoch": 14.12, |
|
"learning_rate": 2.647058823529412e-06, |
|
"loss": 0.0291, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 14.12, |
|
"eval_accuracy_score": 0.9641517828767558, |
|
"eval_f1": 0.663265306122449, |
|
"eval_loss": 0.2206926792860031, |
|
"eval_precision": 0.7103825136612022, |
|
"eval_recall": 0.6220095693779905, |
|
"eval_runtime": 6.7314, |
|
"eval_samples_per_second": 149.894, |
|
"eval_steps_per_second": 18.867, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 14.35, |
|
"eval_accuracy_score": 0.9650416322379711, |
|
"eval_f1": 0.6737633061991233, |
|
"eval_loss": 0.21664156019687653, |
|
"eval_precision": 0.7069645203679369, |
|
"eval_recall": 0.6435406698564593, |
|
"eval_runtime": 6.8128, |
|
"eval_samples_per_second": 148.104, |
|
"eval_steps_per_second": 18.641, |
|
"step": 6100 |
|
}, |
|
{ |
|
"epoch": 14.59, |
|
"eval_accuracy_score": 0.9646602682260217, |
|
"eval_f1": 0.6654275092936804, |
|
"eval_loss": 0.20899562537670135, |
|
"eval_precision": 0.6902313624678663, |
|
"eval_recall": 0.6423444976076556, |
|
"eval_runtime": 6.7812, |
|
"eval_samples_per_second": 148.794, |
|
"eval_steps_per_second": 18.728, |
|
"step": 6200 |
|
}, |
|
{ |
|
"epoch": 14.82, |
|
"eval_accuracy_score": 0.9647873895633382, |
|
"eval_f1": 0.6766917293233083, |
|
"eval_loss": 0.21245865523815155, |
|
"eval_precision": 0.7105263157894737, |
|
"eval_recall": 0.645933014354067, |
|
"eval_runtime": 6.7236, |
|
"eval_samples_per_second": 150.069, |
|
"eval_steps_per_second": 18.889, |
|
"step": 6300 |
|
}, |
|
{ |
|
"epoch": 15.06, |
|
"eval_accuracy_score": 0.9637704188648064, |
|
"eval_f1": 0.6666666666666667, |
|
"eval_loss": 0.22959989309310913, |
|
"eval_precision": 0.713506139154161, |
|
"eval_recall": 0.6255980861244019, |
|
"eval_runtime": 6.7691, |
|
"eval_samples_per_second": 149.061, |
|
"eval_steps_per_second": 18.762, |
|
"step": 6400 |
|
}, |
|
{ |
|
"epoch": 15.29, |
|
"learning_rate": 2.450980392156863e-06, |
|
"loss": 0.0251, |
|
"step": 6500 |
|
}, |
|
{ |
|
"epoch": 15.29, |
|
"eval_accuracy_score": 0.9645331468887053, |
|
"eval_f1": 0.6733542319749217, |
|
"eval_loss": 0.22114437818527222, |
|
"eval_precision": 0.7075098814229249, |
|
"eval_recall": 0.6423444976076556, |
|
"eval_runtime": 6.8495, |
|
"eval_samples_per_second": 147.311, |
|
"eval_steps_per_second": 18.542, |
|
"step": 6500 |
|
}, |
|
{ |
|
"epoch": 15.53, |
|
"eval_accuracy_score": 0.9640882222080976, |
|
"eval_f1": 0.6713197969543148, |
|
"eval_loss": 0.22384566068649292, |
|
"eval_precision": 0.7148648648648649, |
|
"eval_recall": 0.6327751196172249, |
|
"eval_runtime": 6.7143, |
|
"eval_samples_per_second": 150.277, |
|
"eval_steps_per_second": 18.915, |
|
"step": 6600 |
|
}, |
|
{ |
|
"epoch": 15.76, |
|
"eval_accuracy_score": 0.9637068581961482, |
|
"eval_f1": 0.6641172721478649, |
|
"eval_loss": 0.23098178207874298, |
|
"eval_precision": 0.7107776261937244, |
|
"eval_recall": 0.6232057416267942, |
|
"eval_runtime": 6.7457, |
|
"eval_samples_per_second": 149.576, |
|
"eval_steps_per_second": 18.827, |
|
"step": 6700 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_accuracy_score": 0.9650416322379711, |
|
"eval_f1": 0.6762860727728984, |
|
"eval_loss": 0.21991874277591705, |
|
"eval_precision": 0.7110817941952506, |
|
"eval_recall": 0.6447368421052632, |
|
"eval_runtime": 6.7686, |
|
"eval_samples_per_second": 149.07, |
|
"eval_steps_per_second": 18.763, |
|
"step": 6800 |
|
}, |
|
{ |
|
"epoch": 16.24, |
|
"eval_accuracy_score": 0.96364329752749, |
|
"eval_f1": 0.6636771300448431, |
|
"eval_loss": 0.23369288444519043, |
|
"eval_precision": 0.7144827586206897, |
|
"eval_recall": 0.6196172248803827, |
|
"eval_runtime": 6.8164, |
|
"eval_samples_per_second": 148.025, |
|
"eval_steps_per_second": 18.631, |
|
"step": 6900 |
|
}, |
|
{ |
|
"epoch": 16.47, |
|
"learning_rate": 2.254901960784314e-06, |
|
"loss": 0.0227, |
|
"step": 7000 |
|
}, |
|
{ |
|
"epoch": 16.47, |
|
"eval_accuracy_score": 0.9646602682260217, |
|
"eval_f1": 0.6712243629583592, |
|
"eval_loss": 0.22149834036827087, |
|
"eval_precision": 0.6985769728331177, |
|
"eval_recall": 0.645933014354067, |
|
"eval_runtime": 6.7644, |
|
"eval_samples_per_second": 149.164, |
|
"eval_steps_per_second": 18.775, |
|
"step": 7000 |
|
}, |
|
{ |
|
"epoch": 16.71, |
|
"eval_accuracy_score": 0.9645331468887053, |
|
"eval_f1": 0.6687422166874221, |
|
"eval_loss": 0.2212422788143158, |
|
"eval_precision": 0.6974025974025974, |
|
"eval_recall": 0.6423444976076556, |
|
"eval_runtime": 6.7009, |
|
"eval_samples_per_second": 150.576, |
|
"eval_steps_per_second": 18.953, |
|
"step": 7100 |
|
}, |
|
{ |
|
"epoch": 16.94, |
|
"eval_accuracy_score": 0.9635161761901735, |
|
"eval_f1": 0.6653821451509313, |
|
"eval_loss": 0.24178394675254822, |
|
"eval_precision": 0.7184466019417476, |
|
"eval_recall": 0.6196172248803827, |
|
"eval_runtime": 6.7952, |
|
"eval_samples_per_second": 148.486, |
|
"eval_steps_per_second": 18.69, |
|
"step": 7200 |
|
}, |
|
{ |
|
"epoch": 17.18, |
|
"eval_accuracy_score": 0.9633890548528571, |
|
"eval_f1": 0.6675307841866494, |
|
"eval_loss": 0.24713467061519623, |
|
"eval_precision": 0.7284299858557284, |
|
"eval_recall": 0.6160287081339713, |
|
"eval_runtime": 6.807, |
|
"eval_samples_per_second": 148.229, |
|
"eval_steps_per_second": 18.657, |
|
"step": 7300 |
|
}, |
|
{ |
|
"epoch": 17.41, |
|
"eval_accuracy_score": 0.9643424648827306, |
|
"eval_f1": 0.670031545741325, |
|
"eval_loss": 0.22886203229427338, |
|
"eval_precision": 0.7089452603471295, |
|
"eval_recall": 0.6351674641148325, |
|
"eval_runtime": 6.7775, |
|
"eval_samples_per_second": 148.874, |
|
"eval_steps_per_second": 18.738, |
|
"step": 7400 |
|
}, |
|
{ |
|
"epoch": 17.65, |
|
"learning_rate": 2.058823529411765e-06, |
|
"loss": 0.0197, |
|
"step": 7500 |
|
}, |
|
{ |
|
"epoch": 17.65, |
|
"eval_accuracy_score": 0.9646602682260217, |
|
"eval_f1": 0.6753731343283582, |
|
"eval_loss": 0.22524945437908173, |
|
"eval_precision": 0.7033678756476683, |
|
"eval_recall": 0.6495215311004785, |
|
"eval_runtime": 6.7338, |
|
"eval_samples_per_second": 149.84, |
|
"eval_steps_per_second": 18.86, |
|
"step": 7500 |
|
}, |
|
{ |
|
"epoch": 17.88, |
|
"eval_accuracy_score": 0.9633890548528571, |
|
"eval_f1": 0.664528543938422, |
|
"eval_loss": 0.24701638519763947, |
|
"eval_precision": 0.7164591977869986, |
|
"eval_recall": 0.6196172248803827, |
|
"eval_runtime": 6.7838, |
|
"eval_samples_per_second": 148.736, |
|
"eval_steps_per_second": 18.721, |
|
"step": 7600 |
|
}, |
|
{ |
|
"epoch": 18.12, |
|
"eval_accuracy_score": 0.9654865569185788, |
|
"eval_f1": 0.6825, |
|
"eval_loss": 0.22353364527225494, |
|
"eval_precision": 0.7146596858638743, |
|
"eval_recall": 0.65311004784689, |
|
"eval_runtime": 6.7595, |
|
"eval_samples_per_second": 149.272, |
|
"eval_steps_per_second": 18.788, |
|
"step": 7700 |
|
}, |
|
{ |
|
"epoch": 18.35, |
|
"eval_accuracy_score": 0.9638975402021229, |
|
"eval_f1": 0.6590765338393421, |
|
"eval_loss": 0.23786970973014832, |
|
"eval_precision": 0.6993288590604027, |
|
"eval_recall": 0.6232057416267942, |
|
"eval_runtime": 6.8141, |
|
"eval_samples_per_second": 148.075, |
|
"eval_steps_per_second": 18.638, |
|
"step": 7800 |
|
}, |
|
{ |
|
"epoch": 18.59, |
|
"eval_accuracy_score": 0.9644060255513888, |
|
"eval_f1": 0.6666666666666667, |
|
"eval_loss": 0.23264023661613464, |
|
"eval_precision": 0.7014531043593131, |
|
"eval_recall": 0.6351674641148325, |
|
"eval_runtime": 6.8013, |
|
"eval_samples_per_second": 148.353, |
|
"eval_steps_per_second": 18.673, |
|
"step": 7900 |
|
}, |
|
{ |
|
"epoch": 18.82, |
|
"learning_rate": 1.8627450980392158e-06, |
|
"loss": 0.0183, |
|
"step": 8000 |
|
}, |
|
{ |
|
"epoch": 18.82, |
|
"eval_accuracy_score": 0.9649780715693129, |
|
"eval_f1": 0.6724244293645897, |
|
"eval_loss": 0.22304123640060425, |
|
"eval_precision": 0.6942675159235668, |
|
"eval_recall": 0.6519138755980861, |
|
"eval_runtime": 6.7426, |
|
"eval_samples_per_second": 149.646, |
|
"eval_steps_per_second": 18.835, |
|
"step": 8000 |
|
}, |
|
{ |
|
"epoch": 19.06, |
|
"eval_accuracy_score": 0.9643424648827306, |
|
"eval_f1": 0.6683480453972257, |
|
"eval_loss": 0.2350449413061142, |
|
"eval_precision": 0.7066666666666667, |
|
"eval_recall": 0.6339712918660287, |
|
"eval_runtime": 6.8057, |
|
"eval_samples_per_second": 148.259, |
|
"eval_steps_per_second": 18.661, |
|
"step": 8100 |
|
}, |
|
{ |
|
"epoch": 19.29, |
|
"eval_accuracy_score": 0.9652323142439458, |
|
"eval_f1": 0.6790582403965303, |
|
"eval_loss": 0.226871520280838, |
|
"eval_precision": 0.7043701799485861, |
|
"eval_recall": 0.6555023923444976, |
|
"eval_runtime": 6.7483, |
|
"eval_samples_per_second": 149.519, |
|
"eval_steps_per_second": 18.819, |
|
"step": 8200 |
|
}, |
|
{ |
|
"epoch": 19.53, |
|
"eval_accuracy_score": 0.96472382889468, |
|
"eval_f1": 0.6683354192740926, |
|
"eval_loss": 0.23186342418193817, |
|
"eval_precision": 0.7007874015748031, |
|
"eval_recall": 0.638755980861244, |
|
"eval_runtime": 6.7632, |
|
"eval_samples_per_second": 149.19, |
|
"eval_steps_per_second": 18.778, |
|
"step": 8300 |
|
}, |
|
{ |
|
"epoch": 19.76, |
|
"eval_accuracy_score": 0.9645967075573635, |
|
"eval_f1": 0.6712933753943218, |
|
"eval_loss": 0.2337142825126648, |
|
"eval_precision": 0.7102803738317757, |
|
"eval_recall": 0.6363636363636364, |
|
"eval_runtime": 6.7451, |
|
"eval_samples_per_second": 149.591, |
|
"eval_steps_per_second": 18.829, |
|
"step": 8400 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"learning_rate": 1.6666666666666667e-06, |
|
"loss": 0.0162, |
|
"step": 8500 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_accuracy_score": 0.9647873895633382, |
|
"eval_f1": 0.6751430387794024, |
|
"eval_loss": 0.2389359027147293, |
|
"eval_precision": 0.7204884667571235, |
|
"eval_recall": 0.6351674641148325, |
|
"eval_runtime": 6.7503, |
|
"eval_samples_per_second": 149.474, |
|
"eval_steps_per_second": 18.814, |
|
"step": 8500 |
|
}, |
|
{ |
|
"epoch": 20.24, |
|
"eval_accuracy_score": 0.9638975402021229, |
|
"eval_f1": 0.6709677419354839, |
|
"eval_loss": 0.25359493494033813, |
|
"eval_precision": 0.7282913165266106, |
|
"eval_recall": 0.6220095693779905, |
|
"eval_runtime": 6.7422, |
|
"eval_samples_per_second": 149.655, |
|
"eval_steps_per_second": 18.837, |
|
"step": 8600 |
|
}, |
|
{ |
|
"epoch": 20.47, |
|
"eval_accuracy_score": 0.964215343545414, |
|
"eval_f1": 0.6709346991037132, |
|
"eval_loss": 0.24693100154399872, |
|
"eval_precision": 0.721763085399449, |
|
"eval_recall": 0.6267942583732058, |
|
"eval_runtime": 6.7296, |
|
"eval_samples_per_second": 149.934, |
|
"eval_steps_per_second": 18.872, |
|
"step": 8700 |
|
}, |
|
{ |
|
"epoch": 20.71, |
|
"eval_accuracy_score": 0.9637704188648064, |
|
"eval_f1": 0.6687938736439056, |
|
"eval_loss": 0.2458009421825409, |
|
"eval_precision": 0.7168262653898769, |
|
"eval_recall": 0.6267942583732058, |
|
"eval_runtime": 6.7627, |
|
"eval_samples_per_second": 149.201, |
|
"eval_steps_per_second": 18.78, |
|
"step": 8800 |
|
}, |
|
{ |
|
"epoch": 20.94, |
|
"eval_accuracy_score": 0.9648509502319964, |
|
"eval_f1": 0.676304211187932, |
|
"eval_loss": 0.23430827260017395, |
|
"eval_precision": 0.7125827814569536, |
|
"eval_recall": 0.6435406698564593, |
|
"eval_runtime": 6.7289, |
|
"eval_samples_per_second": 149.951, |
|
"eval_steps_per_second": 18.874, |
|
"step": 8900 |
|
}, |
|
{ |
|
"epoch": 21.18, |
|
"learning_rate": 1.4705882352941177e-06, |
|
"loss": 0.0149, |
|
"step": 9000 |
|
}, |
|
{ |
|
"epoch": 21.18, |
|
"eval_accuracy_score": 0.9651687535752876, |
|
"eval_f1": 0.6788413098236775, |
|
"eval_loss": 0.23078210651874542, |
|
"eval_precision": 0.7167553191489362, |
|
"eval_recall": 0.6447368421052632, |
|
"eval_runtime": 6.7181, |
|
"eval_samples_per_second": 150.19, |
|
"eval_steps_per_second": 18.904, |
|
"step": 9000 |
|
} |
|
], |
|
"max_steps": 12750, |
|
"num_train_epochs": 30, |
|
"total_flos": 4695577703714304.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|