llmv3-4000 / trainer_state.json
bmpipli's picture
Upload 11 files
78d35d2
{
"best_metric": 0.9796821008984106,
"best_model_checkpoint": "test/checkpoint-1500",
"epoch": 13.377926421404682,
"global_step": 4000,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.03,
"eval_accuracy": 0.8922687113634554,
"eval_f1": 0.0,
"eval_loss": 1.3138163089752197,
"eval_precision": 0.0,
"eval_recall": 0.0,
"eval_runtime": 42.6447,
"eval_samples_per_second": 10.06,
"eval_steps_per_second": 1.688,
"step": 10
},
{
"epoch": 0.07,
"eval_accuracy": 0.8922687113634554,
"eval_f1": 0.0,
"eval_loss": 0.7134402394294739,
"eval_precision": 0.0,
"eval_recall": 0.0,
"eval_runtime": 44.6528,
"eval_samples_per_second": 9.607,
"eval_steps_per_second": 1.612,
"step": 20
},
{
"epoch": 0.1,
"eval_accuracy": 0.8922687113634554,
"eval_f1": 0.0,
"eval_loss": 0.6043053865432739,
"eval_precision": 0.0,
"eval_recall": 0.0,
"eval_runtime": 44.2765,
"eval_samples_per_second": 9.689,
"eval_steps_per_second": 1.626,
"step": 30
},
{
"epoch": 0.13,
"eval_accuracy": 0.8922687113634554,
"eval_f1": 0.0,
"eval_loss": 0.5121276378631592,
"eval_precision": 0.0,
"eval_recall": 0.0,
"eval_runtime": 45.3257,
"eval_samples_per_second": 9.465,
"eval_steps_per_second": 1.589,
"step": 40
},
{
"epoch": 0.17,
"eval_accuracy": 0.8922687113634554,
"eval_f1": 0.0,
"eval_loss": 0.4018501937389374,
"eval_precision": 0.0,
"eval_recall": 0.0,
"eval_runtime": 44.7272,
"eval_samples_per_second": 9.591,
"eval_steps_per_second": 1.61,
"step": 50
},
{
"epoch": 0.2,
"eval_accuracy": 0.908479477859436,
"eval_f1": 0.0,
"eval_loss": 0.3501987159252167,
"eval_precision": 0.0,
"eval_recall": 0.0,
"eval_runtime": 44.7765,
"eval_samples_per_second": 9.581,
"eval_steps_per_second": 1.608,
"step": 60
},
{
"epoch": 0.23,
"eval_accuracy": 0.9237218434108938,
"eval_f1": 0.0,
"eval_loss": 0.29354768991470337,
"eval_precision": 0.0,
"eval_recall": 0.0,
"eval_runtime": 44.776,
"eval_samples_per_second": 9.581,
"eval_steps_per_second": 1.608,
"step": 70
},
{
"epoch": 0.27,
"eval_accuracy": 0.9264413255153751,
"eval_f1": 0.0008230452674897119,
"eval_loss": 0.24890266358852386,
"eval_precision": 0.001594896331738437,
"eval_recall": 0.0005546311702717693,
"eval_runtime": 44.807,
"eval_samples_per_second": 9.574,
"eval_steps_per_second": 1.607,
"step": 80
},
{
"epoch": 0.3,
"eval_accuracy": 0.9392427900559815,
"eval_f1": 0.013897161008536827,
"eval_loss": 0.2203027307987213,
"eval_precision": 0.02445842068483578,
"eval_recall": 0.009706045479755962,
"eval_runtime": 44.7926,
"eval_samples_per_second": 9.577,
"eval_steps_per_second": 1.607,
"step": 90
},
{
"epoch": 0.33,
"eval_accuracy": 0.935727361969701,
"eval_f1": 0.00045840018336007336,
"eval_loss": 0.19940191507339478,
"eval_precision": 0.001321003963011889,
"eval_recall": 0.00027731558513588466,
"eval_runtime": 44.7253,
"eval_samples_per_second": 9.592,
"eval_steps_per_second": 1.61,
"step": 100
},
{
"epoch": 0.37,
"eval_accuracy": 0.943779682152238,
"eval_f1": 0.07579030041233065,
"eval_loss": 0.1813557893037796,
"eval_precision": 0.12979152656355078,
"eval_recall": 0.053521907931225736,
"eval_runtime": 44.6764,
"eval_samples_per_second": 9.602,
"eval_steps_per_second": 1.612,
"step": 110
},
{
"epoch": 0.4,
"eval_accuracy": 0.9479053354912313,
"eval_f1": 0.11372837688627163,
"eval_loss": 0.16338485479354858,
"eval_precision": 0.16903719912472648,
"eval_recall": 0.08569051580698835,
"eval_runtime": 44.7776,
"eval_samples_per_second": 9.581,
"eval_steps_per_second": 1.608,
"step": 120
},
{
"epoch": 0.43,
"eval_accuracy": 0.9628027911172429,
"eval_f1": 0.33931930904737473,
"eval_loss": 0.14094215631484985,
"eval_precision": 0.4426595269968764,
"eval_recall": 0.27509706045479754,
"eval_runtime": 44.9683,
"eval_samples_per_second": 9.54,
"eval_steps_per_second": 1.601,
"step": 130
},
{
"epoch": 0.47,
"eval_accuracy": 0.9663580165026133,
"eval_f1": 0.34743875278396436,
"eval_loss": 0.12451943010091782,
"eval_precision": 0.40746268656716417,
"eval_recall": 0.30282861896838603,
"eval_runtime": 44.682,
"eval_samples_per_second": 9.601,
"eval_steps_per_second": 1.611,
"step": 140
},
{
"epoch": 0.5,
"eval_accuracy": 0.9711734896924995,
"eval_f1": 0.47246835443037977,
"eval_loss": 0.11197753250598907,
"eval_precision": 0.5501105379513633,
"eval_recall": 0.4140321686078758,
"eval_runtime": 44.7253,
"eval_samples_per_second": 9.592,
"eval_steps_per_second": 1.61,
"step": 150
},
{
"epoch": 0.54,
"eval_accuracy": 0.9736674537688043,
"eval_f1": 0.5392111368909513,
"eval_loss": 0.09976229071617126,
"eval_precision": 0.6096537250786989,
"eval_recall": 0.48336106489184694,
"eval_runtime": 44.7165,
"eval_samples_per_second": 9.594,
"eval_steps_per_second": 1.61,
"step": 160
},
{
"epoch": 0.57,
"eval_accuracy": 0.9746623862460534,
"eval_f1": 0.5685945368533496,
"eval_loss": 0.09186050295829773,
"eval_precision": 0.6321683067526298,
"eval_recall": 0.5166389351081531,
"eval_runtime": 44.7738,
"eval_samples_per_second": 9.582,
"eval_steps_per_second": 1.608,
"step": 170
},
{
"epoch": 0.6,
"eval_accuracy": 0.9771696160887214,
"eval_f1": 0.5888754534461911,
"eval_loss": 0.0845290869474411,
"eval_precision": 0.6471760797342193,
"eval_recall": 0.5402107598447032,
"eval_runtime": 44.7399,
"eval_samples_per_second": 9.589,
"eval_steps_per_second": 1.609,
"step": 180
},
{
"epoch": 0.64,
"eval_accuracy": 0.980194210819559,
"eval_f1": 0.6471658078205517,
"eval_loss": 0.07714465260505676,
"eval_precision": 0.7135695187165776,
"eval_recall": 0.5920687742651137,
"eval_runtime": 44.734,
"eval_samples_per_second": 9.59,
"eval_steps_per_second": 1.61,
"step": 190
},
{
"epoch": 0.67,
"eval_accuracy": 0.9795839855668462,
"eval_f1": 0.7072773084333779,
"eval_loss": 0.07666940242052078,
"eval_precision": 0.7596306908627826,
"eval_recall": 0.6616749861342207,
"eval_runtime": 44.7886,
"eval_samples_per_second": 9.578,
"eval_steps_per_second": 1.608,
"step": 200
},
{
"epoch": 0.7,
"eval_accuracy": 0.9832586028494866,
"eval_f1": 0.7367480643240022,
"eval_loss": 0.06706634908914566,
"eval_precision": 0.7954983922829582,
"eval_recall": 0.6860787576261785,
"eval_runtime": 44.9641,
"eval_samples_per_second": 9.541,
"eval_steps_per_second": 1.601,
"step": 210
},
{
"epoch": 0.74,
"eval_accuracy": 0.9847576344485421,
"eval_f1": 0.7383826191913097,
"eval_loss": 0.06665363162755966,
"eval_precision": 0.8097286565188617,
"eval_recall": 0.6785912368275097,
"eval_runtime": 44.8134,
"eval_samples_per_second": 9.573,
"eval_steps_per_second": 1.607,
"step": 220
},
{
"epoch": 0.77,
"eval_accuracy": 0.9845321164203656,
"eval_f1": 0.752096513167574,
"eval_loss": 0.06071800738573074,
"eval_precision": 0.8010028204324663,
"eval_recall": 0.7088186356073212,
"eval_runtime": 44.7268,
"eval_samples_per_second": 9.592,
"eval_steps_per_second": 1.61,
"step": 230
},
{
"epoch": 0.8,
"eval_accuracy": 0.986482184075774,
"eval_f1": 0.7756542193472508,
"eval_loss": 0.057662855833768845,
"eval_precision": 0.8254067584480601,
"eval_recall": 0.7315585135884637,
"eval_runtime": 44.6791,
"eval_samples_per_second": 9.602,
"eval_steps_per_second": 1.611,
"step": 240
},
{
"epoch": 0.84,
"eval_accuracy": 0.9871454723939402,
"eval_f1": 0.7851227662356531,
"eval_loss": 0.054133981466293335,
"eval_precision": 0.8245346353371986,
"eval_recall": 0.7493067110371603,
"eval_runtime": 44.7641,
"eval_samples_per_second": 9.584,
"eval_steps_per_second": 1.608,
"step": 250
},
{
"epoch": 0.87,
"eval_accuracy": 0.9884985805629991,
"eval_f1": 0.8150755242704208,
"eval_loss": 0.05026474595069885,
"eval_precision": 0.8649237472766884,
"eval_recall": 0.7706600110926234,
"eval_runtime": 44.9736,
"eval_samples_per_second": 9.539,
"eval_steps_per_second": 1.601,
"step": 260
},
{
"epoch": 0.9,
"eval_accuracy": 0.9881934679366426,
"eval_f1": 0.801503541997976,
"eval_loss": 0.04910367354750633,
"eval_precision": 0.8372093023255814,
"eval_recall": 0.7687188019966722,
"eval_runtime": 44.8146,
"eval_samples_per_second": 9.573,
"eval_steps_per_second": 1.607,
"step": 270
},
{
"epoch": 0.94,
"eval_accuracy": 0.987875089543923,
"eval_f1": 0.8106457242582897,
"eval_loss": 0.04733191058039665,
"eval_precision": 0.8522935779816514,
"eval_recall": 0.7728785357737105,
"eval_runtime": 44.8863,
"eval_samples_per_second": 9.557,
"eval_steps_per_second": 1.604,
"step": 280
},
{
"epoch": 0.97,
"eval_accuracy": 0.9887904274229923,
"eval_f1": 0.8112208387004436,
"eval_loss": 0.046026937663555145,
"eval_precision": 0.8382135462880804,
"eval_recall": 0.785912368275097,
"eval_runtime": 44.8674,
"eval_samples_per_second": 9.562,
"eval_steps_per_second": 1.605,
"step": 290
},
{
"epoch": 1.0,
"eval_accuracy": 0.9894404499747951,
"eval_f1": 0.8500071766901106,
"eval_loss": 0.0429680198431015,
"eval_precision": 0.880987801249628,
"eval_recall": 0.8211314475873545,
"eval_runtime": 45.1867,
"eval_samples_per_second": 9.494,
"eval_steps_per_second": 1.593,
"step": 300
},
{
"epoch": 1.04,
"eval_accuracy": 0.9901170040593245,
"eval_f1": 0.8402282453637661,
"eval_loss": 0.04167770594358444,
"eval_precision": 0.8651586368977673,
"eval_recall": 0.8166943982251803,
"eval_runtime": 44.8739,
"eval_samples_per_second": 9.56,
"eval_steps_per_second": 1.604,
"step": 310
},
{
"epoch": 1.07,
"eval_accuracy": 0.9908333554429439,
"eval_f1": 0.8512689635616051,
"eval_loss": 0.039857033640146255,
"eval_precision": 0.8709022338265158,
"eval_recall": 0.8325013865779257,
"eval_runtime": 44.8161,
"eval_samples_per_second": 9.572,
"eval_steps_per_second": 1.607,
"step": 320
},
{
"epoch": 1.1,
"eval_accuracy": 0.9919211482847364,
"eval_f1": 0.8664764621968616,
"eval_loss": 0.03763346001505852,
"eval_precision": 0.8921856639247944,
"eval_recall": 0.8422074320576817,
"eval_runtime": 45.0124,
"eval_samples_per_second": 9.531,
"eval_steps_per_second": 1.6,
"step": 330
},
{
"epoch": 1.14,
"eval_accuracy": 0.992106869013823,
"eval_f1": 0.8503758332151468,
"eval_loss": 0.035481277853250504,
"eval_precision": 0.8702467343976777,
"eval_recall": 0.8313921242373822,
"eval_runtime": 44.8357,
"eval_samples_per_second": 9.568,
"eval_steps_per_second": 1.606,
"step": 340
},
{
"epoch": 1.17,
"eval_accuracy": 0.9925048420047227,
"eval_f1": 0.8676303854875284,
"eval_loss": 0.03401191905140877,
"eval_precision": 0.8872463768115942,
"eval_recall": 0.8488630061009429,
"eval_runtime": 44.9137,
"eval_samples_per_second": 9.552,
"eval_steps_per_second": 1.603,
"step": 350
},
{
"epoch": 1.2,
"eval_accuracy": 0.9926905627338092,
"eval_f1": 0.8718825708992448,
"eval_loss": 0.032262638211250305,
"eval_precision": 0.8968044561712107,
"eval_recall": 0.8483083749306711,
"eval_runtime": 44.876,
"eval_samples_per_second": 9.56,
"eval_steps_per_second": 1.604,
"step": 360
},
{
"epoch": 1.24,
"eval_accuracy": 0.9930487384256188,
"eval_f1": 0.8813077469793889,
"eval_loss": 0.03254028782248497,
"eval_precision": 0.9040536599591718,
"eval_recall": 0.8596783139212424,
"eval_runtime": 44.7683,
"eval_samples_per_second": 9.583,
"eval_steps_per_second": 1.608,
"step": 370
},
{
"epoch": 1.27,
"eval_accuracy": 0.9927038285001725,
"eval_f1": 0.8627060830017056,
"eval_loss": 0.030650299042463303,
"eval_precision": 0.8848396501457726,
"eval_recall": 0.8416528008874099,
"eval_runtime": 44.7059,
"eval_samples_per_second": 9.596,
"eval_steps_per_second": 1.611,
"step": 380
},
{
"epoch": 1.3,
"eval_accuracy": 0.9934467114165185,
"eval_f1": 0.8900583131844688,
"eval_loss": 0.029178058728575706,
"eval_precision": 0.9135766423357664,
"eval_recall": 0.867720465890183,
"eval_runtime": 44.67,
"eval_samples_per_second": 9.604,
"eval_steps_per_second": 1.612,
"step": 390
},
{
"epoch": 1.34,
"eval_accuracy": 0.993300787986522,
"eval_f1": 0.8887311950042579,
"eval_loss": 0.02753848023712635,
"eval_precision": 0.9101744186046512,
"eval_recall": 0.8682750970604548,
"eval_runtime": 44.9312,
"eval_samples_per_second": 9.548,
"eval_steps_per_second": 1.602,
"step": 400
},
{
"epoch": 1.37,
"eval_accuracy": 0.9936456979119683,
"eval_f1": 0.894469525959368,
"eval_loss": 0.027282511815428734,
"eval_precision": 0.9103963239517519,
"eval_recall": 0.8790904048807543,
"eval_runtime": 44.6914,
"eval_samples_per_second": 9.599,
"eval_steps_per_second": 1.611,
"step": 410
},
{
"epoch": 1.4,
"eval_accuracy": 0.9922925897429095,
"eval_f1": 0.8725379853685987,
"eval_loss": 0.02893451787531376,
"eval_precision": 0.8854940034266133,
"eval_recall": 0.8599556295063783,
"eval_runtime": 44.7493,
"eval_samples_per_second": 9.587,
"eval_steps_per_second": 1.609,
"step": 420
},
{
"epoch": 1.44,
"eval_accuracy": 0.9938712159401448,
"eval_f1": 0.8959954719117023,
"eval_loss": 0.024990031495690346,
"eval_precision": 0.9147645189251662,
"eval_recall": 0.8779811425402108,
"eval_runtime": 44.6669,
"eval_samples_per_second": 9.604,
"eval_steps_per_second": 1.612,
"step": 430
},
{
"epoch": 1.47,
"eval_accuracy": 0.9938181528746916,
"eval_f1": 0.8929327126534067,
"eval_loss": 0.026491543278098106,
"eval_precision": 0.9086993970714901,
"eval_recall": 0.8777038269550749,
"eval_runtime": 44.7596,
"eval_samples_per_second": 9.585,
"eval_steps_per_second": 1.609,
"step": 440
},
{
"epoch": 1.51,
"eval_accuracy": 0.9945610357910376,
"eval_f1": 0.9141895681435781,
"eval_loss": 0.0247773639857769,
"eval_precision": 0.9245604083947816,
"eval_recall": 0.9040488075429839,
"eval_runtime": 44.7459,
"eval_samples_per_second": 9.587,
"eval_steps_per_second": 1.609,
"step": 450
},
{
"epoch": 1.54,
"eval_accuracy": 0.9943753150619511,
"eval_f1": 0.9076814658210007,
"eval_loss": 0.0243705864995718,
"eval_precision": 0.9229005445686443,
"eval_recall": 0.8929561841375485,
"eval_runtime": 44.7374,
"eval_samples_per_second": 9.589,
"eval_steps_per_second": 1.609,
"step": 460
},
{
"epoch": 1.57,
"eval_accuracy": 0.994534504258311,
"eval_f1": 0.9149444678757205,
"eval_loss": 0.023830989375710487,
"eval_precision": 0.9278585685771314,
"eval_recall": 0.9023849140321686,
"eval_runtime": 44.7741,
"eval_samples_per_second": 9.581,
"eval_steps_per_second": 1.608,
"step": 470
},
{
"epoch": 1.61,
"eval_accuracy": 0.9947069592210342,
"eval_f1": 0.9177099451399635,
"eval_loss": 0.022406980395317078,
"eval_precision": 0.931201827005424,
"eval_recall": 0.9046034387132557,
"eval_runtime": 44.7025,
"eval_samples_per_second": 9.597,
"eval_steps_per_second": 1.611,
"step": 480
},
{
"epoch": 1.64,
"eval_accuracy": 0.9947069592210342,
"eval_f1": 0.9264129826524903,
"eval_loss": 0.023025579750537872,
"eval_precision": 0.9347826086956522,
"eval_recall": 0.918191902384914,
"eval_runtime": 45.0649,
"eval_samples_per_second": 9.52,
"eval_steps_per_second": 1.598,
"step": 490
},
{
"epoch": 1.67,
"learning_rate": 9.5e-06,
"loss": 0.1784,
"step": 500
},
{
"epoch": 1.67,
"eval_accuracy": 0.9953702475392003,
"eval_f1": 0.9400780379041248,
"eval_loss": 0.022061465308070183,
"eval_precision": 0.9448179271708683,
"eval_recall": 0.9353854686633388,
"eval_runtime": 44.7675,
"eval_samples_per_second": 9.583,
"eval_steps_per_second": 1.608,
"step": 500
},
{
"epoch": 1.71,
"eval_accuracy": 0.9954100448382903,
"eval_f1": 0.9358616843279419,
"eval_loss": 0.02172040194272995,
"eval_precision": 0.9411104879416713,
"eval_recall": 0.9306711037160288,
"eval_runtime": 44.9669,
"eval_samples_per_second": 9.54,
"eval_steps_per_second": 1.601,
"step": 510
},
{
"epoch": 1.74,
"eval_accuracy": 0.9952243241092038,
"eval_f1": 0.9297780259667735,
"eval_loss": 0.021418150514364243,
"eval_precision": 0.9361821759910036,
"eval_recall": 0.9234608985024958,
"eval_runtime": 44.7829,
"eval_samples_per_second": 9.58,
"eval_steps_per_second": 1.608,
"step": 520
},
{
"epoch": 1.77,
"eval_accuracy": 0.9950651349128439,
"eval_f1": 0.9294002516426674,
"eval_loss": 0.02137417532503605,
"eval_precision": 0.937129968987877,
"eval_recall": 0.9217970049916805,
"eval_runtime": 44.837,
"eval_samples_per_second": 9.568,
"eval_steps_per_second": 1.606,
"step": 530
},
{
"epoch": 1.81,
"eval_accuracy": 0.9954100448382903,
"eval_f1": 0.9379098646574578,
"eval_loss": 0.02044159732758999,
"eval_precision": 0.94383600112328,
"eval_recall": 0.9320576816417082,
"eval_runtime": 44.8548,
"eval_samples_per_second": 9.564,
"eval_steps_per_second": 1.605,
"step": 540
},
{
"epoch": 1.84,
"eval_accuracy": 0.9959274097264599,
"eval_f1": 0.9561111111111111,
"eval_loss": 0.020166810601949692,
"eval_precision": 0.9577072899276572,
"eval_recall": 0.954520244037715,
"eval_runtime": 44.8166,
"eval_samples_per_second": 9.572,
"eval_steps_per_second": 1.607,
"step": 550
},
{
"epoch": 1.87,
"eval_accuracy": 0.9952375898755671,
"eval_f1": 0.9289403881055422,
"eval_loss": 0.020729683339595795,
"eval_precision": 0.935338768625246,
"eval_recall": 0.9226289517470881,
"eval_runtime": 44.8369,
"eval_samples_per_second": 9.568,
"eval_steps_per_second": 1.606,
"step": 560
},
{
"epoch": 1.91,
"eval_accuracy": 0.9960600673900931,
"eval_f1": 0.9606211869107044,
"eval_loss": 0.019887683913111687,
"eval_precision": 0.9606211869107044,
"eval_recall": 0.9606211869107044,
"eval_runtime": 44.8366,
"eval_samples_per_second": 9.568,
"eval_steps_per_second": 1.606,
"step": 570
},
{
"epoch": 1.94,
"eval_accuracy": 0.9956753601655568,
"eval_f1": 0.9422407794015311,
"eval_loss": 0.021609965711832047,
"eval_precision": 0.945794914780665,
"eval_recall": 0.9387132556849695,
"eval_runtime": 44.9147,
"eval_samples_per_second": 9.551,
"eval_steps_per_second": 1.603,
"step": 580
},
{
"epoch": 1.97,
"eval_accuracy": 0.9960468016237298,
"eval_f1": 0.9564975677553856,
"eval_loss": 0.019716205075383186,
"eval_precision": 0.9587628865979382,
"eval_recall": 0.9542429284525791,
"eval_runtime": 45.3593,
"eval_samples_per_second": 9.458,
"eval_steps_per_second": 1.587,
"step": 590
},
{
"epoch": 2.01,
"eval_accuracy": 0.9957549547637367,
"eval_f1": 0.9439577249339453,
"eval_loss": 0.020143885165452957,
"eval_precision": 0.9467224546722455,
"eval_recall": 0.9412090959511925,
"eval_runtime": 45.0377,
"eval_samples_per_second": 9.525,
"eval_steps_per_second": 1.599,
"step": 600
},
{
"epoch": 2.04,
"eval_accuracy": 0.9955029052028336,
"eval_f1": 0.9359207036158034,
"eval_loss": 0.019947798922657967,
"eval_precision": 0.9423671633398931,
"eval_recall": 0.9295618413754853,
"eval_runtime": 45.1113,
"eval_samples_per_second": 9.51,
"eval_steps_per_second": 1.596,
"step": 610
},
{
"epoch": 2.07,
"eval_accuracy": 0.9961131304555464,
"eval_f1": 0.9537564227190668,
"eval_loss": 0.01930239051580429,
"eval_precision": 0.9552155771905424,
"eval_recall": 0.9523017193566279,
"eval_runtime": 45.0399,
"eval_samples_per_second": 9.525,
"eval_steps_per_second": 1.599,
"step": 620
},
{
"epoch": 2.11,
"eval_accuracy": 0.9959141439600966,
"eval_f1": 0.9510664993726474,
"eval_loss": 0.020125582814216614,
"eval_precision": 0.9562657695542472,
"eval_recall": 0.9459234608985025,
"eval_runtime": 44.9443,
"eval_samples_per_second": 9.545,
"eval_steps_per_second": 1.602,
"step": 630
},
{
"epoch": 2.14,
"eval_accuracy": 0.9965376349791727,
"eval_f1": 0.9709141274238227,
"eval_loss": 0.01933199167251587,
"eval_precision": 0.9698395130049806,
"eval_recall": 0.9719911259012757,
"eval_runtime": 44.9595,
"eval_samples_per_second": 9.542,
"eval_steps_per_second": 1.601,
"step": 640
},
{
"epoch": 2.17,
"eval_accuracy": 0.9962988511846329,
"eval_f1": 0.9642262895174709,
"eval_loss": 0.0191953107714653,
"eval_precision": 0.9642262895174709,
"eval_recall": 0.9642262895174709,
"eval_runtime": 44.8109,
"eval_samples_per_second": 9.574,
"eval_steps_per_second": 1.607,
"step": 650
},
{
"epoch": 2.21,
"eval_accuracy": 0.9957814862964633,
"eval_f1": 0.947662247034194,
"eval_loss": 0.019274834543466568,
"eval_precision": 0.9539196403484125,
"eval_recall": 0.9414864115363284,
"eval_runtime": 45.2879,
"eval_samples_per_second": 9.473,
"eval_steps_per_second": 1.59,
"step": 660
},
{
"epoch": 2.24,
"eval_accuracy": 0.9965906980446261,
"eval_f1": 0.9721568084222192,
"eval_loss": 0.018348801881074905,
"eval_precision": 0.9712150567395517,
"eval_recall": 0.9731003882418192,
"eval_runtime": 44.979,
"eval_samples_per_second": 9.538,
"eval_steps_per_second": 1.601,
"step": 670
},
{
"epoch": 2.27,
"eval_accuracy": 0.9968029503064392,
"eval_f1": 0.975387168141593,
"eval_loss": 0.018433524295687675,
"eval_precision": 0.9726971869829013,
"eval_recall": 0.9780920687742651,
"eval_runtime": 44.9845,
"eval_samples_per_second": 9.537,
"eval_steps_per_second": 1.601,
"step": 680
},
{
"epoch": 2.31,
"eval_accuracy": 0.9967631530073492,
"eval_f1": 0.9695880564003317,
"eval_loss": 0.018039193004369736,
"eval_precision": 0.9666482910694597,
"eval_recall": 0.9725457570715474,
"eval_runtime": 44.9711,
"eval_samples_per_second": 9.539,
"eval_steps_per_second": 1.601,
"step": 690
},
{
"epoch": 2.34,
"eval_accuracy": 0.9968029503064392,
"eval_f1": 0.9738625363020329,
"eval_loss": 0.01683180034160614,
"eval_precision": 0.9713103448275862,
"eval_recall": 0.9764281752634498,
"eval_runtime": 44.9102,
"eval_samples_per_second": 9.552,
"eval_steps_per_second": 1.603,
"step": 700
},
{
"epoch": 2.37,
"eval_accuracy": 0.9969223422037091,
"eval_f1": 0.9755152856550007,
"eval_loss": 0.01656004600226879,
"eval_precision": 0.9732266077836047,
"eval_recall": 0.9778147531891292,
"eval_runtime": 44.9636,
"eval_samples_per_second": 9.541,
"eval_steps_per_second": 1.601,
"step": 710
},
{
"epoch": 2.41,
"eval_accuracy": 0.9967498872409859,
"eval_f1": 0.973655019412091,
"eval_loss": 0.016868896782398224,
"eval_precision": 0.973655019412091,
"eval_recall": 0.973655019412091,
"eval_runtime": 44.8793,
"eval_samples_per_second": 9.559,
"eval_steps_per_second": 1.604,
"step": 720
},
{
"epoch": 2.44,
"eval_accuracy": 0.9968427476055292,
"eval_f1": 0.975765129483451,
"eval_loss": 0.01695641689002514,
"eval_precision": 0.9745504840940525,
"eval_recall": 0.9769828064337216,
"eval_runtime": 44.9769,
"eval_samples_per_second": 9.538,
"eval_steps_per_second": 1.601,
"step": 730
},
{
"epoch": 2.47,
"eval_accuracy": 0.9966968241755326,
"eval_f1": 0.9696128763701957,
"eval_loss": 0.017096424475312233,
"eval_precision": 0.9702860316578729,
"eval_recall": 0.968940654464781,
"eval_runtime": 45.2584,
"eval_samples_per_second": 9.479,
"eval_steps_per_second": 1.591,
"step": 740
},
{
"epoch": 2.51,
"eval_accuracy": 0.9968294818391659,
"eval_f1": 0.9747992245915259,
"eval_loss": 0.016900014132261276,
"eval_precision": 0.9734513274336283,
"eval_recall": 0.9761508596783139,
"eval_runtime": 44.9939,
"eval_samples_per_second": 9.535,
"eval_steps_per_second": 1.6,
"step": 750
},
{
"epoch": 2.54,
"eval_accuracy": 0.9969090764373458,
"eval_f1": 0.9747992245915259,
"eval_loss": 0.01711142621934414,
"eval_precision": 0.9734513274336283,
"eval_recall": 0.9761508596783139,
"eval_runtime": 44.9916,
"eval_samples_per_second": 9.535,
"eval_steps_per_second": 1.6,
"step": 760
},
{
"epoch": 2.58,
"eval_accuracy": 0.9968029503064392,
"eval_f1": 0.9726957726957727,
"eval_loss": 0.017322950065135956,
"eval_precision": 0.972291493488501,
"eval_recall": 0.9731003882418192,
"eval_runtime": 44.9667,
"eval_samples_per_second": 9.54,
"eval_steps_per_second": 1.601,
"step": 770
},
{
"epoch": 2.61,
"eval_accuracy": 0.9970019368018891,
"eval_f1": 0.9776853776853778,
"eval_loss": 0.015976430848240852,
"eval_precision": 0.9772790246605708,
"eval_recall": 0.9780920687742651,
"eval_runtime": 44.9823,
"eval_samples_per_second": 9.537,
"eval_steps_per_second": 1.601,
"step": 780
},
{
"epoch": 2.64,
"eval_accuracy": 0.9968427476055292,
"eval_f1": 0.9725685785536159,
"eval_loss": 0.016221042722463608,
"eval_precision": 0.9717607973421927,
"eval_recall": 0.9733777038269551,
"eval_runtime": 45.0356,
"eval_samples_per_second": 9.526,
"eval_steps_per_second": 1.599,
"step": 790
},
{
"epoch": 2.68,
"eval_accuracy": 0.9967764187737126,
"eval_f1": 0.9714760454167821,
"eval_loss": 0.016350209712982178,
"eval_precision": 0.9701327433628318,
"eval_recall": 0.9728230726566833,
"eval_runtime": 44.9594,
"eval_samples_per_second": 9.542,
"eval_steps_per_second": 1.601,
"step": 800
},
{
"epoch": 2.71,
"eval_accuracy": 0.9969223422037091,
"eval_f1": 0.9753325942350333,
"eval_loss": 0.0164735559374094,
"eval_precision": 0.974792243767313,
"eval_recall": 0.9758735440931781,
"eval_runtime": 44.8809,
"eval_samples_per_second": 9.559,
"eval_steps_per_second": 1.604,
"step": 810
},
{
"epoch": 2.74,
"eval_accuracy": 0.9968692791382558,
"eval_f1": 0.9754541672444876,
"eval_loss": 0.01638418808579445,
"eval_precision": 0.9755894590846047,
"eval_recall": 0.9753189129229063,
"eval_runtime": 45.2809,
"eval_samples_per_second": 9.474,
"eval_steps_per_second": 1.59,
"step": 820
},
{
"epoch": 2.78,
"eval_accuracy": 0.9951712610437505,
"eval_f1": 0.9239864864864865,
"eval_loss": 0.0193793848156929,
"eval_precision": 0.9382504288164666,
"eval_recall": 0.9101497504159733,
"eval_runtime": 44.9984,
"eval_samples_per_second": 9.534,
"eval_steps_per_second": 1.6,
"step": 830
},
{
"epoch": 2.81,
"eval_accuracy": 0.9971213286991589,
"eval_f1": 0.979071379071379,
"eval_loss": 0.015317755751311779,
"eval_precision": 0.9786644499861458,
"eval_recall": 0.9794786466999446,
"eval_runtime": 44.8121,
"eval_samples_per_second": 9.573,
"eval_steps_per_second": 1.607,
"step": 840
},
{
"epoch": 2.84,
"eval_accuracy": 0.9968825449046191,
"eval_f1": 0.9747712780704185,
"eval_loss": 0.016130488365888596,
"eval_precision": 0.9745011086474501,
"eval_recall": 0.9750415973377704,
"eval_runtime": 44.9246,
"eval_samples_per_second": 9.549,
"eval_steps_per_second": 1.603,
"step": 850
},
{
"epoch": 2.88,
"eval_accuracy": 0.9965111034464461,
"eval_f1": 0.9585304759254106,
"eval_loss": 0.017094574868679047,
"eval_precision": 0.9620111731843576,
"eval_recall": 0.9550748752079867,
"eval_runtime": 44.9689,
"eval_samples_per_second": 9.54,
"eval_steps_per_second": 1.601,
"step": 860
},
{
"epoch": 2.91,
"eval_accuracy": 0.997041734100979,
"eval_f1": 0.9767634854771784,
"eval_loss": 0.016324549913406372,
"eval_precision": 0.9743377483443708,
"eval_recall": 0.9792013311148087,
"eval_runtime": 44.9212,
"eval_samples_per_second": 9.55,
"eval_steps_per_second": 1.603,
"step": 870
},
{
"epoch": 2.94,
"eval_accuracy": 0.9970284683346157,
"eval_f1": 0.9753394292047659,
"eval_loss": 0.016577888280153275,
"eval_precision": 0.9745293466223699,
"eval_recall": 0.9761508596783139,
"eval_runtime": 45.0626,
"eval_samples_per_second": 9.52,
"eval_steps_per_second": 1.598,
"step": 880
},
{
"epoch": 2.98,
"eval_accuracy": 0.9968560133718924,
"eval_f1": 0.9743589743589743,
"eval_loss": 0.01666262373328209,
"eval_precision": 0.973954003879191,
"eval_recall": 0.9747642817526345,
"eval_runtime": 44.929,
"eval_samples_per_second": 9.548,
"eval_steps_per_second": 1.603,
"step": 890
},
{
"epoch": 3.01,
"eval_accuracy": 0.9966570268764426,
"eval_f1": 0.9715396362626684,
"eval_loss": 0.01778605580329895,
"eval_precision": 0.9727550736725049,
"eval_recall": 0.9703272323904604,
"eval_runtime": 44.9166,
"eval_samples_per_second": 9.551,
"eval_steps_per_second": 1.603,
"step": 900
},
{
"epoch": 3.04,
"eval_accuracy": 0.9970815314000689,
"eval_f1": 0.9786407766990292,
"eval_loss": 0.016635755077004433,
"eval_precision": 0.978912319644839,
"eval_recall": 0.978369384359401,
"eval_runtime": 45.1716,
"eval_samples_per_second": 9.497,
"eval_steps_per_second": 1.594,
"step": 910
},
{
"epoch": 3.08,
"eval_accuracy": 0.9971478602318856,
"eval_f1": 0.9811529933481152,
"eval_loss": 0.01662967912852764,
"eval_precision": 0.9806094182825484,
"eval_recall": 0.9816971713810316,
"eval_runtime": 44.9112,
"eval_samples_per_second": 9.552,
"eval_steps_per_second": 1.603,
"step": 920
},
{
"epoch": 3.11,
"eval_accuracy": 0.9969488737364357,
"eval_f1": 0.9753052164261932,
"eval_loss": 0.016620052978396416,
"eval_precision": 0.975846751804553,
"eval_recall": 0.9747642817526345,
"eval_runtime": 44.9363,
"eval_samples_per_second": 9.547,
"eval_steps_per_second": 1.602,
"step": 930
},
{
"epoch": 3.14,
"eval_accuracy": 0.9972407205964289,
"eval_f1": 0.9815508392287419,
"eval_loss": 0.015619627200067043,
"eval_precision": 0.9819594782126007,
"eval_recall": 0.9811425402107599,
"eval_runtime": 44.9174,
"eval_samples_per_second": 9.551,
"eval_steps_per_second": 1.603,
"step": 940
},
{
"epoch": 3.18,
"eval_accuracy": 0.9970947971664323,
"eval_f1": 0.9779442363712026,
"eval_loss": 0.015341303311288357,
"eval_precision": 0.9783513738551207,
"eval_recall": 0.9775374376039934,
"eval_runtime": 45.0123,
"eval_samples_per_second": 9.531,
"eval_steps_per_second": 1.6,
"step": 950
},
{
"epoch": 3.21,
"eval_accuracy": 0.9968692791382558,
"eval_f1": 0.9764281752634498,
"eval_loss": 0.01650950312614441,
"eval_precision": 0.9764281752634498,
"eval_recall": 0.9764281752634498,
"eval_runtime": 44.93,
"eval_samples_per_second": 9.548,
"eval_steps_per_second": 1.602,
"step": 960
},
{
"epoch": 3.24,
"eval_accuracy": 0.9968692791382558,
"eval_f1": 0.9774144381321879,
"eval_loss": 0.01659621112048626,
"eval_precision": 0.9767377457767932,
"eval_recall": 0.9780920687742651,
"eval_runtime": 44.9897,
"eval_samples_per_second": 9.536,
"eval_steps_per_second": 1.6,
"step": 970
},
{
"epoch": 3.28,
"eval_accuracy": 0.9967498872409859,
"eval_f1": 0.9746572496884087,
"eval_loss": 0.016826625913381577,
"eval_precision": 0.9734439834024896,
"eval_recall": 0.9758735440931781,
"eval_runtime": 45.2137,
"eval_samples_per_second": 9.488,
"eval_steps_per_second": 1.592,
"step": 980
},
{
"epoch": 3.31,
"eval_accuracy": 0.9968958106709824,
"eval_f1": 0.978146611341632,
"eval_loss": 0.016263196244835854,
"eval_precision": 0.9757174392935982,
"eval_recall": 0.9805879090404881,
"eval_runtime": 44.9271,
"eval_samples_per_second": 9.549,
"eval_steps_per_second": 1.603,
"step": 990
},
{
"epoch": 3.34,
"learning_rate": 9e-06,
"loss": 0.0154,
"step": 1000
},
{
"epoch": 3.34,
"eval_accuracy": 0.9968294818391659,
"eval_f1": 0.9775809576529201,
"eval_loss": 0.016901057213544846,
"eval_precision": 0.9756906077348066,
"eval_recall": 0.9794786466999446,
"eval_runtime": 44.996,
"eval_samples_per_second": 9.534,
"eval_steps_per_second": 1.6,
"step": 1000
},
{
"epoch": 3.38,
"eval_accuracy": 0.997041734100979,
"eval_f1": 0.9803269603768356,
"eval_loss": 0.01609906367957592,
"eval_precision": 0.9795127353266888,
"eval_recall": 0.9811425402107599,
"eval_runtime": 45.3202,
"eval_samples_per_second": 9.466,
"eval_steps_per_second": 1.589,
"step": 1010
},
{
"epoch": 3.41,
"eval_accuracy": 0.9968692791382558,
"eval_f1": 0.977993079584775,
"eval_loss": 0.016519052907824516,
"eval_precision": 0.9762365294280188,
"eval_recall": 0.9797559622850804,
"eval_runtime": 45.0574,
"eval_samples_per_second": 9.521,
"eval_steps_per_second": 1.598,
"step": 1020
},
{
"epoch": 3.44,
"eval_accuracy": 0.9967233557082593,
"eval_f1": 0.9722530521642619,
"eval_loss": 0.01666153408586979,
"eval_precision": 0.9727928928373126,
"eval_recall": 0.9717138103161398,
"eval_runtime": 45.0201,
"eval_samples_per_second": 9.529,
"eval_steps_per_second": 1.599,
"step": 1030
},
{
"epoch": 3.48,
"eval_accuracy": 0.9969090764373458,
"eval_f1": 0.9761640798226164,
"eval_loss": 0.015780288726091385,
"eval_precision": 0.9756232686980609,
"eval_recall": 0.9767054908485857,
"eval_runtime": 45.2347,
"eval_samples_per_second": 9.484,
"eval_steps_per_second": 1.592,
"step": 1040
},
{
"epoch": 3.51,
"eval_accuracy": 0.9968958106709824,
"eval_f1": 0.9766284054764209,
"eval_loss": 0.015381171368062496,
"eval_precision": 0.9740689655172414,
"eval_recall": 0.9792013311148087,
"eval_runtime": 45.2769,
"eval_samples_per_second": 9.475,
"eval_steps_per_second": 1.59,
"step": 1050
},
{
"epoch": 3.55,
"eval_accuracy": 0.9959804727919132,
"eval_f1": 0.9448555074689375,
"eval_loss": 0.01652899943292141,
"eval_precision": 0.9513635085746416,
"eval_recall": 0.9384359400998337,
"eval_runtime": 45.1375,
"eval_samples_per_second": 9.504,
"eval_steps_per_second": 1.595,
"step": 1060
},
{
"epoch": 3.58,
"eval_accuracy": 0.9968825449046191,
"eval_f1": 0.9749619587771476,
"eval_loss": 0.015719007700681686,
"eval_precision": 0.9726745790781121,
"eval_recall": 0.9772601220188575,
"eval_runtime": 45.0215,
"eval_samples_per_second": 9.529,
"eval_steps_per_second": 1.599,
"step": 1070
},
{
"epoch": 3.61,
"eval_accuracy": 0.9968692791382558,
"eval_f1": 0.9782458085076902,
"eval_loss": 0.01600920408964157,
"eval_precision": 0.977568540570479,
"eval_recall": 0.9789240155296728,
"eval_runtime": 45.1658,
"eval_samples_per_second": 9.498,
"eval_steps_per_second": 1.594,
"step": 1080
},
{
"epoch": 3.65,
"eval_accuracy": 0.99580801782919,
"eval_f1": 0.9429732380552053,
"eval_loss": 0.01786983013153076,
"eval_precision": 0.9529878221467006,
"eval_recall": 0.9331669439822518,
"eval_runtime": 45.14,
"eval_samples_per_second": 9.504,
"eval_steps_per_second": 1.595,
"step": 1090
},
{
"epoch": 3.68,
"eval_accuracy": 0.9968692791382558,
"eval_f1": 0.977439446366782,
"eval_loss": 0.015765171498060226,
"eval_precision": 0.9756838905775076,
"eval_recall": 0.9792013311148087,
"eval_runtime": 45.1016,
"eval_samples_per_second": 9.512,
"eval_steps_per_second": 1.596,
"step": 1100
},
{
"epoch": 3.71,
"eval_accuracy": 0.9968958106709824,
"eval_f1": 0.977703919124775,
"eval_loss": 0.015863990411162376,
"eval_precision": 0.9764868603042877,
"eval_recall": 0.9789240155296728,
"eval_runtime": 45.1212,
"eval_samples_per_second": 9.508,
"eval_steps_per_second": 1.596,
"step": 1110
},
{
"epoch": 3.75,
"eval_accuracy": 0.9969621395027991,
"eval_f1": 0.975609756097561,
"eval_loss": 0.01584913209080696,
"eval_precision": 0.9750692520775623,
"eval_recall": 0.9761508596783139,
"eval_runtime": 45.0612,
"eval_samples_per_second": 9.52,
"eval_steps_per_second": 1.598,
"step": 1120
},
{
"epoch": 3.78,
"eval_accuracy": 0.9969488737364357,
"eval_f1": 0.9744869661674986,
"eval_loss": 0.01588474027812481,
"eval_precision": 0.9744869661674986,
"eval_recall": 0.9744869661674986,
"eval_runtime": 45.3578,
"eval_samples_per_second": 9.458,
"eval_steps_per_second": 1.587,
"step": 1130
},
{
"epoch": 3.81,
"eval_accuracy": 0.9968958106709824,
"eval_f1": 0.9752846431546792,
"eval_loss": 0.016261184588074684,
"eval_precision": 0.9766407119021134,
"eval_recall": 0.9739323349972269,
"eval_runtime": 45.1022,
"eval_samples_per_second": 9.512,
"eval_steps_per_second": 1.596,
"step": 1140
},
{
"epoch": 3.85,
"eval_accuracy": 0.9967100899418959,
"eval_f1": 0.9723145071982281,
"eval_loss": 0.016805831342935562,
"eval_precision": 0.970702045328911,
"eval_recall": 0.9739323349972269,
"eval_runtime": 45.1109,
"eval_samples_per_second": 9.51,
"eval_steps_per_second": 1.596,
"step": 1150
},
{
"epoch": 3.88,
"eval_accuracy": 0.9970152025682524,
"eval_f1": 0.9805771365149833,
"eval_loss": 0.01488415990024805,
"eval_precision": 0.9811215991116047,
"eval_recall": 0.9800332778702163,
"eval_runtime": 45.1408,
"eval_samples_per_second": 9.504,
"eval_steps_per_second": 1.595,
"step": 1160
},
{
"epoch": 3.91,
"eval_accuracy": 0.9970152025682524,
"eval_f1": 0.9792531120331951,
"eval_loss": 0.014714999124407768,
"eval_precision": 0.9768211920529801,
"eval_recall": 0.9816971713810316,
"eval_runtime": 45.0991,
"eval_samples_per_second": 9.512,
"eval_steps_per_second": 1.596,
"step": 1170
},
{
"epoch": 3.95,
"eval_accuracy": 0.9969754052691624,
"eval_f1": 0.9757986447241046,
"eval_loss": 0.01566295139491558,
"eval_precision": 0.9732413793103448,
"eval_recall": 0.978369384359401,
"eval_runtime": 45.1028,
"eval_samples_per_second": 9.512,
"eval_steps_per_second": 1.596,
"step": 1180
},
{
"epoch": 3.98,
"eval_accuracy": 0.9969886710355257,
"eval_f1": 0.9786880708552449,
"eval_loss": 0.015323741361498833,
"eval_precision": 0.9767955801104973,
"eval_recall": 0.9805879090404881,
"eval_runtime": 45.1524,
"eval_samples_per_second": 9.501,
"eval_steps_per_second": 1.595,
"step": 1190
},
{
"epoch": 4.01,
"eval_accuracy": 0.9968692791382558,
"eval_f1": 0.9747642817526345,
"eval_loss": 0.015690365806221962,
"eval_precision": 0.9747642817526345,
"eval_recall": 0.9747642817526345,
"eval_runtime": 45.1208,
"eval_samples_per_second": 9.508,
"eval_steps_per_second": 1.596,
"step": 1200
},
{
"epoch": 4.05,
"eval_accuracy": 0.9970549998673424,
"eval_f1": 0.9797783933518006,
"eval_loss": 0.015430403873324394,
"eval_precision": 0.978693967902601,
"eval_recall": 0.980865224625624,
"eval_runtime": 45.032,
"eval_samples_per_second": 9.527,
"eval_steps_per_second": 1.599,
"step": 1210
},
{
"epoch": 4.08,
"eval_accuracy": 0.997041734100979,
"eval_f1": 0.9780052566053397,
"eval_loss": 0.0156533382833004,
"eval_precision": 0.9757107369583218,
"eval_recall": 0.9803105934553522,
"eval_runtime": 45.2988,
"eval_samples_per_second": 9.47,
"eval_steps_per_second": 1.589,
"step": 1220
},
{
"epoch": 4.11,
"eval_accuracy": 0.9968958106709824,
"eval_f1": 0.9735493698933665,
"eval_loss": 0.016326196491718292,
"eval_precision": 0.9723374827109267,
"eval_recall": 0.9747642817526345,
"eval_runtime": 45.0756,
"eval_samples_per_second": 9.517,
"eval_steps_per_second": 1.597,
"step": 1230
},
{
"epoch": 4.15,
"eval_accuracy": 0.997041734100979,
"eval_f1": 0.9778699861687413,
"eval_loss": 0.015600275248289108,
"eval_precision": 0.9754415011037527,
"eval_recall": 0.9803105934553522,
"eval_runtime": 44.9579,
"eval_samples_per_second": 9.542,
"eval_steps_per_second": 1.601,
"step": 1240
},
{
"epoch": 4.18,
"eval_accuracy": 0.9970152025682524,
"eval_f1": 0.9774331995015921,
"eval_loss": 0.015862880274653435,
"eval_precision": 0.9759469173348079,
"eval_recall": 0.9789240155296728,
"eval_runtime": 45.0784,
"eval_samples_per_second": 9.517,
"eval_steps_per_second": 1.597,
"step": 1250
},
{
"epoch": 4.21,
"eval_accuracy": 0.9970284683346157,
"eval_f1": 0.9802076124567475,
"eval_loss": 0.01617247611284256,
"eval_precision": 0.9784470848300636,
"eval_recall": 0.9819744869661675,
"eval_runtime": 45.0516,
"eval_samples_per_second": 9.522,
"eval_steps_per_second": 1.598,
"step": 1260
},
{
"epoch": 4.25,
"eval_accuracy": 0.9970815314000689,
"eval_f1": 0.978146611341632,
"eval_loss": 0.016013789921998978,
"eval_precision": 0.9757174392935982,
"eval_recall": 0.9805879090404881,
"eval_runtime": 45.1173,
"eval_samples_per_second": 9.509,
"eval_steps_per_second": 1.596,
"step": 1270
},
{
"epoch": 4.28,
"eval_accuracy": 0.9968560133718924,
"eval_f1": 0.9744157101369105,
"eval_loss": 0.01655399613082409,
"eval_precision": 0.9718620689655172,
"eval_recall": 0.9769828064337216,
"eval_runtime": 45.0171,
"eval_samples_per_second": 9.53,
"eval_steps_per_second": 1.599,
"step": 1280
},
{
"epoch": 4.31,
"eval_accuracy": 0.9971080629327956,
"eval_f1": 0.9793600221637346,
"eval_loss": 0.015200940892100334,
"eval_precision": 0.9784112925546637,
"eval_recall": 0.9803105934553522,
"eval_runtime": 45.0877,
"eval_samples_per_second": 9.515,
"eval_steps_per_second": 1.597,
"step": 1290
},
{
"epoch": 4.35,
"eval_accuracy": 0.9968294818391659,
"eval_f1": 0.9751175006911805,
"eval_loss": 0.016674669459462166,
"eval_precision": 0.9721609702315325,
"eval_recall": 0.9780920687742651,
"eval_runtime": 45.3184,
"eval_samples_per_second": 9.466,
"eval_steps_per_second": 1.589,
"step": 1300
},
{
"epoch": 4.38,
"eval_accuracy": 0.9968294818391659,
"eval_f1": 0.9766413268832067,
"eval_loss": 0.01657554879784584,
"eval_precision": 0.9735464315238358,
"eval_recall": 0.9797559622850804,
"eval_runtime": 45.1144,
"eval_samples_per_second": 9.509,
"eval_steps_per_second": 1.596,
"step": 1310
},
{
"epoch": 4.41,
"eval_accuracy": 0.9968958106709824,
"eval_f1": 0.9781586950511474,
"eval_loss": 0.016078708693385124,
"eval_precision": 0.9751929437706726,
"eval_recall": 0.9811425402107599,
"eval_runtime": 45.1076,
"eval_samples_per_second": 9.511,
"eval_steps_per_second": 1.596,
"step": 1320
},
{
"epoch": 4.45,
"eval_accuracy": 0.9967764187737126,
"eval_f1": 0.9739251040221916,
"eval_loss": 0.015717538073658943,
"eval_precision": 0.9741953385127636,
"eval_recall": 0.973655019412091,
"eval_runtime": 45.0205,
"eval_samples_per_second": 9.529,
"eval_steps_per_second": 1.599,
"step": 1330
},
{
"epoch": 4.48,
"eval_accuracy": 0.9968692791382558,
"eval_f1": 0.9795127353266887,
"eval_loss": 0.015196431428194046,
"eval_precision": 0.9778883360972913,
"eval_recall": 0.9811425402107599,
"eval_runtime": 45.4378,
"eval_samples_per_second": 9.441,
"eval_steps_per_second": 1.585,
"step": 1340
},
{
"epoch": 4.52,
"eval_accuracy": 0.9967233557082593,
"eval_f1": 0.971064654575661,
"eval_loss": 0.015703538432717323,
"eval_precision": 0.9695880564003317,
"eval_recall": 0.9725457570715474,
"eval_runtime": 45.4022,
"eval_samples_per_second": 9.449,
"eval_steps_per_second": 1.586,
"step": 1350
},
{
"epoch": 4.55,
"eval_accuracy": 0.9968162160728026,
"eval_f1": 0.9755828390122776,
"eval_loss": 0.015339327044785023,
"eval_precision": 0.9706286027998902,
"eval_recall": 0.9805879090404881,
"eval_runtime": 45.4342,
"eval_samples_per_second": 9.442,
"eval_steps_per_second": 1.585,
"step": 1360
},
{
"epoch": 4.58,
"eval_accuracy": 0.9968692791382558,
"eval_f1": 0.9758587391364325,
"eval_loss": 0.015390865504741669,
"eval_precision": 0.9709031018391435,
"eval_recall": 0.980865224625624,
"eval_runtime": 45.7337,
"eval_samples_per_second": 9.38,
"eval_steps_per_second": 1.574,
"step": 1370
},
{
"epoch": 4.62,
"eval_accuracy": 0.9969886710355257,
"eval_f1": 0.9785822854774078,
"eval_loss": 0.015035979449748993,
"eval_precision": 0.97521343982374,
"eval_recall": 0.9819744869661675,
"eval_runtime": 45.4663,
"eval_samples_per_second": 9.436,
"eval_steps_per_second": 1.584,
"step": 1380
},
{
"epoch": 4.65,
"eval_accuracy": 0.9970682656337057,
"eval_f1": 0.9809234171965718,
"eval_loss": 0.014896390959620476,
"eval_precision": 0.9779492833517089,
"eval_recall": 0.9839156960621187,
"eval_runtime": 45.0989,
"eval_samples_per_second": 9.512,
"eval_steps_per_second": 1.596,
"step": 1390
},
{
"epoch": 4.68,
"eval_accuracy": 0.9968560133718924,
"eval_f1": 0.9768339768339769,
"eval_loss": 0.015806537121534348,
"eval_precision": 0.9714755896873286,
"eval_recall": 0.9822518025513034,
"eval_runtime": 45.0416,
"eval_samples_per_second": 9.525,
"eval_steps_per_second": 1.599,
"step": 1400
},
{
"epoch": 4.72,
"eval_accuracy": 0.997041734100979,
"eval_f1": 0.9778761061946902,
"eval_loss": 0.015140415169298649,
"eval_precision": 0.9751792608935466,
"eval_recall": 0.9805879090404881,
"eval_runtime": 45.6611,
"eval_samples_per_second": 9.395,
"eval_steps_per_second": 1.577,
"step": 1410
},
{
"epoch": 4.75,
"eval_accuracy": 0.9970549998673424,
"eval_f1": 0.9795353982300885,
"eval_loss": 0.015615841373801231,
"eval_precision": 0.9768339768339769,
"eval_recall": 0.9822518025513034,
"eval_runtime": 45.3516,
"eval_samples_per_second": 9.459,
"eval_steps_per_second": 1.588,
"step": 1420
},
{
"epoch": 4.78,
"eval_accuracy": 0.9971876575309756,
"eval_f1": 0.9802240354031254,
"eval_loss": 0.015609286725521088,
"eval_precision": 0.9776551724137931,
"eval_recall": 0.9828064337215752,
"eval_runtime": 45.8817,
"eval_samples_per_second": 9.35,
"eval_steps_per_second": 1.569,
"step": 1430
},
{
"epoch": 4.82,
"eval_accuracy": 0.997041734100979,
"eval_f1": 0.980777209238003,
"eval_loss": 0.015975775197148323,
"eval_precision": 0.9782068965517241,
"eval_recall": 0.9833610648918469,
"eval_runtime": 45.1602,
"eval_samples_per_second": 9.5,
"eval_steps_per_second": 1.594,
"step": 1440
},
{
"epoch": 4.85,
"eval_accuracy": 0.9970682656337057,
"eval_f1": 0.9810642709053213,
"eval_loss": 0.015114562585949898,
"eval_precision": 0.9779553596031965,
"eval_recall": 0.9841930116472546,
"eval_runtime": 45.0898,
"eval_samples_per_second": 9.514,
"eval_steps_per_second": 1.597,
"step": 1450
},
{
"epoch": 4.88,
"eval_accuracy": 0.9970549998673424,
"eval_f1": 0.9806576402321082,
"eval_loss": 0.01497586164623499,
"eval_precision": 0.977147577092511,
"eval_recall": 0.9841930116472546,
"eval_runtime": 47.111,
"eval_samples_per_second": 9.106,
"eval_steps_per_second": 1.528,
"step": 1460
},
{
"epoch": 4.92,
"eval_accuracy": 0.9970284683346157,
"eval_f1": 0.9779005524861878,
"eval_loss": 0.014804758131504059,
"eval_precision": 0.9741331865712713,
"eval_recall": 0.9816971713810316,
"eval_runtime": 45.7757,
"eval_samples_per_second": 9.372,
"eval_steps_per_second": 1.573,
"step": 1470
},
{
"epoch": 4.95,
"eval_accuracy": 0.9969621395027991,
"eval_f1": 0.9767634854771784,
"eval_loss": 0.015325279906392097,
"eval_precision": 0.9743377483443708,
"eval_recall": 0.9792013311148087,
"eval_runtime": 45.788,
"eval_samples_per_second": 9.369,
"eval_steps_per_second": 1.572,
"step": 1480
},
{
"epoch": 4.98,
"eval_accuracy": 0.9970947971664323,
"eval_f1": 0.9820143884892086,
"eval_loss": 0.014990455470979214,
"eval_precision": 0.9798453892876864,
"eval_recall": 0.9841930116472546,
"eval_runtime": 45.1213,
"eval_samples_per_second": 9.508,
"eval_steps_per_second": 1.596,
"step": 1490
},
{
"epoch": 5.02,
"learning_rate": 8.5e-06,
"loss": 0.0081,
"step": 1500
},
{
"epoch": 5.02,
"eval_accuracy": 0.9970947971664323,
"eval_f1": 0.9796821008984106,
"eval_loss": 0.01517151016741991,
"eval_precision": 0.9765775695783963,
"eval_recall": 0.9828064337215752,
"eval_runtime": 45.193,
"eval_samples_per_second": 9.493,
"eval_steps_per_second": 1.593,
"step": 1500
},
{
"epoch": 5.05,
"eval_accuracy": 0.9967366214746226,
"eval_f1": 0.9682408174537421,
"eval_loss": 0.01580970361828804,
"eval_precision": 0.9642464246424642,
"eval_recall": 0.9722684414864116,
"eval_runtime": 45.4381,
"eval_samples_per_second": 9.441,
"eval_steps_per_second": 1.585,
"step": 1510
},
{
"epoch": 5.08,
"eval_accuracy": 0.9966702926428059,
"eval_f1": 0.9666759233546237,
"eval_loss": 0.01570785790681839,
"eval_precision": 0.9680200222469411,
"eval_recall": 0.9653355518580145,
"eval_runtime": 45.4491,
"eval_samples_per_second": 9.439,
"eval_steps_per_second": 1.584,
"step": 1520
},
{
"epoch": 5.12,
"eval_accuracy": 0.9969886710355257,
"eval_f1": 0.9800388134183532,
"eval_loss": 0.015114962123334408,
"eval_precision": 0.9797671840354767,
"eval_recall": 0.9803105934553522,
"eval_runtime": 45.1961,
"eval_samples_per_second": 9.492,
"eval_steps_per_second": 1.593,
"step": 1530
},
{
"epoch": 5.15,
"eval_accuracy": 0.9970815314000689,
"eval_f1": 0.9818835569077582,
"eval_loss": 0.01481586042791605,
"eval_precision": 0.9793103448275862,
"eval_recall": 0.9844703272323905,
"eval_runtime": 45.6531,
"eval_samples_per_second": 9.397,
"eval_steps_per_second": 1.577,
"step": 1540
},
{
"epoch": 5.18,
"eval_accuracy": 0.9971478602318856,
"eval_f1": 0.9807878369039392,
"eval_loss": 0.014275978319346905,
"eval_precision": 0.9776798015982364,
"eval_recall": 0.9839156960621187,
"eval_runtime": 45.7198,
"eval_samples_per_second": 9.383,
"eval_steps_per_second": 1.575,
"step": 1550
},
{
"epoch": 5.22,
"eval_accuracy": 0.9970682656337057,
"eval_f1": 0.9792703150912107,
"eval_loss": 0.01468308549374342,
"eval_precision": 0.9760330578512396,
"eval_recall": 0.9825291181364393,
"eval_runtime": 45.5952,
"eval_samples_per_second": 9.409,
"eval_steps_per_second": 1.579,
"step": 1560
},
{
"epoch": 5.25,
"eval_accuracy": 0.9970947971664323,
"eval_f1": 0.9810695039380959,
"eval_loss": 0.014422405511140823,
"eval_precision": 0.977692095841366,
"eval_recall": 0.9844703272323905,
"eval_runtime": 45.732,
"eval_samples_per_second": 9.381,
"eval_steps_per_second": 1.574,
"step": 1570
},
{
"epoch": 5.28,
"eval_accuracy": 0.9970947971664323,
"eval_f1": 0.9809075816270061,
"eval_loss": 0.01434118952602148,
"eval_precision": 0.9787410270568746,
"eval_recall": 0.983083749306711,
"eval_runtime": 45.5148,
"eval_samples_per_second": 9.425,
"eval_steps_per_second": 1.582,
"step": 1580
},
{
"epoch": 5.32,
"eval_accuracy": 0.9970019368018891,
"eval_f1": 0.9791350006908941,
"eval_loss": 0.014856048859655857,
"eval_precision": 0.9757642522721014,
"eval_recall": 0.9825291181364393,
"eval_runtime": 46.2893,
"eval_samples_per_second": 9.268,
"eval_steps_per_second": 1.555,
"step": 1590
},
{
"epoch": 5.35,
"eval_accuracy": 0.9970549998673424,
"eval_f1": 0.9803541781959049,
"eval_loss": 0.015461008064448833,
"eval_precision": 0.9781888459414688,
"eval_recall": 0.9825291181364393,
"eval_runtime": 45.2253,
"eval_samples_per_second": 9.486,
"eval_steps_per_second": 1.592,
"step": 1600
},
{
"epoch": 5.38,
"eval_accuracy": 0.9970549998673424,
"eval_f1": 0.9800884955752212,
"eval_loss": 0.01574764773249626,
"eval_precision": 0.9773855488141202,
"eval_recall": 0.9828064337215752,
"eval_runtime": 45.056,
"eval_samples_per_second": 9.521,
"eval_steps_per_second": 1.598,
"step": 1610
},
{
"epoch": 5.42,
"eval_accuracy": 0.997041734100979,
"eval_f1": 0.9792645839093173,
"eval_loss": 0.015540325082838535,
"eval_precision": 0.976295479603087,
"eval_recall": 0.9822518025513034,
"eval_runtime": 45.1752,
"eval_samples_per_second": 9.496,
"eval_steps_per_second": 1.594,
"step": 1620
},
{
"epoch": 5.45,
"eval_accuracy": 0.9969621395027991,
"eval_f1": 0.9781526548672567,
"eval_loss": 0.015259744599461555,
"eval_precision": 0.9754550468836183,
"eval_recall": 0.980865224625624,
"eval_runtime": 45.477,
"eval_samples_per_second": 9.433,
"eval_steps_per_second": 1.583,
"step": 1630
},
{
"epoch": 5.48,
"eval_accuracy": 0.997041734100979,
"eval_f1": 0.9809075816270061,
"eval_loss": 0.01531192846596241,
"eval_precision": 0.9787410270568746,
"eval_recall": 0.983083749306711,
"eval_runtime": 45.3307,
"eval_samples_per_second": 9.464,
"eval_steps_per_second": 1.588,
"step": 1640
},
{
"epoch": 5.52,
"eval_accuracy": 0.9970152025682524,
"eval_f1": 0.9804790253357331,
"eval_loss": 0.015362209640443325,
"eval_precision": 0.9789881116947746,
"eval_recall": 0.9819744869661675,
"eval_runtime": 45.5289,
"eval_samples_per_second": 9.423,
"eval_steps_per_second": 1.581,
"step": 1650
},
{
"epoch": 5.55,
"eval_accuracy": 0.9968825449046191,
"eval_f1": 0.9736151402127364,
"eval_loss": 0.016267232596874237,
"eval_precision": 0.9699972474538948,
"eval_recall": 0.9772601220188575,
"eval_runtime": 45.4269,
"eval_samples_per_second": 9.444,
"eval_steps_per_second": 1.585,
"step": 1660
},
{
"epoch": 5.59,
"eval_accuracy": 0.9970152025682524,
"eval_f1": 0.9776181265542968,
"eval_loss": 0.01579289324581623,
"eval_precision": 0.9741189427312775,
"eval_recall": 0.9811425402107599,
"eval_runtime": 46.1943,
"eval_samples_per_second": 9.287,
"eval_steps_per_second": 1.559,
"step": 1670
},
{
"epoch": 5.62,
"eval_accuracy": 0.9970284683346157,
"eval_f1": 0.9785407725321887,
"eval_loss": 0.01532789133489132,
"eval_precision": 0.9770528061929776,
"eval_recall": 0.9800332778702163,
"eval_runtime": 46.2745,
"eval_samples_per_second": 9.271,
"eval_steps_per_second": 1.556,
"step": 1680
},
{
"epoch": 5.65,
"eval_accuracy": 0.9970549998673424,
"eval_f1": 0.979665237238899,
"eval_loss": 0.01536885742098093,
"eval_precision": 0.9773668230747999,
"eval_recall": 0.9819744869661675,
"eval_runtime": 45.136,
"eval_samples_per_second": 9.505,
"eval_steps_per_second": 1.595,
"step": 1690
},
{
"epoch": 5.69,
"eval_accuracy": 0.9969488737364357,
"eval_f1": 0.9772445179975174,
"eval_loss": 0.01578596606850624,
"eval_precision": 0.9720164609053498,
"eval_recall": 0.9825291181364393,
"eval_runtime": 45.0296,
"eval_samples_per_second": 9.527,
"eval_steps_per_second": 1.599,
"step": 1700
},
{
"epoch": 5.72,
"eval_accuracy": 0.9968560133718924,
"eval_f1": 0.9757040309221425,
"eval_loss": 0.01535722240805626,
"eval_precision": 0.971412864211105,
"eval_recall": 0.9800332778702163,
"eval_runtime": 45.2636,
"eval_samples_per_second": 9.478,
"eval_steps_per_second": 1.591,
"step": 1710
},
{
"epoch": 5.75,
"eval_accuracy": 0.9970947971664323,
"eval_f1": 0.9769496204278812,
"eval_loss": 0.01525976974517107,
"eval_precision": 0.9725199230557846,
"eval_recall": 0.9814198557958957,
"eval_runtime": 45.5287,
"eval_samples_per_second": 9.423,
"eval_steps_per_second": 1.581,
"step": 1720
},
{
"epoch": 5.79,
"eval_accuracy": 0.9970682656337057,
"eval_f1": 0.9776181265542968,
"eval_loss": 0.014473304152488708,
"eval_precision": 0.9741189427312775,
"eval_recall": 0.9811425402107599,
"eval_runtime": 45.6773,
"eval_samples_per_second": 9.392,
"eval_steps_per_second": 1.576,
"step": 1730
},
{
"epoch": 5.82,
"eval_accuracy": 0.9971345944655223,
"eval_f1": 0.9802349689011749,
"eval_loss": 0.013995842076838017,
"eval_precision": 0.9771286855883163,
"eval_recall": 0.9833610648918469,
"eval_runtime": 45.5912,
"eval_samples_per_second": 9.41,
"eval_steps_per_second": 1.579,
"step": 1740
},
{
"epoch": 5.85,
"eval_accuracy": 0.9970947971664323,
"eval_f1": 0.9808864265927978,
"eval_loss": 0.014489100314676762,
"eval_precision": 0.9798007747648035,
"eval_recall": 0.9819744869661675,
"eval_runtime": 45.3576,
"eval_samples_per_second": 9.458,
"eval_steps_per_second": 1.587,
"step": 1750
},
{
"epoch": 5.89,
"eval_accuracy": 0.9972274548300656,
"eval_f1": 0.9808864265927978,
"eval_loss": 0.014342778362333775,
"eval_precision": 0.9798007747648035,
"eval_recall": 0.9819744869661675,
"eval_runtime": 45.5077,
"eval_samples_per_second": 9.427,
"eval_steps_per_second": 1.582,
"step": 1760
},
{
"epoch": 5.92,
"eval_accuracy": 0.9972805178955189,
"eval_f1": 0.9800774764803543,
"eval_loss": 0.014782003127038479,
"eval_precision": 0.9779127553837659,
"eval_recall": 0.9822518025513034,
"eval_runtime": 45.3932,
"eval_samples_per_second": 9.451,
"eval_steps_per_second": 1.586,
"step": 1770
},
{
"epoch": 5.95,
"eval_accuracy": 0.9972009232973389,
"eval_f1": 0.978852798894264,
"eval_loss": 0.014779850840568542,
"eval_precision": 0.9757508955635161,
"eval_recall": 0.9819744869661675,
"eval_runtime": 45.6592,
"eval_samples_per_second": 9.396,
"eval_steps_per_second": 1.577,
"step": 1780
},
{
"epoch": 5.99,
"eval_accuracy": 0.9971213286991589,
"eval_f1": 0.9799141155284665,
"eval_loss": 0.015209286473691463,
"eval_precision": 0.9789648491558262,
"eval_recall": 0.980865224625624,
"eval_runtime": 46.4662,
"eval_samples_per_second": 9.233,
"eval_steps_per_second": 1.55,
"step": 1790
},
{
"epoch": 6.02,
"eval_accuracy": 0.9971876575309756,
"eval_f1": 0.981011781011781,
"eval_loss": 0.015130845829844475,
"eval_precision": 0.9806040454419507,
"eval_recall": 0.9814198557958957,
"eval_runtime": 45.3314,
"eval_samples_per_second": 9.464,
"eval_steps_per_second": 1.588,
"step": 1800
},
{
"epoch": 6.05,
"eval_accuracy": 0.9971213286991589,
"eval_f1": 0.9795297372060858,
"eval_loss": 0.015158111229538918,
"eval_precision": 0.9770971302428256,
"eval_recall": 0.9819744869661675,
"eval_runtime": 45.4446,
"eval_samples_per_second": 9.44,
"eval_steps_per_second": 1.584,
"step": 1810
},
{
"epoch": 6.09,
"eval_accuracy": 0.9970947971664323,
"eval_f1": 0.9782638792745397,
"eval_loss": 0.015132046304643154,
"eval_precision": 0.9767763339784352,
"eval_recall": 0.9797559622850804,
"eval_runtime": 45.4433,
"eval_samples_per_second": 9.44,
"eval_steps_per_second": 1.584,
"step": 1820
},
{
"epoch": 6.12,
"eval_accuracy": 0.9968825449046191,
"eval_f1": 0.9705516383243468,
"eval_loss": 0.01593286544084549,
"eval_precision": 0.967741935483871,
"eval_recall": 0.9733777038269551,
"eval_runtime": 45.4009,
"eval_samples_per_second": 9.449,
"eval_steps_per_second": 1.586,
"step": 1830
},
{
"epoch": 6.15,
"eval_accuracy": 0.9969356079700724,
"eval_f1": 0.9730774540936076,
"eval_loss": 0.014840428717434406,
"eval_precision": 0.9689304371734946,
"eval_recall": 0.9772601220188575,
"eval_runtime": 45.3952,
"eval_samples_per_second": 9.45,
"eval_steps_per_second": 1.586,
"step": 1840
},
{
"epoch": 6.19,
"eval_accuracy": 0.9966570268764426,
"eval_f1": 0.9764868603042877,
"eval_loss": 0.016662631183862686,
"eval_precision": 0.9740618101545254,
"eval_recall": 0.9789240155296728,
"eval_runtime": 45.439,
"eval_samples_per_second": 9.441,
"eval_steps_per_second": 1.585,
"step": 1850
},
{
"epoch": 6.22,
"eval_accuracy": 0.9965376349791727,
"eval_f1": 0.9750761561894212,
"eval_loss": 0.01773080602288246,
"eval_precision": 0.9737278761061947,
"eval_recall": 0.9764281752634498,
"eval_runtime": 45.6526,
"eval_samples_per_second": 9.397,
"eval_steps_per_second": 1.577,
"step": 1860
},
{
"epoch": 6.25,
"eval_accuracy": 0.9964182430819029,
"eval_f1": 0.9697221070095395,
"eval_loss": 0.018397442996501923,
"eval_precision": 0.9669148056244831,
"eval_recall": 0.9725457570715474,
"eval_runtime": 45.4014,
"eval_samples_per_second": 9.449,
"eval_steps_per_second": 1.586,
"step": 1870
},
{
"epoch": 6.29,
"eval_accuracy": 0.9966968241755326,
"eval_f1": 0.9773292784075199,
"eval_loss": 0.0170457661151886,
"eval_precision": 0.9743660418963617,
"eval_recall": 0.9803105934553522,
"eval_runtime": 45.6124,
"eval_samples_per_second": 9.405,
"eval_steps_per_second": 1.579,
"step": 1880
},
{
"epoch": 6.32,
"eval_accuracy": 0.9968029503064392,
"eval_f1": 0.9793046357615895,
"eval_loss": 0.01652824692428112,
"eval_precision": 0.9744645799011532,
"eval_recall": 0.9841930116472546,
"eval_runtime": 45.4345,
"eval_samples_per_second": 9.442,
"eval_steps_per_second": 1.585,
"step": 1890
},
{
"epoch": 6.35,
"eval_accuracy": 0.9967233557082593,
"eval_f1": 0.978476821192053,
"eval_loss": 0.016787514090538025,
"eval_precision": 0.9736408566721582,
"eval_recall": 0.9833610648918469,
"eval_runtime": 45.5818,
"eval_samples_per_second": 9.412,
"eval_steps_per_second": 1.58,
"step": 1900
},
{
"epoch": 6.39,
"eval_accuracy": 0.9965641665118994,
"eval_f1": 0.975320557010892,
"eval_loss": 0.01782037876546383,
"eval_precision": 0.9698382231971483,
"eval_recall": 0.980865224625624,
"eval_runtime": 45.9556,
"eval_samples_per_second": 9.335,
"eval_steps_per_second": 1.567,
"step": 1910
},
{
"epoch": 6.42,
"eval_accuracy": 0.9966702926428059,
"eval_f1": 0.9768211920529801,
"eval_loss": 0.017588861286640167,
"eval_precision": 0.9719934102141681,
"eval_recall": 0.9816971713810316,
"eval_runtime": 45.1589,
"eval_samples_per_second": 9.5,
"eval_steps_per_second": 1.594,
"step": 1920
},
{
"epoch": 6.45,
"eval_accuracy": 0.9969488737364357,
"eval_f1": 0.9810799613313078,
"eval_loss": 0.016702750697731972,
"eval_precision": 0.9771664374140303,
"eval_recall": 0.9850249584026622,
"eval_runtime": 45.117,
"eval_samples_per_second": 9.509,
"eval_steps_per_second": 1.596,
"step": 1930
},
{
"epoch": 6.49,
"eval_accuracy": 0.9968029503064392,
"eval_f1": 0.9783179118906229,
"eval_loss": 0.016243569552898407,
"eval_precision": 0.9744154057771665,
"eval_recall": 0.9822518025513034,
"eval_runtime": 45.1078,
"eval_samples_per_second": 9.511,
"eval_steps_per_second": 1.596,
"step": 1940
},
{
"epoch": 6.52,
"eval_accuracy": 0.9968692791382558,
"eval_f1": 0.9773418071290412,
"eval_loss": 0.01623663119971752,
"eval_precision": 0.9738436123348018,
"eval_recall": 0.980865224625624,
"eval_runtime": 45.7949,
"eval_samples_per_second": 9.368,
"eval_steps_per_second": 1.572,
"step": 1950
},
{
"epoch": 6.56,
"eval_accuracy": 0.9967896845400759,
"eval_f1": 0.9769496204278812,
"eval_loss": 0.016976099461317062,
"eval_precision": 0.9725199230557846,
"eval_recall": 0.9814198557958957,
"eval_runtime": 45.3661,
"eval_samples_per_second": 9.456,
"eval_steps_per_second": 1.587,
"step": 1960
},
{
"epoch": 6.59,
"eval_accuracy": 0.9967233557082593,
"eval_f1": 0.9759933774834438,
"eval_loss": 0.017524730414152145,
"eval_precision": 0.971169686985173,
"eval_recall": 0.980865224625624,
"eval_runtime": 45.7337,
"eval_samples_per_second": 9.38,
"eval_steps_per_second": 1.574,
"step": 1970
},
{
"epoch": 6.62,
"eval_accuracy": 0.9968029503064392,
"eval_f1": 0.9794397681799365,
"eval_loss": 0.016901282593607903,
"eval_precision": 0.9747322164240593,
"eval_recall": 0.9841930116472546,
"eval_runtime": 45.4807,
"eval_samples_per_second": 9.433,
"eval_steps_per_second": 1.583,
"step": 1980
},
{
"epoch": 6.66,
"eval_accuracy": 0.9967896845400759,
"eval_f1": 0.9788761562888305,
"eval_loss": 0.01667814515531063,
"eval_precision": 0.9747044267253231,
"eval_recall": 0.983083749306711,
"eval_runtime": 45.6668,
"eval_samples_per_second": 9.394,
"eval_steps_per_second": 1.577,
"step": 1990
},
{
"epoch": 6.69,
"learning_rate": 8.000000000000001e-06,
"loss": 0.0064,
"step": 2000
},
{
"epoch": 6.69,
"eval_accuracy": 0.9967100899418959,
"eval_f1": 0.9776428374275461,
"eval_loss": 0.016720809042453766,
"eval_precision": 0.9730769230769231,
"eval_recall": 0.9822518025513034,
"eval_runtime": 45.4912,
"eval_samples_per_second": 9.43,
"eval_steps_per_second": 1.583,
"step": 2000
},
{
"epoch": 6.72,
"eval_accuracy": 0.9966172295773527,
"eval_f1": 0.9770781552057443,
"eval_loss": 0.017004678025841713,
"eval_precision": 0.9730473047304731,
"eval_recall": 0.9811425402107599,
"eval_runtime": 45.7222,
"eval_samples_per_second": 9.383,
"eval_steps_per_second": 1.575,
"step": 2010
},
{
"epoch": 6.76,
"eval_accuracy": 0.9966172295773527,
"eval_f1": 0.9774892970584174,
"eval_loss": 0.016945617273449898,
"eval_precision": 0.9735900962861073,
"eval_recall": 0.9814198557958957,
"eval_runtime": 45.3731,
"eval_samples_per_second": 9.455,
"eval_steps_per_second": 1.587,
"step": 2020
},
{
"epoch": 6.79,
"eval_accuracy": 0.9967100899418959,
"eval_f1": 0.9788994621431527,
"eval_loss": 0.016928063705563545,
"eval_precision": 0.9736625514403292,
"eval_recall": 0.9841930116472546,
"eval_runtime": 45.8513,
"eval_samples_per_second": 9.356,
"eval_steps_per_second": 1.57,
"step": 2030
},
{
"epoch": 6.82,
"eval_accuracy": 0.9967896845400759,
"eval_f1": 0.9779675020655467,
"eval_loss": 0.01666436158120632,
"eval_precision": 0.9712800875273523,
"eval_recall": 0.9847476428175264,
"eval_runtime": 45.4258,
"eval_samples_per_second": 9.444,
"eval_steps_per_second": 1.585,
"step": 2040
},
{
"epoch": 6.86,
"eval_accuracy": 0.9968560133718924,
"eval_f1": 0.9770130763936682,
"eval_loss": 0.016234010457992554,
"eval_precision": 0.969937141295436,
"eval_recall": 0.9841930116472546,
"eval_runtime": 45.6745,
"eval_samples_per_second": 9.393,
"eval_steps_per_second": 1.576,
"step": 2050
},
{
"epoch": 6.89,
"eval_accuracy": 0.9968029503064392,
"eval_f1": 0.9758986365514392,
"eval_loss": 0.015693064779043198,
"eval_precision": 0.9693570451436389,
"eval_recall": 0.9825291181364393,
"eval_runtime": 46.507,
"eval_samples_per_second": 9.224,
"eval_steps_per_second": 1.548,
"step": 2060
},
{
"epoch": 6.92,
"eval_accuracy": 0.9968825449046191,
"eval_f1": 0.978476821192053,
"eval_loss": 0.015247814357280731,
"eval_precision": 0.9736408566721582,
"eval_recall": 0.9833610648918469,
"eval_runtime": 45.4327,
"eval_samples_per_second": 9.443,
"eval_steps_per_second": 1.585,
"step": 2070
},
{
"epoch": 6.96,
"eval_accuracy": 0.9968692791382558,
"eval_f1": 0.9795636564484949,
"eval_loss": 0.01587117277085781,
"eval_precision": 0.9755225522552256,
"eval_recall": 0.9836383804769828,
"eval_runtime": 45.1551,
"eval_samples_per_second": 9.501,
"eval_steps_per_second": 1.595,
"step": 2080
},
{
"epoch": 6.99,
"eval_accuracy": 0.9967100899418959,
"eval_f1": 0.9783776339347198,
"eval_loss": 0.017061389982700348,
"eval_precision": 0.9718194254445964,
"eval_recall": 0.9850249584026622,
"eval_runtime": 45.1957,
"eval_samples_per_second": 9.492,
"eval_steps_per_second": 1.593,
"step": 2090
},
{
"epoch": 7.02,
"eval_accuracy": 0.9965906980446261,
"eval_f1": 0.9775821757667446,
"eval_loss": 0.018233157694339752,
"eval_precision": 0.9697135061391542,
"eval_recall": 0.985579589572934,
"eval_runtime": 45.2503,
"eval_samples_per_second": 9.481,
"eval_steps_per_second": 1.591,
"step": 2100
},
{
"epoch": 7.06,
"eval_accuracy": 0.9970019368018891,
"eval_f1": 0.9790113228389947,
"eval_loss": 0.01590120792388916,
"eval_precision": 0.974972497249725,
"eval_recall": 0.983083749306711,
"eval_runtime": 45.4565,
"eval_samples_per_second": 9.438,
"eval_steps_per_second": 1.584,
"step": 2110
},
{
"epoch": 7.09,
"eval_accuracy": 0.9968692791382558,
"eval_f1": 0.9770971302428255,
"eval_loss": 0.015739668160676956,
"eval_precision": 0.972267984623833,
"eval_recall": 0.9819744869661675,
"eval_runtime": 46.0012,
"eval_samples_per_second": 9.326,
"eval_steps_per_second": 1.565,
"step": 2120
},
{
"epoch": 7.12,
"eval_accuracy": 0.9969223422037091,
"eval_f1": 0.9790113228389947,
"eval_loss": 0.015736253932118416,
"eval_precision": 0.974972497249725,
"eval_recall": 0.983083749306711,
"eval_runtime": 45.4255,
"eval_samples_per_second": 9.444,
"eval_steps_per_second": 1.585,
"step": 2130
},
{
"epoch": 7.16,
"eval_accuracy": 0.9968825449046191,
"eval_f1": 0.9784827586206897,
"eval_loss": 0.016040045768022537,
"eval_precision": 0.9733809001097695,
"eval_recall": 0.9836383804769828,
"eval_runtime": 45.5296,
"eval_samples_per_second": 9.422,
"eval_steps_per_second": 1.581,
"step": 2140
},
{
"epoch": 7.19,
"eval_accuracy": 0.9969223422037091,
"eval_f1": 0.9786413118368471,
"eval_loss": 0.01620173640549183,
"eval_precision": 0.9726102437688304,
"eval_recall": 0.9847476428175264,
"eval_runtime": 45.6034,
"eval_samples_per_second": 9.407,
"eval_steps_per_second": 1.579,
"step": 2150
},
{
"epoch": 7.22,
"eval_accuracy": 0.9969886710355257,
"eval_f1": 0.9798565121412803,
"eval_loss": 0.0158588457852602,
"eval_precision": 0.9750137287204832,
"eval_recall": 0.9847476428175264,
"eval_runtime": 45.789,
"eval_samples_per_second": 9.369,
"eval_steps_per_second": 1.572,
"step": 2160
},
{
"epoch": 7.26,
"eval_accuracy": 0.9969488737364357,
"eval_f1": 0.9791522849647936,
"eval_loss": 0.015738798305392265,
"eval_precision": 0.9749793786087435,
"eval_recall": 0.9833610648918469,
"eval_runtime": 45.511,
"eval_samples_per_second": 9.426,
"eval_steps_per_second": 1.582,
"step": 2170
},
{
"epoch": 7.29,
"eval_accuracy": 0.9970549998673424,
"eval_f1": 0.9794113582976371,
"eval_loss": 0.015642931684851646,
"eval_precision": 0.976039658496282,
"eval_recall": 0.9828064337215752,
"eval_runtime": 45.1132,
"eval_samples_per_second": 9.509,
"eval_steps_per_second": 1.596,
"step": 2180
},
{
"epoch": 7.32,
"eval_accuracy": 0.9971611259982489,
"eval_f1": 0.9811998894111142,
"eval_loss": 0.015118683688342571,
"eval_precision": 0.9782249173098125,
"eval_recall": 0.9841930116472546,
"eval_runtime": 45.0629,
"eval_samples_per_second": 9.52,
"eval_steps_per_second": 1.598,
"step": 2190
},
{
"epoch": 7.36,
"eval_accuracy": 0.9973601124936987,
"eval_f1": 0.982160143825197,
"eval_loss": 0.015025600790977478,
"eval_precision": 0.9795862068965517,
"eval_recall": 0.9847476428175264,
"eval_runtime": 45.3715,
"eval_samples_per_second": 9.455,
"eval_steps_per_second": 1.587,
"step": 2200
},
{
"epoch": 7.39,
"eval_accuracy": 0.9972539863627922,
"eval_f1": 0.9786821705426357,
"eval_loss": 0.014340460300445557,
"eval_precision": 0.9770591487009398,
"eval_recall": 0.9803105934553522,
"eval_runtime": 45.1287,
"eval_samples_per_second": 9.506,
"eval_steps_per_second": 1.595,
"step": 2210
},
{
"epoch": 7.42,
"eval_accuracy": 0.9973335809609721,
"eval_f1": 0.9813097051086805,
"eval_loss": 0.0135923121124506,
"eval_precision": 0.979817528338402,
"eval_recall": 0.9828064337215752,
"eval_runtime": 45.1943,
"eval_samples_per_second": 9.492,
"eval_steps_per_second": 1.593,
"step": 2220
},
{
"epoch": 7.46,
"eval_accuracy": 0.9972009232973389,
"eval_f1": 0.978570441034149,
"eval_loss": 0.014164491556584835,
"eval_precision": 0.9757375241246209,
"eval_recall": 0.9814198557958957,
"eval_runtime": 45.309,
"eval_samples_per_second": 9.468,
"eval_steps_per_second": 1.589,
"step": 2230
},
{
"epoch": 7.49,
"eval_accuracy": 0.9972672521291555,
"eval_f1": 0.9806308799114555,
"eval_loss": 0.01402602344751358,
"eval_precision": 0.9784649364991718,
"eval_recall": 0.9828064337215752,
"eval_runtime": 45.5204,
"eval_samples_per_second": 9.424,
"eval_steps_per_second": 1.582,
"step": 2240
},
{
"epoch": 7.53,
"eval_accuracy": 0.9972539863627922,
"eval_f1": 0.9809181415929205,
"eval_loss": 0.014084520749747753,
"eval_precision": 0.9782129067843354,
"eval_recall": 0.9836383804769828,
"eval_runtime": 45.1882,
"eval_samples_per_second": 9.494,
"eval_steps_per_second": 1.593,
"step": 2250
},
{
"epoch": 7.56,
"eval_accuracy": 0.9972937836618821,
"eval_f1": 0.9835111542192047,
"eval_loss": 0.014140544459223747,
"eval_precision": 0.9828302409304902,
"eval_recall": 0.9841930116472546,
"eval_runtime": 45.1162,
"eval_samples_per_second": 9.509,
"eval_steps_per_second": 1.596,
"step": 2260
},
{
"epoch": 7.59,
"eval_accuracy": 0.9971213286991589,
"eval_f1": 0.980484429065744,
"eval_loss": 0.015128599479794502,
"eval_precision": 0.9787234042553191,
"eval_recall": 0.9822518025513034,
"eval_runtime": 45.1622,
"eval_samples_per_second": 9.499,
"eval_steps_per_second": 1.594,
"step": 2270
},
{
"epoch": 7.63,
"eval_accuracy": 0.9971743917646122,
"eval_f1": 0.9838017444275232,
"eval_loss": 0.014916467480361462,
"eval_precision": 0.9823057782692839,
"eval_recall": 0.9853022739877981,
"eval_runtime": 45.3078,
"eval_samples_per_second": 9.469,
"eval_steps_per_second": 1.589,
"step": 2280
},
{
"epoch": 7.66,
"eval_accuracy": 0.9971876575309756,
"eval_f1": 0.9826989619377162,
"eval_loss": 0.014806441031396389,
"eval_precision": 0.980933959657364,
"eval_recall": 0.9844703272323905,
"eval_runtime": 45.215,
"eval_samples_per_second": 9.488,
"eval_steps_per_second": 1.592,
"step": 2290
},
{
"epoch": 7.69,
"eval_accuracy": 0.9973335809609721,
"eval_f1": 0.9828444936358606,
"eval_loss": 0.014511052519083023,
"eval_precision": 0.9806736609607951,
"eval_recall": 0.9850249584026622,
"eval_runtime": 45.1721,
"eval_samples_per_second": 9.497,
"eval_steps_per_second": 1.594,
"step": 2300
},
{
"epoch": 7.73,
"eval_accuracy": 0.9973070494282454,
"eval_f1": 0.9824124082537044,
"eval_loss": 0.014819289557635784,
"eval_precision": 0.9811894882434301,
"eval_recall": 0.9836383804769828,
"eval_runtime": 45.484,
"eval_samples_per_second": 9.432,
"eval_steps_per_second": 1.583,
"step": 2310
},
{
"epoch": 7.76,
"eval_accuracy": 0.9971611259982489,
"eval_f1": 0.9818935729094679,
"eval_loss": 0.015233664773404598,
"eval_precision": 0.9787820336180766,
"eval_recall": 0.9850249584026622,
"eval_runtime": 45.245,
"eval_samples_per_second": 9.482,
"eval_steps_per_second": 1.591,
"step": 2320
},
{
"epoch": 7.79,
"eval_accuracy": 0.9970549998673424,
"eval_f1": 0.9814865985078752,
"eval_loss": 0.01592710055410862,
"eval_precision": 0.9779735682819384,
"eval_recall": 0.9850249584026622,
"eval_runtime": 45.1068,
"eval_samples_per_second": 9.511,
"eval_steps_per_second": 1.596,
"step": 2330
},
{
"epoch": 7.83,
"eval_accuracy": 0.9970019368018891,
"eval_f1": 0.9807984528249758,
"eval_loss": 0.01635568030178547,
"eval_precision": 0.9771538673272777,
"eval_recall": 0.9844703272323905,
"eval_runtime": 45.3054,
"eval_samples_per_second": 9.469,
"eval_steps_per_second": 1.589,
"step": 2340
},
{
"epoch": 7.86,
"eval_accuracy": 0.9971213286991589,
"eval_f1": 0.9810747340792927,
"eval_loss": 0.015507887117564678,
"eval_precision": 0.9774291219377924,
"eval_recall": 0.9847476428175264,
"eval_runtime": 45.3049,
"eval_samples_per_second": 9.469,
"eval_steps_per_second": 1.589,
"step": 2350
},
{
"epoch": 7.89,
"eval_accuracy": 0.9971743917646122,
"eval_f1": 0.9814814814814814,
"eval_loss": 0.01488608680665493,
"eval_precision": 0.978236914600551,
"eval_recall": 0.9847476428175264,
"eval_runtime": 45.3669,
"eval_samples_per_second": 9.456,
"eval_steps_per_second": 1.587,
"step": 2360
},
{
"epoch": 7.93,
"eval_accuracy": 0.9969090764373458,
"eval_f1": 0.9790055248618784,
"eval_loss": 0.016140291467308998,
"eval_precision": 0.9752339020363237,
"eval_recall": 0.9828064337215752,
"eval_runtime": 45.5755,
"eval_samples_per_second": 9.413,
"eval_steps_per_second": 1.58,
"step": 2370
},
{
"epoch": 7.96,
"eval_accuracy": 0.9968427476055292,
"eval_f1": 0.980511402902557,
"eval_loss": 0.01678432524204254,
"eval_precision": 0.9774042435932764,
"eval_recall": 0.9836383804769828,
"eval_runtime": 45.3412,
"eval_samples_per_second": 9.462,
"eval_steps_per_second": 1.588,
"step": 2380
},
{
"epoch": 7.99,
"eval_accuracy": 0.9968162160728026,
"eval_f1": 0.9803704727674868,
"eval_loss": 0.016629330813884735,
"eval_precision": 0.9773980154355016,
"eval_recall": 0.9833610648918469,
"eval_runtime": 45.5099,
"eval_samples_per_second": 9.427,
"eval_steps_per_second": 1.582,
"step": 2390
},
{
"epoch": 8.03,
"eval_accuracy": 0.9968560133718924,
"eval_f1": 0.9798119469026549,
"eval_loss": 0.01662250980734825,
"eval_precision": 0.9771097628240485,
"eval_recall": 0.9825291181364393,
"eval_runtime": 45.337,
"eval_samples_per_second": 9.462,
"eval_steps_per_second": 1.588,
"step": 2400
},
{
"epoch": 8.06,
"eval_accuracy": 0.9970019368018891,
"eval_f1": 0.9813355454168395,
"eval_loss": 0.0163425225764513,
"eval_precision": 0.978494623655914,
"eval_recall": 0.9841930116472546,
"eval_runtime": 45.4794,
"eval_samples_per_second": 9.433,
"eval_steps_per_second": 1.583,
"step": 2410
},
{
"epoch": 8.09,
"eval_accuracy": 0.9970947971664323,
"eval_f1": 0.9811842833425568,
"eval_loss": 0.016381612047553062,
"eval_precision": 0.9790171176145775,
"eval_recall": 0.9833610648918469,
"eval_runtime": 45.1726,
"eval_samples_per_second": 9.497,
"eval_steps_per_second": 1.594,
"step": 2420
},
{
"epoch": 8.13,
"eval_accuracy": 0.9971213286991589,
"eval_f1": 0.9817528338401991,
"eval_loss": 0.016340401023626328,
"eval_precision": 0.9787761852260198,
"eval_recall": 0.9847476428175264,
"eval_runtime": 45.3524,
"eval_samples_per_second": 9.459,
"eval_steps_per_second": 1.588,
"step": 2430
},
{
"epoch": 8.16,
"eval_accuracy": 0.9970019368018891,
"eval_f1": 0.980771890994605,
"eval_loss": 0.016326354816555977,
"eval_precision": 0.9784708804857852,
"eval_recall": 0.983083749306711,
"eval_runtime": 45.2927,
"eval_samples_per_second": 9.472,
"eval_steps_per_second": 1.59,
"step": 2440
},
{
"epoch": 8.19,
"eval_accuracy": 0.9970682656337057,
"eval_f1": 0.9817275747508305,
"eval_loss": 0.015510362572968006,
"eval_precision": 0.9800995024875622,
"eval_recall": 0.9833610648918469,
"eval_runtime": 45.5096,
"eval_samples_per_second": 9.427,
"eval_steps_per_second": 1.582,
"step": 2450
},
{
"epoch": 8.23,
"eval_accuracy": 0.9971345944655223,
"eval_f1": 0.9824464409122322,
"eval_loss": 0.015236412174999714,
"eval_precision": 0.9793331496279967,
"eval_recall": 0.985579589572934,
"eval_runtime": 45.3704,
"eval_samples_per_second": 9.455,
"eval_steps_per_second": 1.587,
"step": 2460
},
{
"epoch": 8.26,
"eval_accuracy": 0.9971345944655223,
"eval_f1": 0.9814865985078752,
"eval_loss": 0.015579747967422009,
"eval_precision": 0.9779735682819384,
"eval_recall": 0.9850249584026622,
"eval_runtime": 45.2219,
"eval_samples_per_second": 9.487,
"eval_steps_per_second": 1.592,
"step": 2470
},
{
"epoch": 8.29,
"eval_accuracy": 0.9972009232973389,
"eval_f1": 0.9789590254706533,
"eval_loss": 0.014976629987359047,
"eval_precision": 0.9773355444997236,
"eval_recall": 0.9805879090404881,
"eval_runtime": 45.5521,
"eval_samples_per_second": 9.418,
"eval_steps_per_second": 1.581,
"step": 2480
},
{
"epoch": 8.33,
"eval_accuracy": 0.9973335809609721,
"eval_f1": 0.9824318716281643,
"eval_loss": 0.014180959202349186,
"eval_precision": 0.9801269666022633,
"eval_recall": 0.9847476428175264,
"eval_runtime": 45.6388,
"eval_samples_per_second": 9.4,
"eval_steps_per_second": 1.578,
"step": 2490
},
{
"epoch": 8.36,
"learning_rate": 7.500000000000001e-06,
"loss": 0.0051,
"step": 2500
},
{
"epoch": 8.36,
"eval_accuracy": 0.9972274548300656,
"eval_f1": 0.9791522849647936,
"eval_loss": 0.014656171202659607,
"eval_precision": 0.9749793786087435,
"eval_recall": 0.9833610648918469,
"eval_runtime": 45.2727,
"eval_samples_per_second": 9.476,
"eval_steps_per_second": 1.59,
"step": 2500
},
{
"epoch": 8.39,
"eval_accuracy": 0.9971213286991589,
"eval_f1": 0.9780477702609416,
"eval_loss": 0.014881155453622341,
"eval_precision": 0.9738795710750618,
"eval_recall": 0.9822518025513034,
"eval_runtime": 45.7124,
"eval_samples_per_second": 9.385,
"eval_steps_per_second": 1.575,
"step": 2510
},
{
"epoch": 8.43,
"eval_accuracy": 0.9972141890637022,
"eval_f1": 0.9806629834254144,
"eval_loss": 0.014929546974599361,
"eval_precision": 0.976884975233902,
"eval_recall": 0.9844703272323905,
"eval_runtime": 45.3886,
"eval_samples_per_second": 9.452,
"eval_steps_per_second": 1.586,
"step": 2520
},
{
"epoch": 8.46,
"eval_accuracy": 0.9972009232973389,
"eval_f1": 0.9802404311178665,
"eval_loss": 0.014953644014894962,
"eval_precision": 0.976865877168824,
"eval_recall": 0.9836383804769828,
"eval_runtime": 45.8505,
"eval_samples_per_second": 9.356,
"eval_steps_per_second": 1.57,
"step": 2530
},
{
"epoch": 8.49,
"eval_accuracy": 0.9971345944655223,
"eval_f1": 0.9813252178724583,
"eval_loss": 0.014914426021277905,
"eval_precision": 0.979022909191278,
"eval_recall": 0.9836383804769828,
"eval_runtime": 45.5694,
"eval_samples_per_second": 9.414,
"eval_steps_per_second": 1.58,
"step": 2540
},
{
"epoch": 8.53,
"eval_accuracy": 0.9972672521291555,
"eval_f1": 0.9826941713969264,
"eval_loss": 0.014766544103622437,
"eval_precision": 0.9811998894111141,
"eval_recall": 0.9841930116472546,
"eval_runtime": 45.2509,
"eval_samples_per_second": 9.48,
"eval_steps_per_second": 1.591,
"step": 2550
},
{
"epoch": 8.56,
"eval_accuracy": 0.9972407205964289,
"eval_f1": 0.9839468585662884,
"eval_loss": 0.015172240324318409,
"eval_precision": 0.9820441988950276,
"eval_recall": 0.9858569051580699,
"eval_runtime": 45.7001,
"eval_samples_per_second": 9.387,
"eval_steps_per_second": 1.575,
"step": 2560
},
{
"epoch": 8.6,
"eval_accuracy": 0.9971345944655223,
"eval_f1": 0.9829993089149965,
"eval_loss": 0.015841683372855186,
"eval_precision": 0.9798842656379168,
"eval_recall": 0.9861342207432058,
"eval_runtime": 45.6884,
"eval_samples_per_second": 9.39,
"eval_steps_per_second": 1.576,
"step": 2570
},
{
"epoch": 8.63,
"eval_accuracy": 0.997041734100979,
"eval_f1": 0.9813407049067036,
"eval_loss": 0.016232503578066826,
"eval_precision": 0.9782309176081565,
"eval_recall": 0.9844703272323905,
"eval_runtime": 45.3554,
"eval_samples_per_second": 9.459,
"eval_steps_per_second": 1.587,
"step": 2580
},
{
"epoch": 8.66,
"eval_accuracy": 0.9969621395027991,
"eval_f1": 0.9763714246234628,
"eval_loss": 0.015989486128091812,
"eval_precision": 0.9730101900302947,
"eval_recall": 0.9797559622850804,
"eval_runtime": 45.3338,
"eval_samples_per_second": 9.463,
"eval_steps_per_second": 1.588,
"step": 2590
},
{
"epoch": 8.7,
"eval_accuracy": 0.9969223422037091,
"eval_f1": 0.9746922970543493,
"eval_loss": 0.015164612792432308,
"eval_precision": 0.9721379310344828,
"eval_recall": 0.9772601220188575,
"eval_runtime": 45.3618,
"eval_samples_per_second": 9.457,
"eval_steps_per_second": 1.587,
"step": 2600
},
{
"epoch": 8.73,
"eval_accuracy": 0.9970284683346157,
"eval_f1": 0.9752111895859299,
"eval_loss": 0.015361527912318707,
"eval_precision": 0.9739972337482711,
"eval_recall": 0.9764281752634498,
"eval_runtime": 45.7043,
"eval_samples_per_second": 9.386,
"eval_steps_per_second": 1.575,
"step": 2610
},
{
"epoch": 8.76,
"eval_accuracy": 0.9970947971664323,
"eval_f1": 0.9776057506220625,
"eval_loss": 0.015215002000331879,
"eval_precision": 0.9746416758544653,
"eval_recall": 0.9805879090404881,
"eval_runtime": 45.5622,
"eval_samples_per_second": 9.416,
"eval_steps_per_second": 1.58,
"step": 2620
},
{
"epoch": 8.8,
"eval_accuracy": 0.9970815314000689,
"eval_f1": 0.9777470628887354,
"eval_loss": 0.014545532874763012,
"eval_precision": 0.974648663543676,
"eval_recall": 0.980865224625624,
"eval_runtime": 45.4027,
"eval_samples_per_second": 9.449,
"eval_steps_per_second": 1.586,
"step": 2630
},
{
"epoch": 8.83,
"eval_accuracy": 0.9971611259982489,
"eval_f1": 0.9813355454168395,
"eval_loss": 0.014298198744654655,
"eval_precision": 0.978494623655914,
"eval_recall": 0.9841930116472546,
"eval_runtime": 45.6015,
"eval_samples_per_second": 9.408,
"eval_steps_per_second": 1.579,
"step": 2640
},
{
"epoch": 8.86,
"eval_accuracy": 0.9971213286991589,
"eval_f1": 0.9804952275556785,
"eval_loss": 0.014669723808765411,
"eval_precision": 0.978194866133039,
"eval_recall": 0.9828064337215752,
"eval_runtime": 45.6583,
"eval_samples_per_second": 9.396,
"eval_steps_per_second": 1.577,
"step": 2650
},
{
"epoch": 8.9,
"eval_accuracy": 0.9970549998673424,
"eval_f1": 0.9749550297495504,
"eval_loss": 0.014710523188114166,
"eval_precision": 0.9729356531344933,
"eval_recall": 0.9769828064337216,
"eval_runtime": 45.2863,
"eval_samples_per_second": 9.473,
"eval_steps_per_second": 1.59,
"step": 2660
},
{
"epoch": 8.93,
"eval_accuracy": 0.9972141890637022,
"eval_f1": 0.9820094104622197,
"eval_loss": 0.014592879451811314,
"eval_precision": 0.980110497237569,
"eval_recall": 0.9839156960621187,
"eval_runtime": 45.3618,
"eval_samples_per_second": 9.457,
"eval_steps_per_second": 1.587,
"step": 2670
},
{
"epoch": 8.96,
"eval_accuracy": 0.9971876575309756,
"eval_f1": 0.9817477876106194,
"eval_loss": 0.014163294807076454,
"eval_precision": 0.9790402647545504,
"eval_recall": 0.9844703272323905,
"eval_runtime": 45.3659,
"eval_samples_per_second": 9.456,
"eval_steps_per_second": 1.587,
"step": 2680
},
{
"epoch": 9.0,
"eval_accuracy": 0.9971345944655223,
"eval_f1": 0.9792932081722805,
"eval_loss": 0.01418287307024002,
"eval_precision": 0.9749862561847169,
"eval_recall": 0.9836383804769828,
"eval_runtime": 45.6259,
"eval_samples_per_second": 9.403,
"eval_steps_per_second": 1.578,
"step": 2690
},
{
"epoch": 9.03,
"eval_accuracy": 0.9971478602318856,
"eval_f1": 0.9809286898839138,
"eval_loss": 0.014496715739369392,
"eval_precision": 0.9776859504132231,
"eval_recall": 0.9841930116472546,
"eval_runtime": 45.371,
"eval_samples_per_second": 9.455,
"eval_steps_per_second": 1.587,
"step": 2700
},
{
"epoch": 9.06,
"eval_accuracy": 0.9970947971664323,
"eval_f1": 0.9802295036637633,
"eval_loss": 0.014654590748250484,
"eval_precision": 0.9773917838433968,
"eval_recall": 0.983083749306711,
"eval_runtime": 45.386,
"eval_samples_per_second": 9.452,
"eval_steps_per_second": 1.586,
"step": 2710
},
{
"epoch": 9.1,
"eval_accuracy": 0.9970682656337057,
"eval_f1": 0.9795410561238596,
"eval_loss": 0.014612732455134392,
"eval_precision": 0.9765711135611908,
"eval_recall": 0.9825291181364393,
"eval_runtime": 45.3853,
"eval_samples_per_second": 9.452,
"eval_steps_per_second": 1.586,
"step": 2720
},
{
"epoch": 9.13,
"eval_accuracy": 0.9970947971664323,
"eval_f1": 0.9796989366109652,
"eval_loss": 0.014642550610005856,
"eval_precision": 0.9757909215955983,
"eval_recall": 0.9836383804769828,
"eval_runtime": 45.583,
"eval_samples_per_second": 9.411,
"eval_steps_per_second": 1.58,
"step": 2730
},
{
"epoch": 9.16,
"eval_accuracy": 0.9970815314000689,
"eval_f1": 0.9792817679558011,
"eval_loss": 0.014756478369235992,
"eval_precision": 0.9755090809025867,
"eval_recall": 0.983083749306711,
"eval_runtime": 45.3958,
"eval_samples_per_second": 9.45,
"eval_steps_per_second": 1.586,
"step": 2740
},
{
"epoch": 9.2,
"eval_accuracy": 0.9971611259982489,
"eval_f1": 0.9781526548672567,
"eval_loss": 0.014514540322124958,
"eval_precision": 0.9754550468836183,
"eval_recall": 0.980865224625624,
"eval_runtime": 45.3479,
"eval_samples_per_second": 9.46,
"eval_steps_per_second": 1.588,
"step": 2750
},
{
"epoch": 9.23,
"eval_accuracy": 0.9971876575309756,
"eval_f1": 0.9780234968901176,
"eval_loss": 0.014607676304876804,
"eval_precision": 0.974924221548636,
"eval_recall": 0.9811425402107599,
"eval_runtime": 45.3679,
"eval_samples_per_second": 9.456,
"eval_steps_per_second": 1.587,
"step": 2760
},
{
"epoch": 9.26,
"eval_accuracy": 0.9971213286991589,
"eval_f1": 0.9799585348997927,
"eval_loss": 0.014230134896934032,
"eval_precision": 0.9768531275833563,
"eval_recall": 0.983083749306711,
"eval_runtime": 45.6606,
"eval_samples_per_second": 9.395,
"eval_steps_per_second": 1.577,
"step": 2770
},
{
"epoch": 9.3,
"eval_accuracy": 0.9970815314000689,
"eval_f1": 0.9814814814814814,
"eval_loss": 0.014004090800881386,
"eval_precision": 0.978236914600551,
"eval_recall": 0.9847476428175264,
"eval_runtime": 45.4655,
"eval_samples_per_second": 9.436,
"eval_steps_per_second": 1.584,
"step": 2780
},
{
"epoch": 9.33,
"eval_accuracy": 0.9971080629327956,
"eval_f1": 0.980359612724758,
"eval_loss": 0.013850794173777103,
"eval_precision": 0.977924944812362,
"eval_recall": 0.9828064337215752,
"eval_runtime": 45.4768,
"eval_samples_per_second": 9.433,
"eval_steps_per_second": 1.583,
"step": 2790
},
{
"epoch": 9.36,
"eval_accuracy": 0.9970549998673424,
"eval_f1": 0.9795070617557464,
"eval_loss": 0.014602423645555973,
"eval_precision": 0.9781526548672567,
"eval_recall": 0.980865224625624,
"eval_runtime": 46.0797,
"eval_samples_per_second": 9.31,
"eval_steps_per_second": 1.563,
"step": 2800
},
{
"epoch": 9.4,
"eval_accuracy": 0.9971345944655223,
"eval_f1": 0.9811738648947951,
"eval_loss": 0.01487213745713234,
"eval_precision": 0.9795467108899945,
"eval_recall": 0.9828064337215752,
"eval_runtime": 45.4621,
"eval_samples_per_second": 9.436,
"eval_steps_per_second": 1.584,
"step": 2810
},
{
"epoch": 9.43,
"eval_accuracy": 0.9971345944655223,
"eval_f1": 0.9789648491558263,
"eval_loss": 0.01481552142649889,
"eval_precision": 0.9770718232044199,
"eval_recall": 0.980865224625624,
"eval_runtime": 45.388,
"eval_samples_per_second": 9.452,
"eval_steps_per_second": 1.586,
"step": 2820
},
{
"epoch": 9.46,
"eval_accuracy": 0.9973601124936987,
"eval_f1": 0.9822763777346994,
"eval_loss": 0.01404637098312378,
"eval_precision": 0.9809181415929203,
"eval_recall": 0.9836383804769828,
"eval_runtime": 45.4647,
"eval_samples_per_second": 9.436,
"eval_steps_per_second": 1.584,
"step": 2830
},
{
"epoch": 9.5,
"eval_accuracy": 0.9969488737364357,
"eval_f1": 0.9712539925010416,
"eval_loss": 0.014825278893113136,
"eval_precision": 0.972739916550765,
"eval_recall": 0.9697726012201886,
"eval_runtime": 45.3762,
"eval_samples_per_second": 9.454,
"eval_steps_per_second": 1.587,
"step": 2840
},
{
"epoch": 9.53,
"eval_accuracy": 0.9964978376800828,
"eval_f1": 0.9593767390094602,
"eval_loss": 0.015539586544036865,
"eval_precision": 0.9625907314349526,
"eval_recall": 0.9561841375485303,
"eval_runtime": 45.6548,
"eval_samples_per_second": 9.397,
"eval_steps_per_second": 1.577,
"step": 2850
},
{
"epoch": 9.57,
"eval_accuracy": 0.9964978376800828,
"eval_f1": 0.9605006954102921,
"eval_loss": 0.016403868794441223,
"eval_precision": 0.9634486607142857,
"eval_recall": 0.9575707154742097,
"eval_runtime": 45.6372,
"eval_samples_per_second": 9.4,
"eval_steps_per_second": 1.578,
"step": 2860
},
{
"epoch": 9.6,
"eval_accuracy": 0.9970947971664323,
"eval_f1": 0.9791350006908941,
"eval_loss": 0.015382306650280952,
"eval_precision": 0.9757642522721014,
"eval_recall": 0.9825291181364393,
"eval_runtime": 45.4505,
"eval_samples_per_second": 9.439,
"eval_steps_per_second": 1.584,
"step": 2870
},
{
"epoch": 9.63,
"eval_accuracy": 0.9970947971664323,
"eval_f1": 0.9781647318960752,
"eval_loss": 0.015797466039657593,
"eval_precision": 0.974931129476584,
"eval_recall": 0.9814198557958957,
"eval_runtime": 45.42,
"eval_samples_per_second": 9.445,
"eval_steps_per_second": 1.585,
"step": 2880
},
{
"epoch": 9.67,
"eval_accuracy": 0.9969223422037091,
"eval_f1": 0.9791637919138954,
"eval_loss": 0.01617647521197796,
"eval_precision": 0.9744575666025818,
"eval_recall": 0.9839156960621187,
"eval_runtime": 45.4393,
"eval_samples_per_second": 9.441,
"eval_steps_per_second": 1.585,
"step": 2890
},
{
"epoch": 9.7,
"eval_accuracy": 0.9969223422037091,
"eval_f1": 0.978629532607197,
"eval_loss": 0.0164639949798584,
"eval_precision": 0.9731285988483686,
"eval_recall": 0.9841930116472546,
"eval_runtime": 45.4559,
"eval_samples_per_second": 9.438,
"eval_steps_per_second": 1.584,
"step": 2900
},
{
"epoch": 9.73,
"eval_accuracy": 0.9969886710355257,
"eval_f1": 0.9791810285399146,
"eval_loss": 0.016681063920259476,
"eval_precision": 0.9736769947902385,
"eval_recall": 0.9847476428175264,
"eval_runtime": 45.5001,
"eval_samples_per_second": 9.429,
"eval_steps_per_second": 1.582,
"step": 2910
},
{
"epoch": 9.77,
"eval_accuracy": 0.9969621395027991,
"eval_f1": 0.9808090570205716,
"eval_loss": 0.016886161640286446,
"eval_precision": 0.9766290899092659,
"eval_recall": 0.9850249584026622,
"eval_runtime": 45.9762,
"eval_samples_per_second": 9.331,
"eval_steps_per_second": 1.566,
"step": 2920
},
{
"epoch": 9.8,
"eval_accuracy": 0.9969621395027991,
"eval_f1": 0.9787351560342448,
"eval_loss": 0.017214221879839897,
"eval_precision": 0.9746974697469747,
"eval_recall": 0.9828064337215752,
"eval_runtime": 45.4576,
"eval_samples_per_second": 9.437,
"eval_steps_per_second": 1.584,
"step": 2930
},
{
"epoch": 9.83,
"eval_accuracy": 0.9971213286991589,
"eval_f1": 0.9816069699903195,
"eval_loss": 0.016497749835252762,
"eval_precision": 0.9790344827586207,
"eval_recall": 0.9841930116472546,
"eval_runtime": 45.3849,
"eval_samples_per_second": 9.452,
"eval_steps_per_second": 1.586,
"step": 2940
},
{
"epoch": 9.87,
"eval_accuracy": 0.9971876575309756,
"eval_f1": 0.9821650767316467,
"eval_loss": 0.01616404764354229,
"eval_precision": 0.9793217535153019,
"eval_recall": 0.9850249584026622,
"eval_runtime": 45.4779,
"eval_samples_per_second": 9.433,
"eval_steps_per_second": 1.583,
"step": 2950
},
{
"epoch": 9.9,
"eval_accuracy": 0.9970682656337057,
"eval_f1": 0.9790829754813686,
"eval_loss": 0.016479264944791794,
"eval_precision": 0.9781345142540825,
"eval_recall": 0.9800332778702163,
"eval_runtime": 45.8218,
"eval_samples_per_second": 9.362,
"eval_steps_per_second": 1.571,
"step": 2960
},
{
"epoch": 9.93,
"eval_accuracy": 0.9970947971664323,
"eval_f1": 0.980060924951537,
"eval_loss": 0.016018539667129517,
"eval_precision": 0.9787057522123894,
"eval_recall": 0.9814198557958957,
"eval_runtime": 45.4831,
"eval_samples_per_second": 9.432,
"eval_steps_per_second": 1.583,
"step": 2970
},
{
"epoch": 9.97,
"eval_accuracy": 0.9970284683346157,
"eval_f1": 0.9785348289710566,
"eval_loss": 0.016076229512691498,
"eval_precision": 0.9773167358229599,
"eval_recall": 0.9797559622850804,
"eval_runtime": 45.4108,
"eval_samples_per_second": 9.447,
"eval_steps_per_second": 1.586,
"step": 2980
},
{
"epoch": 10.0,
"eval_accuracy": 0.9970019368018891,
"eval_f1": 0.9797895902547065,
"eval_loss": 0.01618347130715847,
"eval_precision": 0.9781647318960752,
"eval_recall": 0.9814198557958957,
"eval_runtime": 45.4332,
"eval_samples_per_second": 9.442,
"eval_steps_per_second": 1.585,
"step": 2990
},
{
"epoch": 10.03,
"learning_rate": 7e-06,
"loss": 0.0046,
"step": 3000
},
{
"epoch": 10.03,
"eval_accuracy": 0.9970019368018891,
"eval_f1": 0.9791234619106871,
"eval_loss": 0.016251519322395325,
"eval_precision": 0.9762889440308795,
"eval_recall": 0.9819744869661675,
"eval_runtime": 45.7254,
"eval_samples_per_second": 9.382,
"eval_steps_per_second": 1.575,
"step": 3000
},
{
"epoch": 10.07,
"eval_accuracy": 0.997041734100979,
"eval_f1": 0.9806576402321082,
"eval_loss": 0.0159316323697567,
"eval_precision": 0.977147577092511,
"eval_recall": 0.9841930116472546,
"eval_runtime": 45.9937,
"eval_samples_per_second": 9.327,
"eval_steps_per_second": 1.565,
"step": 3010
},
{
"epoch": 10.1,
"eval_accuracy": 0.9970549998673424,
"eval_f1": 0.9798007747648035,
"eval_loss": 0.015915466472506523,
"eval_precision": 0.9776366648260629,
"eval_recall": 0.9819744869661675,
"eval_runtime": 45.3335,
"eval_samples_per_second": 9.463,
"eval_steps_per_second": 1.588,
"step": 3020
},
{
"epoch": 10.13,
"eval_accuracy": 0.9971478602318856,
"eval_f1": 0.9813200498132004,
"eval_loss": 0.015171729028224945,
"eval_precision": 0.9792874896437448,
"eval_recall": 0.9833610648918469,
"eval_runtime": 45.3108,
"eval_samples_per_second": 9.468,
"eval_steps_per_second": 1.589,
"step": 3030
},
{
"epoch": 10.17,
"eval_accuracy": 0.9966570268764426,
"eval_f1": 0.9667917187717104,
"eval_loss": 0.015076521784067154,
"eval_precision": 0.9688109161793372,
"eval_recall": 0.9647809206877427,
"eval_runtime": 45.3556,
"eval_samples_per_second": 9.459,
"eval_steps_per_second": 1.587,
"step": 3040
},
{
"epoch": 10.2,
"eval_accuracy": 0.9968427476055292,
"eval_f1": 0.9746922970543493,
"eval_loss": 0.014860566705465317,
"eval_precision": 0.9721379310344828,
"eval_recall": 0.9772601220188575,
"eval_runtime": 45.4321,
"eval_samples_per_second": 9.443,
"eval_steps_per_second": 1.585,
"step": 3050
},
{
"epoch": 10.23,
"eval_accuracy": 0.9970682656337057,
"eval_f1": 0.980110497237569,
"eval_loss": 0.014547467231750488,
"eval_precision": 0.9763346175013758,
"eval_recall": 0.9839156960621187,
"eval_runtime": 45.3097,
"eval_samples_per_second": 9.468,
"eval_steps_per_second": 1.589,
"step": 3060
},
{
"epoch": 10.27,
"eval_accuracy": 0.997041734100979,
"eval_f1": 0.9792760431058304,
"eval_loss": 0.014211696572601795,
"eval_precision": 0.9757709251101322,
"eval_recall": 0.9828064337215752,
"eval_runtime": 45.7056,
"eval_samples_per_second": 9.386,
"eval_steps_per_second": 1.575,
"step": 3070
},
{
"epoch": 10.3,
"eval_accuracy": 0.9970284683346157,
"eval_f1": 0.9788469514724182,
"eval_loss": 0.01424412615597248,
"eval_precision": 0.9760132340777502,
"eval_recall": 0.9816971713810316,
"eval_runtime": 45.6738,
"eval_samples_per_second": 9.393,
"eval_steps_per_second": 1.576,
"step": 3080
},
{
"epoch": 10.33,
"eval_accuracy": 0.9969356079700724,
"eval_f1": 0.9745293466223699,
"eval_loss": 0.014736946672201157,
"eval_precision": 0.9729132117191819,
"eval_recall": 0.9761508596783139,
"eval_runtime": 45.4811,
"eval_samples_per_second": 9.432,
"eval_steps_per_second": 1.583,
"step": 3090
},
{
"epoch": 10.37,
"eval_accuracy": 0.9970682656337057,
"eval_f1": 0.9801050013815971,
"eval_loss": 0.014717744663357735,
"eval_precision": 0.9765969162995595,
"eval_recall": 0.9836383804769828,
"eval_runtime": 45.415,
"eval_samples_per_second": 9.446,
"eval_steps_per_second": 1.585,
"step": 3100
},
{
"epoch": 10.4,
"eval_accuracy": 0.9971080629327956,
"eval_f1": 0.9810642709053213,
"eval_loss": 0.015054759569466114,
"eval_precision": 0.9779553596031965,
"eval_recall": 0.9841930116472546,
"eval_runtime": 45.7255,
"eval_samples_per_second": 9.382,
"eval_steps_per_second": 1.575,
"step": 3110
},
{
"epoch": 10.43,
"eval_accuracy": 0.9971080629327956,
"eval_f1": 0.9807931463313527,
"eval_loss": 0.01575205847620964,
"eval_precision": 0.9774166896171853,
"eval_recall": 0.9841930116472546,
"eval_runtime": 45.3913,
"eval_samples_per_second": 9.451,
"eval_steps_per_second": 1.586,
"step": 3120
},
{
"epoch": 10.47,
"eval_accuracy": 0.9968162160728026,
"eval_f1": 0.97202216066482,
"eval_loss": 0.015902305021882057,
"eval_precision": 0.9709463198671832,
"eval_recall": 0.9731003882418192,
"eval_runtime": 45.3669,
"eval_samples_per_second": 9.456,
"eval_steps_per_second": 1.587,
"step": 3130
},
{
"epoch": 10.5,
"eval_accuracy": 0.9966835584091693,
"eval_f1": 0.9686633388796451,
"eval_loss": 0.016264360398054123,
"eval_precision": 0.9686633388796451,
"eval_recall": 0.9686633388796451,
"eval_runtime": 45.3009,
"eval_samples_per_second": 9.47,
"eval_steps_per_second": 1.589,
"step": 3140
},
{
"epoch": 10.54,
"eval_accuracy": 0.9969621395027991,
"eval_f1": 0.9782698961937716,
"eval_loss": 0.015213034115731716,
"eval_precision": 0.9765128488532744,
"eval_recall": 0.9800332778702163,
"eval_runtime": 45.7467,
"eval_samples_per_second": 9.378,
"eval_steps_per_second": 1.574,
"step": 3150
},
{
"epoch": 10.57,
"eval_accuracy": 0.9969886710355257,
"eval_f1": 0.978693967902601,
"eval_loss": 0.014814727008342743,
"eval_precision": 0.9765323025952513,
"eval_recall": 0.980865224625624,
"eval_runtime": 45.3386,
"eval_samples_per_second": 9.462,
"eval_steps_per_second": 1.588,
"step": 3160
},
{
"epoch": 10.6,
"eval_accuracy": 0.9970549998673424,
"eval_f1": 0.9793828697938286,
"eval_loss": 0.015096531249582767,
"eval_precision": 0.9773543220104943,
"eval_recall": 0.9814198557958957,
"eval_runtime": 45.6502,
"eval_samples_per_second": 9.398,
"eval_steps_per_second": 1.577,
"step": 3170
},
{
"epoch": 10.64,
"eval_accuracy": 0.997041734100979,
"eval_f1": 0.9764998617638928,
"eval_loss": 0.015553129836916924,
"eval_precision": 0.9735391400220507,
"eval_recall": 0.9794786466999446,
"eval_runtime": 45.4708,
"eval_samples_per_second": 9.435,
"eval_steps_per_second": 1.583,
"step": 3180
},
{
"epoch": 10.67,
"eval_accuracy": 0.9970152025682524,
"eval_f1": 0.9774643992810729,
"eval_loss": 0.0158841609954834,
"eval_precision": 0.9746346843121036,
"eval_recall": 0.9803105934553522,
"eval_runtime": 45.4753,
"eval_samples_per_second": 9.434,
"eval_steps_per_second": 1.583,
"step": 3190
},
{
"epoch": 10.7,
"eval_accuracy": 0.9970682656337057,
"eval_f1": 0.9800884955752212,
"eval_loss": 0.016482515260577202,
"eval_precision": 0.9773855488141202,
"eval_recall": 0.9828064337215752,
"eval_runtime": 45.5435,
"eval_samples_per_second": 9.42,
"eval_steps_per_second": 1.581,
"step": 3200
},
{
"epoch": 10.74,
"eval_accuracy": 0.9970815314000689,
"eval_f1": 0.9795410561238596,
"eval_loss": 0.016413580626249313,
"eval_precision": 0.9765711135611908,
"eval_recall": 0.9825291181364393,
"eval_runtime": 45.616,
"eval_samples_per_second": 9.405,
"eval_steps_per_second": 1.578,
"step": 3210
},
{
"epoch": 10.77,
"eval_accuracy": 0.9969621395027991,
"eval_f1": 0.9791176877333702,
"eval_loss": 0.01622335985302925,
"eval_precision": 0.976551724137931,
"eval_recall": 0.9816971713810316,
"eval_runtime": 45.7676,
"eval_samples_per_second": 9.373,
"eval_steps_per_second": 1.573,
"step": 3220
},
{
"epoch": 10.8,
"eval_accuracy": 0.9969621395027991,
"eval_f1": 0.9803541781959049,
"eval_loss": 0.015803754329681396,
"eval_precision": 0.9781888459414688,
"eval_recall": 0.9825291181364393,
"eval_runtime": 45.7275,
"eval_samples_per_second": 9.382,
"eval_steps_per_second": 1.575,
"step": 3230
},
{
"epoch": 10.84,
"eval_accuracy": 0.9968958106709824,
"eval_f1": 0.9793828697938286,
"eval_loss": 0.015858009457588196,
"eval_precision": 0.9773543220104943,
"eval_recall": 0.9814198557958957,
"eval_runtime": 45.806,
"eval_samples_per_second": 9.366,
"eval_steps_per_second": 1.572,
"step": 3240
},
{
"epoch": 10.87,
"eval_accuracy": 0.9966968241755326,
"eval_f1": 0.9738263398421271,
"eval_loss": 0.016643954440951347,
"eval_precision": 0.9726141078838174,
"eval_recall": 0.9750415973377704,
"eval_runtime": 45.5359,
"eval_samples_per_second": 9.421,
"eval_steps_per_second": 1.581,
"step": 3250
},
{
"epoch": 10.9,
"eval_accuracy": 0.9969356079700724,
"eval_f1": 0.977728593166413,
"eval_loss": 0.016697365790605545,
"eval_precision": 0.9754347226055755,
"eval_recall": 0.9800332778702163,
"eval_runtime": 45.7975,
"eval_samples_per_second": 9.367,
"eval_steps_per_second": 1.572,
"step": 3260
},
{
"epoch": 10.94,
"eval_accuracy": 0.9969223422037091,
"eval_f1": 0.977297895902547,
"eval_loss": 0.016878845170140266,
"eval_precision": 0.9756771697070205,
"eval_recall": 0.9789240155296728,
"eval_runtime": 45.4916,
"eval_samples_per_second": 9.43,
"eval_steps_per_second": 1.583,
"step": 3270
},
{
"epoch": 10.97,
"eval_accuracy": 0.9969223422037091,
"eval_f1": 0.9780052566053397,
"eval_loss": 0.016803227365016937,
"eval_precision": 0.9757107369583218,
"eval_recall": 0.9803105934553522,
"eval_runtime": 45.574,
"eval_samples_per_second": 9.413,
"eval_steps_per_second": 1.58,
"step": 3280
},
{
"epoch": 11.0,
"eval_accuracy": 0.9969754052691624,
"eval_f1": 0.9811790755604761,
"eval_loss": 0.016553932800889015,
"eval_precision": 0.9792817679558011,
"eval_recall": 0.983083749306711,
"eval_runtime": 45.6533,
"eval_samples_per_second": 9.397,
"eval_steps_per_second": 1.577,
"step": 3290
},
{
"epoch": 11.04,
"eval_accuracy": 0.9971080629327956,
"eval_f1": 0.9845132743362832,
"eval_loss": 0.015565542504191399,
"eval_precision": 0.9817981246552675,
"eval_recall": 0.9872434830837493,
"eval_runtime": 45.6303,
"eval_samples_per_second": 9.402,
"eval_steps_per_second": 1.578,
"step": 3300
},
{
"epoch": 11.07,
"eval_accuracy": 0.9971345944655223,
"eval_f1": 0.9846579129232895,
"eval_loss": 0.014836783520877361,
"eval_precision": 0.981537613667677,
"eval_recall": 0.9877981142540211,
"eval_runtime": 45.5788,
"eval_samples_per_second": 9.412,
"eval_steps_per_second": 1.58,
"step": 3310
},
{
"epoch": 11.1,
"eval_accuracy": 0.9970549998673424,
"eval_f1": 0.9835521769177609,
"eval_loss": 0.015223776921629906,
"eval_precision": 0.9804353816478368,
"eval_recall": 0.9866888519134775,
"eval_runtime": 45.8006,
"eval_samples_per_second": 9.367,
"eval_steps_per_second": 1.572,
"step": 3320
},
{
"epoch": 11.14,
"eval_accuracy": 0.9969754052691624,
"eval_f1": 0.9827133176600746,
"eval_loss": 0.015493294224143028,
"eval_precision": 0.9801379310344828,
"eval_recall": 0.9853022739877981,
"eval_runtime": 46.0713,
"eval_samples_per_second": 9.312,
"eval_steps_per_second": 1.563,
"step": 3330
},
{
"epoch": 11.17,
"eval_accuracy": 0.9970019368018891,
"eval_f1": 0.9827180976081846,
"eval_loss": 0.014980579726397991,
"eval_precision": 0.9798731734215606,
"eval_recall": 0.985579589572934,
"eval_runtime": 45.5835,
"eval_samples_per_second": 9.411,
"eval_steps_per_second": 1.58,
"step": 3340
},
{
"epoch": 11.2,
"eval_accuracy": 0.9970682656337057,
"eval_f1": 0.9840918522617236,
"eval_loss": 0.014826910570263863,
"eval_precision": 0.9817830527187413,
"eval_recall": 0.9864115363283417,
"eval_runtime": 45.5689,
"eval_samples_per_second": 9.414,
"eval_steps_per_second": 1.58,
"step": 3350
},
{
"epoch": 11.24,
"eval_accuracy": 0.9970682656337057,
"eval_f1": 0.983402489626556,
"eval_loss": 0.015205192379653454,
"eval_precision": 0.9809602649006622,
"eval_recall": 0.9858569051580699,
"eval_runtime": 45.5733,
"eval_samples_per_second": 9.413,
"eval_steps_per_second": 1.58,
"step": 3360
},
{
"epoch": 11.27,
"eval_accuracy": 0.9970815314000689,
"eval_f1": 0.9835430784123911,
"eval_loss": 0.015277662314474583,
"eval_precision": 0.9809655172413793,
"eval_recall": 0.9861342207432058,
"eval_runtime": 45.8383,
"eval_samples_per_second": 9.359,
"eval_steps_per_second": 1.571,
"step": 3370
},
{
"epoch": 11.3,
"eval_accuracy": 0.9969090764373458,
"eval_f1": 0.9803921568627452,
"eval_loss": 0.015845883637666702,
"eval_precision": 0.9763476347634763,
"eval_recall": 0.9844703272323905,
"eval_runtime": 45.6768,
"eval_samples_per_second": 9.392,
"eval_steps_per_second": 1.576,
"step": 3380
},
{
"epoch": 11.34,
"eval_accuracy": 0.9968958106709824,
"eval_f1": 0.9808037563872393,
"eval_loss": 0.016353582963347435,
"eval_precision": 0.9768913342503439,
"eval_recall": 0.9847476428175264,
"eval_runtime": 45.6996,
"eval_samples_per_second": 9.387,
"eval_steps_per_second": 1.576,
"step": 3390
},
{
"epoch": 11.37,
"eval_accuracy": 0.9966835584091693,
"eval_f1": 0.9728832318760378,
"eval_loss": 0.01731358841061592,
"eval_precision": 0.9707344008834898,
"eval_recall": 0.9750415973377704,
"eval_runtime": 45.9308,
"eval_samples_per_second": 9.34,
"eval_steps_per_second": 1.568,
"step": 3400
},
{
"epoch": 11.4,
"eval_accuracy": 0.9969090764373458,
"eval_f1": 0.9787116394802323,
"eval_loss": 0.015837378799915314,
"eval_precision": 0.9757442116868799,
"eval_recall": 0.9816971713810316,
"eval_runtime": 45.8585,
"eval_samples_per_second": 9.355,
"eval_steps_per_second": 1.57,
"step": 3410
},
{
"epoch": 11.44,
"eval_accuracy": 0.9968029503064392,
"eval_f1": 0.9741534208707672,
"eval_loss": 0.0164649561047554,
"eval_precision": 0.9710664094791954,
"eval_recall": 0.9772601220188575,
"eval_runtime": 45.5679,
"eval_samples_per_second": 9.415,
"eval_steps_per_second": 1.58,
"step": 3420
},
{
"epoch": 11.47,
"eval_accuracy": 0.9964182430819029,
"eval_f1": 0.9646373595895161,
"eval_loss": 0.017043212428689003,
"eval_precision": 0.9647711511789182,
"eval_recall": 0.9645036051026068,
"eval_runtime": 45.6723,
"eval_samples_per_second": 9.393,
"eval_steps_per_second": 1.576,
"step": 3430
},
{
"epoch": 11.51,
"eval_accuracy": 0.9964182430819029,
"eval_f1": 0.9653643668606262,
"eval_loss": 0.017299339175224304,
"eval_precision": 0.964562569213732,
"eval_recall": 0.9661674986134221,
"eval_runtime": 46.0069,
"eval_samples_per_second": 9.325,
"eval_steps_per_second": 1.565,
"step": 3440
},
{
"epoch": 11.54,
"eval_accuracy": 0.9964713061473561,
"eval_f1": 0.968054211035818,
"eval_loss": 0.01724633388221264,
"eval_precision": 0.9655172413793104,
"eval_recall": 0.9706045479755963,
"eval_runtime": 45.6115,
"eval_samples_per_second": 9.406,
"eval_steps_per_second": 1.579,
"step": 3450
},
{
"epoch": 11.57,
"eval_accuracy": 0.9964845719137194,
"eval_f1": 0.9670724958494743,
"eval_loss": 0.017298314720392227,
"eval_precision": 0.9649364991717283,
"eval_recall": 0.9692179700499168,
"eval_runtime": 45.5306,
"eval_samples_per_second": 9.422,
"eval_steps_per_second": 1.581,
"step": 3460
},
{
"epoch": 11.61,
"eval_accuracy": 0.9967366214746226,
"eval_f1": 0.9718875502008032,
"eval_loss": 0.015642836689949036,
"eval_precision": 0.9706777316735823,
"eval_recall": 0.9731003882418192,
"eval_runtime": 46.9214,
"eval_samples_per_second": 9.143,
"eval_steps_per_second": 1.534,
"step": 3470
},
{
"epoch": 11.64,
"eval_accuracy": 0.9969356079700724,
"eval_f1": 0.9768986028496335,
"eval_loss": 0.015028764493763447,
"eval_precision": 0.9746066795473365,
"eval_recall": 0.9792013311148087,
"eval_runtime": 45.682,
"eval_samples_per_second": 9.391,
"eval_steps_per_second": 1.576,
"step": 3480
},
{
"epoch": 11.67,
"eval_accuracy": 0.9969621395027991,
"eval_f1": 0.9775747508305648,
"eval_loss": 0.015305536799132824,
"eval_precision": 0.9759535655058044,
"eval_recall": 0.9792013311148087,
"eval_runtime": 45.8278,
"eval_samples_per_second": 9.361,
"eval_steps_per_second": 1.571,
"step": 3490
},
{
"epoch": 11.71,
"learning_rate": 6.5000000000000004e-06,
"loss": 0.0042,
"step": 3500
},
{
"epoch": 11.71,
"eval_accuracy": 0.9969754052691624,
"eval_f1": 0.9772853185595569,
"eval_loss": 0.015260215848684311,
"eval_precision": 0.9762036524626453,
"eval_recall": 0.978369384359401,
"eval_runtime": 45.5813,
"eval_samples_per_second": 9.412,
"eval_steps_per_second": 1.58,
"step": 3500
},
{
"epoch": 11.74,
"eval_accuracy": 0.9971213286991589,
"eval_f1": 0.9785407725321887,
"eval_loss": 0.015263444744050503,
"eval_precision": 0.9770528061929776,
"eval_recall": 0.9800332778702163,
"eval_runtime": 46.1625,
"eval_samples_per_second": 9.293,
"eval_steps_per_second": 1.56,
"step": 3510
},
{
"epoch": 11.77,
"eval_accuracy": 0.9970947971664323,
"eval_f1": 0.9793771626297577,
"eval_loss": 0.01575734093785286,
"eval_precision": 0.9776181265542968,
"eval_recall": 0.9811425402107599,
"eval_runtime": 45.6916,
"eval_samples_per_second": 9.389,
"eval_steps_per_second": 1.576,
"step": 3520
},
{
"epoch": 11.81,
"eval_accuracy": 0.9970682656337057,
"eval_f1": 0.9803541781959049,
"eval_loss": 0.016223162412643433,
"eval_precision": 0.9781888459414688,
"eval_recall": 0.9825291181364393,
"eval_runtime": 45.6681,
"eval_samples_per_second": 9.394,
"eval_steps_per_second": 1.577,
"step": 3530
},
{
"epoch": 11.84,
"eval_accuracy": 0.9970152025682524,
"eval_f1": 0.9794056668970283,
"eval_loss": 0.016862712800502777,
"eval_precision": 0.9763020115734362,
"eval_recall": 0.9825291181364393,
"eval_runtime": 45.8595,
"eval_samples_per_second": 9.355,
"eval_steps_per_second": 1.57,
"step": 3540
},
{
"epoch": 11.87,
"eval_accuracy": 0.9969754052691624,
"eval_f1": 0.9781526548672567,
"eval_loss": 0.016722770407795906,
"eval_precision": 0.9754550468836183,
"eval_recall": 0.980865224625624,
"eval_runtime": 45.6514,
"eval_samples_per_second": 9.397,
"eval_steps_per_second": 1.577,
"step": 3550
},
{
"epoch": 11.91,
"eval_accuracy": 0.997041734100979,
"eval_f1": 0.9792473713337022,
"eval_loss": 0.01629817485809326,
"eval_precision": 0.9770844837106571,
"eval_recall": 0.9814198557958957,
"eval_runtime": 45.6901,
"eval_samples_per_second": 9.389,
"eval_steps_per_second": 1.576,
"step": 3560
},
{
"epoch": 11.94,
"eval_accuracy": 0.9970152025682524,
"eval_f1": 0.9795240730492528,
"eval_loss": 0.01616574078798294,
"eval_precision": 0.97736057426836,
"eval_recall": 0.9816971713810316,
"eval_runtime": 46.0985,
"eval_samples_per_second": 9.306,
"eval_steps_per_second": 1.562,
"step": 3570
},
{
"epoch": 11.97,
"eval_accuracy": 0.9969488737364357,
"eval_f1": 0.9778761061946902,
"eval_loss": 0.01619311049580574,
"eval_precision": 0.9751792608935466,
"eval_recall": 0.9805879090404881,
"eval_runtime": 45.9524,
"eval_samples_per_second": 9.336,
"eval_steps_per_second": 1.567,
"step": 3580
},
{
"epoch": 12.01,
"eval_accuracy": 0.9969886710355257,
"eval_f1": 0.9785822854774078,
"eval_loss": 0.01636885292828083,
"eval_precision": 0.97521343982374,
"eval_recall": 0.9819744869661675,
"eval_runtime": 45.6302,
"eval_samples_per_second": 9.402,
"eval_steps_per_second": 1.578,
"step": 3590
},
{
"epoch": 12.04,
"eval_accuracy": 0.9969886710355257,
"eval_f1": 0.9784470848300635,
"eval_loss": 0.01634366624057293,
"eval_precision": 0.9749449339207048,
"eval_recall": 0.9819744869661675,
"eval_runtime": 45.6457,
"eval_samples_per_second": 9.398,
"eval_steps_per_second": 1.577,
"step": 3600
},
{
"epoch": 12.07,
"eval_accuracy": 0.9969621395027991,
"eval_f1": 0.9776119402985075,
"eval_loss": 0.016408545896410942,
"eval_precision": 0.9743801652892562,
"eval_recall": 0.980865224625624,
"eval_runtime": 46.0467,
"eval_samples_per_second": 9.317,
"eval_steps_per_second": 1.564,
"step": 3610
},
{
"epoch": 12.11,
"eval_accuracy": 0.9971345944655223,
"eval_f1": 0.9778822228366049,
"eval_loss": 0.01554455328732729,
"eval_precision": 0.9749173098125689,
"eval_recall": 0.980865224625624,
"eval_runtime": 45.8672,
"eval_samples_per_second": 9.353,
"eval_steps_per_second": 1.57,
"step": 3620
},
{
"epoch": 12.14,
"eval_accuracy": 0.9971743917646122,
"eval_f1": 0.9781284606866002,
"eval_loss": 0.015367398969829082,
"eval_precision": 0.9765063571033721,
"eval_recall": 0.9797559622850804,
"eval_runtime": 45.8306,
"eval_samples_per_second": 9.361,
"eval_steps_per_second": 1.571,
"step": 3630
},
{
"epoch": 12.17,
"eval_accuracy": 0.9970815314000689,
"eval_f1": 0.9784172661870504,
"eval_loss": 0.016077237203717232,
"eval_precision": 0.9762562120375483,
"eval_recall": 0.9805879090404881,
"eval_runtime": 45.7148,
"eval_samples_per_second": 9.384,
"eval_steps_per_second": 1.575,
"step": 3640
},
{
"epoch": 12.21,
"eval_accuracy": 0.9968825449046191,
"eval_f1": 0.9757986447241046,
"eval_loss": 0.016824740916490555,
"eval_precision": 0.9732413793103448,
"eval_recall": 0.978369384359401,
"eval_runtime": 46.1214,
"eval_samples_per_second": 9.302,
"eval_steps_per_second": 1.561,
"step": 3650
},
{
"epoch": 12.24,
"eval_accuracy": 0.9969223422037091,
"eval_f1": 0.978146611341632,
"eval_loss": 0.016822459176182747,
"eval_precision": 0.9757174392935982,
"eval_recall": 0.9805879090404881,
"eval_runtime": 45.7927,
"eval_samples_per_second": 9.368,
"eval_steps_per_second": 1.572,
"step": 3660
},
{
"epoch": 12.27,
"eval_accuracy": 0.9968825449046191,
"eval_f1": 0.9792588495575221,
"eval_loss": 0.01815040595829487,
"eval_precision": 0.9765581908439052,
"eval_recall": 0.9819744869661675,
"eval_runtime": 45.8912,
"eval_samples_per_second": 9.348,
"eval_steps_per_second": 1.569,
"step": 3670
},
{
"epoch": 12.31,
"eval_accuracy": 0.9967764187737126,
"eval_f1": 0.9788586430841509,
"eval_loss": 0.01881832629442215,
"eval_precision": 0.9754888460479206,
"eval_recall": 0.9822518025513034,
"eval_runtime": 46.0893,
"eval_samples_per_second": 9.308,
"eval_steps_per_second": 1.562,
"step": 3680
},
{
"epoch": 12.34,
"eval_accuracy": 0.9968294818391659,
"eval_f1": 0.976892209768922,
"eval_loss": 0.017492154613137245,
"eval_precision": 0.9748688207677437,
"eval_recall": 0.9789240155296728,
"eval_runtime": 45.8024,
"eval_samples_per_second": 9.366,
"eval_steps_per_second": 1.572,
"step": 3690
},
{
"epoch": 12.37,
"eval_accuracy": 0.9966172295773527,
"eval_f1": 0.9710806697108068,
"eval_loss": 0.018154501914978027,
"eval_precision": 0.9690693178679922,
"eval_recall": 0.9731003882418192,
"eval_runtime": 46.0834,
"eval_samples_per_second": 9.309,
"eval_steps_per_second": 1.562,
"step": 3700
},
{
"epoch": 12.41,
"eval_accuracy": 0.9962457881191796,
"eval_f1": 0.9614745011086475,
"eval_loss": 0.01924285851418972,
"eval_precision": 0.9609418282548476,
"eval_recall": 0.9620077648363838,
"eval_runtime": 45.696,
"eval_samples_per_second": 9.388,
"eval_steps_per_second": 1.576,
"step": 3710
},
{
"epoch": 12.44,
"eval_accuracy": 0.9964580403809928,
"eval_f1": 0.9651259341267644,
"eval_loss": 0.017841314896941185,
"eval_precision": 0.9632596685082873,
"eval_recall": 0.9669994453688298,
"eval_runtime": 45.9939,
"eval_samples_per_second": 9.327,
"eval_steps_per_second": 1.565,
"step": 3720
},
{
"epoch": 12.47,
"eval_accuracy": 0.9966304953437161,
"eval_f1": 0.970962389380531,
"eval_loss": 0.016754455864429474,
"eval_precision": 0.968284611141754,
"eval_recall": 0.973655019412091,
"eval_runtime": 45.8171,
"eval_samples_per_second": 9.363,
"eval_steps_per_second": 1.571,
"step": 3730
},
{
"epoch": 12.51,
"eval_accuracy": 0.9968294818391659,
"eval_f1": 0.9774269491760144,
"eval_loss": 0.015923812985420227,
"eval_precision": 0.9762102351313969,
"eval_recall": 0.9786466999445369,
"eval_runtime": 45.7801,
"eval_samples_per_second": 9.371,
"eval_steps_per_second": 1.573,
"step": 3740
},
{
"epoch": 12.54,
"eval_accuracy": 0.9968825449046191,
"eval_f1": 0.9772916089725838,
"eval_loss": 0.015936698764562607,
"eval_precision": 0.9759402654867256,
"eval_recall": 0.9786466999445369,
"eval_runtime": 45.9975,
"eval_samples_per_second": 9.327,
"eval_steps_per_second": 1.565,
"step": 3750
},
{
"epoch": 12.58,
"eval_accuracy": 0.9968029503064392,
"eval_f1": 0.9736623232603271,
"eval_loss": 0.016157541424036026,
"eval_precision": 0.9733924611973392,
"eval_recall": 0.9739323349972269,
"eval_runtime": 45.7117,
"eval_samples_per_second": 9.385,
"eval_steps_per_second": 1.575,
"step": 3760
},
{
"epoch": 12.61,
"eval_accuracy": 0.9967366214746226,
"eval_f1": 0.9694117647058823,
"eval_loss": 0.01580197736620903,
"eval_precision": 0.9676706272450953,
"eval_recall": 0.971159179145868,
"eval_runtime": 45.5828,
"eval_samples_per_second": 9.411,
"eval_steps_per_second": 1.58,
"step": 3770
},
{
"epoch": 12.64,
"eval_accuracy": 0.9969090764373458,
"eval_f1": 0.971460238293156,
"eval_loss": 0.015100532211363316,
"eval_precision": 0.9706533776301218,
"eval_recall": 0.9722684414864116,
"eval_runtime": 45.7142,
"eval_samples_per_second": 9.384,
"eval_steps_per_second": 1.575,
"step": 3780
},
{
"epoch": 12.68,
"eval_accuracy": 0.9969488737364357,
"eval_f1": 0.9725609756097561,
"eval_loss": 0.015240387991070747,
"eval_precision": 0.97202216066482,
"eval_recall": 0.9731003882418192,
"eval_runtime": 46.103,
"eval_samples_per_second": 9.305,
"eval_steps_per_second": 1.562,
"step": 3790
},
{
"epoch": 12.71,
"eval_accuracy": 0.9970284683346157,
"eval_f1": 0.9779991697799916,
"eval_loss": 0.015490233898162842,
"eval_precision": 0.975973487986744,
"eval_recall": 0.9800332778702163,
"eval_runtime": 45.7054,
"eval_samples_per_second": 9.386,
"eval_steps_per_second": 1.575,
"step": 3800
},
{
"epoch": 12.74,
"eval_accuracy": 0.9971213286991589,
"eval_f1": 0.980060924951537,
"eval_loss": 0.014931376092135906,
"eval_precision": 0.9787057522123894,
"eval_recall": 0.9814198557958957,
"eval_runtime": 45.8361,
"eval_samples_per_second": 9.359,
"eval_steps_per_second": 1.571,
"step": 3810
},
{
"epoch": 12.78,
"eval_accuracy": 0.9970947971664323,
"eval_f1": 0.9769764216366158,
"eval_loss": 0.013774119317531586,
"eval_precision": 0.9772475027746947,
"eval_recall": 0.9767054908485857,
"eval_runtime": 46.4293,
"eval_samples_per_second": 9.24,
"eval_steps_per_second": 1.551,
"step": 3820
},
{
"epoch": 12.81,
"eval_accuracy": 0.9971611259982489,
"eval_f1": 0.9775436650956474,
"eval_loss": 0.01355548482388258,
"eval_precision": 0.9772727272727273,
"eval_recall": 0.9778147531891292,
"eval_runtime": 45.7415,
"eval_samples_per_second": 9.379,
"eval_steps_per_second": 1.574,
"step": 3830
},
{
"epoch": 12.84,
"eval_accuracy": 0.9973335809609721,
"eval_f1": 0.9824124082537044,
"eval_loss": 0.013703616335988045,
"eval_precision": 0.9811894882434301,
"eval_recall": 0.9836383804769828,
"eval_runtime": 45.73,
"eval_samples_per_second": 9.381,
"eval_steps_per_second": 1.574,
"step": 3840
},
{
"epoch": 12.88,
"eval_accuracy": 0.9973601124936987,
"eval_f1": 0.9812102790826194,
"eval_loss": 0.014531377702951431,
"eval_precision": 0.9776982378854625,
"eval_recall": 0.9847476428175264,
"eval_runtime": 45.7852,
"eval_samples_per_second": 9.37,
"eval_steps_per_second": 1.573,
"step": 3850
},
{
"epoch": 12.91,
"eval_accuracy": 0.9968427476055292,
"eval_f1": 0.977526540741762,
"eval_loss": 0.016427284106612206,
"eval_precision": 0.9720318069646284,
"eval_recall": 0.983083749306711,
"eval_runtime": 45.8438,
"eval_samples_per_second": 9.358,
"eval_steps_per_second": 1.571,
"step": 3860
},
{
"epoch": 12.94,
"eval_accuracy": 0.9960202700910031,
"eval_f1": 0.9653931339977851,
"eval_loss": 0.021676059812307358,
"eval_precision": 0.9637921503593145,
"eval_recall": 0.9669994453688298,
"eval_runtime": 45.7888,
"eval_samples_per_second": 9.369,
"eval_steps_per_second": 1.572,
"step": 3870
},
{
"epoch": 12.98,
"eval_accuracy": 0.9967498872409859,
"eval_f1": 0.9777900400055181,
"eval_loss": 0.018003830686211586,
"eval_precision": 0.9728245951139171,
"eval_recall": 0.9828064337215752,
"eval_runtime": 45.7325,
"eval_samples_per_second": 9.381,
"eval_steps_per_second": 1.574,
"step": 3880
},
{
"epoch": 13.01,
"eval_accuracy": 0.9968692791382558,
"eval_f1": 0.977667493796526,
"eval_loss": 0.01754719577729702,
"eval_precision": 0.9720394736842105,
"eval_recall": 0.9833610648918469,
"eval_runtime": 46.1857,
"eval_samples_per_second": 9.289,
"eval_steps_per_second": 1.559,
"step": 3890
},
{
"epoch": 13.04,
"eval_accuracy": 0.9967631530073492,
"eval_f1": 0.9739274382673472,
"eval_loss": 0.01792616955935955,
"eval_precision": 0.96898160856437,
"eval_recall": 0.9789240155296728,
"eval_runtime": 45.7326,
"eval_samples_per_second": 9.381,
"eval_steps_per_second": 1.574,
"step": 3900
},
{
"epoch": 13.08,
"eval_accuracy": 0.9967631530073492,
"eval_f1": 0.9729431253451133,
"eval_loss": 0.017918290570378304,
"eval_precision": 0.9686641011544805,
"eval_recall": 0.9772601220188575,
"eval_runtime": 46.0978,
"eval_samples_per_second": 9.306,
"eval_steps_per_second": 1.562,
"step": 3910
},
{
"epoch": 13.11,
"eval_accuracy": 0.9968692791382558,
"eval_f1": 0.9765323025952513,
"eval_loss": 0.017354754731059074,
"eval_precision": 0.9722374931280924,
"eval_recall": 0.980865224625624,
"eval_runtime": 46.21,
"eval_samples_per_second": 9.284,
"eval_steps_per_second": 1.558,
"step": 3920
},
{
"epoch": 13.14,
"eval_accuracy": 0.9969356079700724,
"eval_f1": 0.9775017253278124,
"eval_loss": 0.015932898968458176,
"eval_precision": 0.9730695245946689,
"eval_recall": 0.9819744869661675,
"eval_runtime": 45.7375,
"eval_samples_per_second": 9.38,
"eval_steps_per_second": 1.574,
"step": 3930
},
{
"epoch": 13.18,
"eval_accuracy": 0.9969090764373458,
"eval_f1": 0.9779005524861878,
"eval_loss": 0.015960365533828735,
"eval_precision": 0.9741331865712713,
"eval_recall": 0.9816971713810316,
"eval_runtime": 45.8882,
"eval_samples_per_second": 9.349,
"eval_steps_per_second": 1.569,
"step": 3940
},
{
"epoch": 13.21,
"eval_accuracy": 0.9967498872409859,
"eval_f1": 0.9737569060773481,
"eval_loss": 0.017051612958312035,
"eval_precision": 0.9700055035773253,
"eval_recall": 0.9775374376039934,
"eval_runtime": 45.8012,
"eval_samples_per_second": 9.367,
"eval_steps_per_second": 1.572,
"step": 3950
},
{
"epoch": 13.24,
"eval_accuracy": 0.9966702926428059,
"eval_f1": 0.9723527785457561,
"eval_loss": 0.01766437292098999,
"eval_precision": 0.9694046306504961,
"eval_recall": 0.9753189129229063,
"eval_runtime": 45.8759,
"eval_samples_per_second": 9.351,
"eval_steps_per_second": 1.569,
"step": 3960
},
{
"epoch": 13.28,
"eval_accuracy": 0.9966570268764426,
"eval_f1": 0.9727411097274111,
"eval_loss": 0.01822058856487274,
"eval_precision": 0.9707263186964927,
"eval_recall": 0.9747642817526345,
"eval_runtime": 45.8529,
"eval_samples_per_second": 9.356,
"eval_steps_per_second": 1.57,
"step": 3970
},
{
"epoch": 13.31,
"eval_accuracy": 0.9966304953437161,
"eval_f1": 0.9724872113922302,
"eval_loss": 0.01849460043013096,
"eval_precision": 0.9696719051557762,
"eval_recall": 0.9753189129229063,
"eval_runtime": 45.7611,
"eval_samples_per_second": 9.375,
"eval_steps_per_second": 1.573,
"step": 3980
},
{
"epoch": 13.34,
"eval_accuracy": 0.9968427476055292,
"eval_f1": 0.9780417069465543,
"eval_loss": 0.017539281398057938,
"eval_precision": 0.9741403026134801,
"eval_recall": 0.9819744869661675,
"eval_runtime": 46.0339,
"eval_samples_per_second": 9.319,
"eval_steps_per_second": 1.564,
"step": 3990
},
{
"epoch": 13.38,
"learning_rate": 6e-06,
"loss": 0.0037,
"step": 4000
},
{
"epoch": 13.38,
"eval_accuracy": 0.9968958106709824,
"eval_f1": 0.9792874896437448,
"eval_loss": 0.017371075227856636,
"eval_precision": 0.9752475247524752,
"eval_recall": 0.9833610648918469,
"eval_runtime": 45.7746,
"eval_samples_per_second": 9.372,
"eval_steps_per_second": 1.573,
"step": 4000
}
],
"max_steps": 10000,
"num_train_epochs": 34,
"total_flos": 6370581676032000.0,
"trial_name": null,
"trial_params": null
}