bloomz-3b-mixed-detector / trainer_state.json
andreas122001's picture
Upload 12 files
c0e95a4
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 1.0,
"global_step": 2188,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.0,
"learning_rate": 4.997714808043876e-05,
"loss": 5.4892,
"step": 1
},
{
"epoch": 0.02,
"learning_rate": 4.9017367458866546e-05,
"loss": 3.0607,
"step": 43
},
{
"epoch": 0.02,
"eval_accuracy": 0.8749333333333333,
"eval_f1": 0.8729341641831482,
"eval_loss": 2.1355409622192383,
"eval_precision": 0.887114537444934,
"eval_recall": 0.8592,
"eval_runtime": 581.4545,
"eval_samples_per_second": 6.449,
"eval_steps_per_second": 0.807,
"step": 43
},
{
"epoch": 0.04,
"learning_rate": 4.8034734917733096e-05,
"loss": 1.6864,
"step": 86
},
{
"epoch": 0.04,
"eval_accuracy": 0.8901333333333333,
"eval_f1": 0.8857459789240155,
"eval_loss": 1.632243275642395,
"eval_precision": 0.9225880993645291,
"eval_recall": 0.8517333333333333,
"eval_runtime": 581.1642,
"eval_samples_per_second": 6.453,
"eval_steps_per_second": 0.807,
"step": 86
},
{
"epoch": 0.06,
"learning_rate": 4.705210237659964e-05,
"loss": 1.0658,
"step": 129
},
{
"epoch": 0.06,
"eval_accuracy": 0.904,
"eval_f1": 0.9061032863849765,
"eval_loss": 0.3131539821624756,
"eval_precision": 0.886676875957121,
"eval_recall": 0.9264,
"eval_runtime": 580.6614,
"eval_samples_per_second": 6.458,
"eval_steps_per_second": 0.808,
"step": 129
},
{
"epoch": 0.08,
"learning_rate": 4.606946983546618e-05,
"loss": 0.4275,
"step": 172
},
{
"epoch": 0.08,
"eval_accuracy": 0.8874666666666666,
"eval_f1": 0.8765359859566997,
"eval_loss": 1.6054295301437378,
"eval_precision": 0.9708360337005832,
"eval_recall": 0.7989333333333334,
"eval_runtime": 580.8161,
"eval_samples_per_second": 6.456,
"eval_steps_per_second": 0.807,
"step": 172
},
{
"epoch": 0.1,
"learning_rate": 4.5086837294332726e-05,
"loss": 0.5456,
"step": 215
},
{
"epoch": 0.1,
"eval_accuracy": 0.9170666666666667,
"eval_f1": 0.9218789248932429,
"eval_loss": 0.41803765296936035,
"eval_precision": 0.8713200379867047,
"eval_recall": 0.9786666666666667,
"eval_runtime": 580.4549,
"eval_samples_per_second": 6.46,
"eval_steps_per_second": 0.808,
"step": 215
},
{
"epoch": 0.12,
"learning_rate": 4.410420475319927e-05,
"loss": 0.6111,
"step": 258
},
{
"epoch": 0.12,
"eval_accuracy": 0.8786666666666667,
"eval_f1": 0.8626622396619378,
"eval_loss": 0.32219210267066956,
"eval_precision": 0.9937413073713491,
"eval_recall": 0.7621333333333333,
"eval_runtime": 584.0808,
"eval_samples_per_second": 6.42,
"eval_steps_per_second": 0.803,
"step": 258
},
{
"epoch": 0.14,
"learning_rate": 4.312157221206581e-05,
"loss": 0.7106,
"step": 301
},
{
"epoch": 0.14,
"eval_accuracy": 0.9274666666666667,
"eval_f1": 0.9221967963386728,
"eval_loss": 0.5022754073143005,
"eval_precision": 0.9944478716841456,
"eval_recall": 0.8597333333333333,
"eval_runtime": 581.6225,
"eval_samples_per_second": 6.447,
"eval_steps_per_second": 0.806,
"step": 301
},
{
"epoch": 0.16,
"learning_rate": 4.213893967093236e-05,
"loss": 0.2426,
"step": 344
},
{
"epoch": 0.16,
"eval_accuracy": 0.9586666666666667,
"eval_f1": 0.9586997069011457,
"eval_loss": 0.16574496030807495,
"eval_precision": 0.9579339723109691,
"eval_recall": 0.9594666666666667,
"eval_runtime": 580.7975,
"eval_samples_per_second": 6.457,
"eval_steps_per_second": 0.808,
"step": 344
},
{
"epoch": 0.18,
"learning_rate": 4.1156307129798905e-05,
"loss": 0.3958,
"step": 387
},
{
"epoch": 0.18,
"eval_accuracy": 0.9554666666666667,
"eval_f1": 0.9535724214623298,
"eval_loss": 0.24226774275302887,
"eval_precision": 0.9959349593495935,
"eval_recall": 0.9146666666666666,
"eval_runtime": 581.1794,
"eval_samples_per_second": 6.452,
"eval_steps_per_second": 0.807,
"step": 387
},
{
"epoch": 0.2,
"learning_rate": 4.017367458866545e-05,
"loss": 0.4259,
"step": 430
},
{
"epoch": 0.2,
"eval_accuracy": 0.9448,
"eval_f1": 0.9449614464238233,
"eval_loss": 0.3525341749191284,
"eval_precision": 0.9422057264050901,
"eval_recall": 0.9477333333333333,
"eval_runtime": 580.7809,
"eval_samples_per_second": 6.457,
"eval_steps_per_second": 0.808,
"step": 430
},
{
"epoch": 0.22,
"learning_rate": 3.919104204753199e-05,
"loss": 0.2217,
"step": 473
},
{
"epoch": 0.22,
"eval_accuracy": 0.9549333333333333,
"eval_f1": 0.9531466592736346,
"eval_loss": 0.22800709307193756,
"eval_precision": 0.9924942263279446,
"eval_recall": 0.9168,
"eval_runtime": 580.8019,
"eval_samples_per_second": 6.457,
"eval_steps_per_second": 0.808,
"step": 473
},
{
"epoch": 0.24,
"learning_rate": 3.820840950639854e-05,
"loss": 0.1741,
"step": 516
},
{
"epoch": 0.24,
"eval_accuracy": 0.9682666666666667,
"eval_f1": 0.9673525377229081,
"eval_loss": 0.15350370109081268,
"eval_precision": 0.996045197740113,
"eval_recall": 0.9402666666666667,
"eval_runtime": 584.2385,
"eval_samples_per_second": 6.419,
"eval_steps_per_second": 0.803,
"step": 516
},
{
"epoch": 0.26,
"learning_rate": 3.7225776965265085e-05,
"loss": 0.1731,
"step": 559
},
{
"epoch": 0.26,
"eval_accuracy": 0.9648,
"eval_f1": 0.9636763896532745,
"eval_loss": 0.29772499203681946,
"eval_precision": 0.9954519613416714,
"eval_recall": 0.9338666666666666,
"eval_runtime": 580.9188,
"eval_samples_per_second": 6.455,
"eval_steps_per_second": 0.807,
"step": 559
},
{
"epoch": 0.28,
"learning_rate": 3.624314442413163e-05,
"loss": 0.1857,
"step": 602
},
{
"epoch": 0.28,
"eval_accuracy": 0.9826666666666667,
"eval_f1": 0.9826527888977848,
"eval_loss": 0.16285915672779083,
"eval_precision": 0.9834401709401709,
"eval_recall": 0.9818666666666667,
"eval_runtime": 581.4605,
"eval_samples_per_second": 6.449,
"eval_steps_per_second": 0.807,
"step": 602
},
{
"epoch": 0.29,
"learning_rate": 3.526051188299818e-05,
"loss": 0.241,
"step": 645
},
{
"epoch": 0.29,
"eval_accuracy": 0.9677333333333333,
"eval_f1": 0.9681997371879106,
"eval_loss": 0.30683064460754395,
"eval_precision": 0.9544041450777202,
"eval_recall": 0.9824,
"eval_runtime": 580.3999,
"eval_samples_per_second": 6.461,
"eval_steps_per_second": 0.808,
"step": 645
},
{
"epoch": 0.31,
"learning_rate": 3.4277879341864715e-05,
"loss": 0.1674,
"step": 688
},
{
"epoch": 0.31,
"eval_accuracy": 0.9050666666666667,
"eval_f1": 0.9130434782608695,
"eval_loss": 0.5339795351028442,
"eval_precision": 0.8422712933753943,
"eval_recall": 0.9968,
"eval_runtime": 580.4617,
"eval_samples_per_second": 6.46,
"eval_steps_per_second": 0.808,
"step": 688
},
{
"epoch": 0.33,
"learning_rate": 3.329524680073126e-05,
"loss": 0.1452,
"step": 731
},
{
"epoch": 0.33,
"eval_accuracy": 0.9754666666666667,
"eval_f1": 0.9756871035940803,
"eval_loss": 0.1770327091217041,
"eval_precision": 0.9669984284965951,
"eval_recall": 0.9845333333333334,
"eval_runtime": 581.5384,
"eval_samples_per_second": 6.448,
"eval_steps_per_second": 0.806,
"step": 731
},
{
"epoch": 0.35,
"learning_rate": 3.231261425959781e-05,
"loss": 0.2261,
"step": 774
},
{
"epoch": 0.35,
"eval_accuracy": 0.9714666666666667,
"eval_f1": 0.97192337969037,
"eval_loss": 0.2083805948495865,
"eval_precision": 0.9566115702479339,
"eval_recall": 0.9877333333333334,
"eval_runtime": 582.4902,
"eval_samples_per_second": 6.438,
"eval_steps_per_second": 0.805,
"step": 774
},
{
"epoch": 0.37,
"learning_rate": 3.132998171846435e-05,
"loss": 0.1849,
"step": 817
},
{
"epoch": 0.37,
"eval_accuracy": 0.9765333333333334,
"eval_f1": 0.9763186221743809,
"eval_loss": 0.12196581810712814,
"eval_precision": 0.9853340575774036,
"eval_recall": 0.9674666666666667,
"eval_runtime": 578.7143,
"eval_samples_per_second": 6.48,
"eval_steps_per_second": 0.81,
"step": 817
},
{
"epoch": 0.39,
"learning_rate": 3.03473491773309e-05,
"loss": 0.1237,
"step": 860
},
{
"epoch": 0.39,
"eval_accuracy": 0.9693333333333334,
"eval_f1": 0.9700286682303884,
"eval_loss": 0.2138151079416275,
"eval_precision": 0.9485219164118247,
"eval_recall": 0.9925333333333334,
"eval_runtime": 578.8904,
"eval_samples_per_second": 6.478,
"eval_steps_per_second": 0.81,
"step": 860
},
{
"epoch": 0.41,
"learning_rate": 2.9364716636197442e-05,
"loss": 0.1627,
"step": 903
},
{
"epoch": 0.41,
"eval_accuracy": 0.9584,
"eval_f1": 0.9566425792106726,
"eval_loss": 0.254962295293808,
"eval_precision": 0.9988392338943702,
"eval_recall": 0.9178666666666667,
"eval_runtime": 578.6033,
"eval_samples_per_second": 6.481,
"eval_steps_per_second": 0.811,
"step": 903
},
{
"epoch": 0.43,
"learning_rate": 2.838208409506399e-05,
"loss": 0.2477,
"step": 946
},
{
"epoch": 0.43,
"eval_accuracy": 0.9765333333333334,
"eval_f1": 0.9761258817145958,
"eval_loss": 0.13448475301265717,
"eval_precision": 0.9933738266151297,
"eval_recall": 0.9594666666666667,
"eval_runtime": 578.5049,
"eval_samples_per_second": 6.482,
"eval_steps_per_second": 0.811,
"step": 946
},
{
"epoch": 0.45,
"learning_rate": 2.739945155393053e-05,
"loss": 0.0943,
"step": 989
},
{
"epoch": 0.45,
"eval_accuracy": 0.9688,
"eval_f1": 0.9695391825045562,
"eval_loss": 0.18509739637374878,
"eval_precision": 0.9471007121057986,
"eval_recall": 0.9930666666666667,
"eval_runtime": 578.7851,
"eval_samples_per_second": 6.479,
"eval_steps_per_second": 0.81,
"step": 989
},
{
"epoch": 0.47,
"learning_rate": 2.641681901279708e-05,
"loss": 0.2131,
"step": 1032
},
{
"epoch": 0.47,
"eval_accuracy": 0.9826666666666667,
"eval_f1": 0.9825970548862116,
"eval_loss": 0.10872189700603485,
"eval_precision": 0.9865591397849462,
"eval_recall": 0.9786666666666667,
"eval_runtime": 580.8924,
"eval_samples_per_second": 6.456,
"eval_steps_per_second": 0.807,
"step": 1032
},
{
"epoch": 0.49,
"learning_rate": 2.5434186471663625e-05,
"loss": 0.0829,
"step": 1075
},
{
"epoch": 0.49,
"eval_accuracy": 0.9661333333333333,
"eval_f1": 0.9651577503429356,
"eval_loss": 0.2479323148727417,
"eval_precision": 0.9937853107344633,
"eval_recall": 0.9381333333333334,
"eval_runtime": 578.7358,
"eval_samples_per_second": 6.48,
"eval_steps_per_second": 0.81,
"step": 1075
},
{
"epoch": 0.51,
"learning_rate": 2.4451553930530165e-05,
"loss": 0.1392,
"step": 1118
},
{
"epoch": 0.51,
"eval_accuracy": 0.9613333333333334,
"eval_f1": 0.959867146415721,
"eval_loss": 0.20837165415287018,
"eval_precision": 0.997698504027618,
"eval_recall": 0.9248,
"eval_runtime": 579.0845,
"eval_samples_per_second": 6.476,
"eval_steps_per_second": 0.81,
"step": 1118
},
{
"epoch": 0.53,
"learning_rate": 2.346892138939671e-05,
"loss": 0.0563,
"step": 1161
},
{
"epoch": 0.53,
"eval_accuracy": 0.9874666666666667,
"eval_f1": 0.9874833555259653,
"eval_loss": 0.08351419121026993,
"eval_precision": 0.9861702127659574,
"eval_recall": 0.9888,
"eval_runtime": 578.9179,
"eval_samples_per_second": 6.478,
"eval_steps_per_second": 0.81,
"step": 1161
},
{
"epoch": 0.55,
"learning_rate": 2.2486288848263255e-05,
"loss": 0.107,
"step": 1204
},
{
"epoch": 0.55,
"eval_accuracy": 0.9826666666666667,
"eval_f1": 0.9828269484808455,
"eval_loss": 0.11463689059019089,
"eval_precision": 0.9738219895287958,
"eval_recall": 0.992,
"eval_runtime": 579.4593,
"eval_samples_per_second": 6.472,
"eval_steps_per_second": 0.809,
"step": 1204
},
{
"epoch": 0.57,
"learning_rate": 2.1503656307129798e-05,
"loss": 0.0822,
"step": 1247
},
{
"epoch": 0.57,
"eval_accuracy": 0.9816,
"eval_f1": 0.9817218543046358,
"eval_loss": 0.1307775229215622,
"eval_precision": 0.9752631578947368,
"eval_recall": 0.9882666666666666,
"eval_runtime": 580.0354,
"eval_samples_per_second": 6.465,
"eval_steps_per_second": 0.809,
"step": 1247
},
{
"epoch": 0.59,
"learning_rate": 2.0521023765996345e-05,
"loss": 0.1165,
"step": 1290
},
{
"epoch": 0.59,
"eval_accuracy": 0.9856,
"eval_f1": 0.9855923159018143,
"eval_loss": 0.09052357822656631,
"eval_precision": 0.9861185264281901,
"eval_recall": 0.9850666666666666,
"eval_runtime": 581.231,
"eval_samples_per_second": 6.452,
"eval_steps_per_second": 0.807,
"step": 1290
},
{
"epoch": 0.61,
"learning_rate": 1.953839122486289e-05,
"loss": 0.1156,
"step": 1333
},
{
"epoch": 0.61,
"eval_accuracy": 0.9864,
"eval_f1": 0.9864972200158858,
"eval_loss": 0.09110942482948303,
"eval_precision": 0.9794952681388013,
"eval_recall": 0.9936,
"eval_runtime": 579.1835,
"eval_samples_per_second": 6.475,
"eval_steps_per_second": 0.81,
"step": 1333
},
{
"epoch": 0.63,
"learning_rate": 1.8555758683729435e-05,
"loss": 0.1172,
"step": 1376
},
{
"epoch": 0.63,
"eval_accuracy": 0.984,
"eval_f1": 0.9841772151898733,
"eval_loss": 0.09306684881448746,
"eval_precision": 0.97339593114241,
"eval_recall": 0.9952,
"eval_runtime": 579.0887,
"eval_samples_per_second": 6.476,
"eval_steps_per_second": 0.81,
"step": 1376
},
{
"epoch": 0.65,
"learning_rate": 1.7573126142595978e-05,
"loss": 0.1447,
"step": 1419
},
{
"epoch": 0.65,
"eval_accuracy": 0.9848,
"eval_f1": 0.9849086576648134,
"eval_loss": 0.08812595903873444,
"eval_precision": 0.9779179810725552,
"eval_recall": 0.992,
"eval_runtime": 579.3815,
"eval_samples_per_second": 6.472,
"eval_steps_per_second": 0.809,
"step": 1419
},
{
"epoch": 0.67,
"learning_rate": 1.659049360146252e-05,
"loss": 0.087,
"step": 1462
},
{
"epoch": 0.67,
"eval_accuracy": 0.9872,
"eval_f1": 0.9872272485364556,
"eval_loss": 0.07127923518419266,
"eval_precision": 0.9851301115241635,
"eval_recall": 0.9893333333333333,
"eval_runtime": 578.9808,
"eval_samples_per_second": 6.477,
"eval_steps_per_second": 0.81,
"step": 1462
},
{
"epoch": 0.69,
"learning_rate": 1.5607861060329068e-05,
"loss": 0.0313,
"step": 1505
},
{
"epoch": 0.69,
"eval_accuracy": 0.9861333333333333,
"eval_f1": 0.9862142099681867,
"eval_loss": 0.1003463938832283,
"eval_precision": 0.9804955192409067,
"eval_recall": 0.992,
"eval_runtime": 579.6786,
"eval_samples_per_second": 6.469,
"eval_steps_per_second": 0.809,
"step": 1505
},
{
"epoch": 0.71,
"learning_rate": 1.4625228519195613e-05,
"loss": 0.0729,
"step": 1548
},
{
"epoch": 0.71,
"eval_accuracy": 0.9869333333333333,
"eval_f1": 0.986859747921695,
"eval_loss": 0.0750027745962143,
"eval_precision": 0.9924487594390508,
"eval_recall": 0.9813333333333333,
"eval_runtime": 581.8591,
"eval_samples_per_second": 6.445,
"eval_steps_per_second": 0.806,
"step": 1548
},
{
"epoch": 0.73,
"learning_rate": 1.3642595978062158e-05,
"loss": 0.106,
"step": 1591
},
{
"epoch": 0.73,
"eval_accuracy": 0.9874666666666667,
"eval_f1": 0.9874499332443257,
"eval_loss": 0.06067837029695511,
"eval_precision": 0.9887700534759358,
"eval_recall": 0.9861333333333333,
"eval_runtime": 579.0471,
"eval_samples_per_second": 6.476,
"eval_steps_per_second": 0.81,
"step": 1591
},
{
"epoch": 0.75,
"learning_rate": 1.2659963436928701e-05,
"loss": 0.0823,
"step": 1634
},
{
"epoch": 0.75,
"eval_accuracy": 0.9877333333333334,
"eval_f1": 0.9877005347593582,
"eval_loss": 0.07156907767057419,
"eval_precision": 0.9903485254691688,
"eval_recall": 0.9850666666666666,
"eval_runtime": 578.809,
"eval_samples_per_second": 6.479,
"eval_steps_per_second": 0.81,
"step": 1634
},
{
"epoch": 0.77,
"learning_rate": 1.1677330895795248e-05,
"loss": 0.0817,
"step": 1677
},
{
"epoch": 0.77,
"eval_accuracy": 0.9845333333333334,
"eval_f1": 0.9846804014791337,
"eval_loss": 0.09290226548910141,
"eval_precision": 0.9754055468341183,
"eval_recall": 0.9941333333333333,
"eval_runtime": 578.5452,
"eval_samples_per_second": 6.482,
"eval_steps_per_second": 0.811,
"step": 1677
},
{
"epoch": 0.79,
"learning_rate": 1.0694698354661791e-05,
"loss": 0.1279,
"step": 1720
},
{
"epoch": 0.79,
"eval_accuracy": 0.988,
"eval_f1": 0.9879453522635949,
"eval_loss": 0.07037492841482162,
"eval_precision": 0.9924650161463939,
"eval_recall": 0.9834666666666667,
"eval_runtime": 579.5947,
"eval_samples_per_second": 6.47,
"eval_steps_per_second": 0.809,
"step": 1720
},
{
"epoch": 0.81,
"learning_rate": 9.712065813528338e-06,
"loss": 0.075,
"step": 1763
},
{
"epoch": 0.81,
"eval_accuracy": 0.9890666666666666,
"eval_f1": 0.9890462196099385,
"eval_loss": 0.06325065344572067,
"eval_precision": 0.9908993576017131,
"eval_recall": 0.9872,
"eval_runtime": 579.6298,
"eval_samples_per_second": 6.47,
"eval_steps_per_second": 0.809,
"step": 1763
},
{
"epoch": 0.83,
"learning_rate": 8.729433272394881e-06,
"loss": 0.0909,
"step": 1806
},
{
"epoch": 0.83,
"eval_accuracy": 0.9842666666666666,
"eval_f1": 0.9840841650930671,
"eval_loss": 0.09650667011737823,
"eval_precision": 0.9956331877729258,
"eval_recall": 0.9728,
"eval_runtime": 579.8501,
"eval_samples_per_second": 6.467,
"eval_steps_per_second": 0.809,
"step": 1806
},
{
"epoch": 0.85,
"learning_rate": 7.746800731261426e-06,
"loss": 0.0583,
"step": 1849
},
{
"epoch": 0.85,
"eval_accuracy": 0.9893333333333333,
"eval_f1": 0.9893276414087514,
"eval_loss": 0.07162317633628845,
"eval_precision": 0.9898558462359851,
"eval_recall": 0.9888,
"eval_runtime": 579.4799,
"eval_samples_per_second": 6.471,
"eval_steps_per_second": 0.809,
"step": 1849
},
{
"epoch": 0.86,
"learning_rate": 6.764168190127972e-06,
"loss": 0.0961,
"step": 1892
},
{
"epoch": 0.86,
"eval_accuracy": 0.988,
"eval_f1": 0.9879518072289156,
"eval_loss": 0.05759565904736519,
"eval_precision": 0.9919354838709677,
"eval_recall": 0.984,
"eval_runtime": 580.3503,
"eval_samples_per_second": 6.462,
"eval_steps_per_second": 0.808,
"step": 1892
},
{
"epoch": 0.88,
"learning_rate": 5.781535648994515e-06,
"loss": 0.0356,
"step": 1935
},
{
"epoch": 0.88,
"eval_accuracy": 0.9882666666666666,
"eval_f1": 0.9883103081827843,
"eval_loss": 0.06381053477525711,
"eval_precision": 0.984647961884595,
"eval_recall": 0.992,
"eval_runtime": 581.544,
"eval_samples_per_second": 6.448,
"eval_steps_per_second": 0.806,
"step": 1935
},
{
"epoch": 0.9,
"learning_rate": 4.798903107861061e-06,
"loss": 0.0848,
"step": 1978
},
{
"epoch": 0.9,
"eval_accuracy": 0.9893333333333333,
"eval_f1": 0.9893162393162394,
"eval_loss": 0.05824807286262512,
"eval_precision": 0.990904226859283,
"eval_recall": 0.9877333333333334,
"eval_runtime": 578.359,
"eval_samples_per_second": 6.484,
"eval_steps_per_second": 0.811,
"step": 1978
},
{
"epoch": 0.92,
"learning_rate": 3.816270566727605e-06,
"loss": 0.1019,
"step": 2021
},
{
"epoch": 0.92,
"eval_accuracy": 0.9890666666666666,
"eval_f1": 0.9890579129970644,
"eval_loss": 0.055534329265356064,
"eval_precision": 0.9898504273504274,
"eval_recall": 0.9882666666666666,
"eval_runtime": 579.2162,
"eval_samples_per_second": 6.474,
"eval_steps_per_second": 0.81,
"step": 2021
},
{
"epoch": 0.94,
"learning_rate": 2.83363802559415e-06,
"loss": 0.0274,
"step": 2064
},
{
"epoch": 0.94,
"eval_accuracy": 0.9893333333333333,
"eval_f1": 0.9892990904226859,
"eval_loss": 0.05893222615122795,
"eval_precision": 0.9924852388620504,
"eval_recall": 0.9861333333333333,
"eval_runtime": 581.1057,
"eval_samples_per_second": 6.453,
"eval_steps_per_second": 0.807,
"step": 2064
},
{
"epoch": 0.96,
"learning_rate": 1.851005484460695e-06,
"loss": 0.0313,
"step": 2107
},
{
"epoch": 0.96,
"eval_accuracy": 0.9893333333333333,
"eval_f1": 0.9892933618843683,
"eval_loss": 0.0617961585521698,
"eval_precision": 0.9930145083288554,
"eval_recall": 0.9856,
"eval_runtime": 580.2597,
"eval_samples_per_second": 6.463,
"eval_steps_per_second": 0.808,
"step": 2107
},
{
"epoch": 0.98,
"learning_rate": 8.683729433272396e-07,
"loss": 0.0513,
"step": 2150
},
{
"epoch": 0.98,
"eval_accuracy": 0.9898666666666667,
"eval_f1": 0.9898286937901497,
"eval_loss": 0.05942407250404358,
"eval_precision": 0.9935518538420204,
"eval_recall": 0.9861333333333333,
"eval_runtime": 580.5968,
"eval_samples_per_second": 6.459,
"eval_steps_per_second": 0.808,
"step": 2150
}
],
"max_steps": 2188,
"num_train_epochs": 1,
"total_flos": 1.268902526976e+17,
"trial_name": null,
"trial_params": null
}