|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 12.0, |
|
"eval_steps": 500, |
|
"global_step": 492, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"eval_B": { |
|
"f1-score": 0.5721362229102167, |
|
"precision": 0.8076923076923077, |
|
"recall": 0.4429530201342282, |
|
"support": 1043.0 |
|
}, |
|
"eval_I": { |
|
"f1-score": 0.927966217883682, |
|
"precision": 0.8850358282336942, |
|
"recall": 0.9752737752161383, |
|
"support": 17350.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.864171621779177, |
|
"precision": 0.9349142280524723, |
|
"recall": 0.8033817472360719, |
|
"support": 9226.0 |
|
}, |
|
"eval_accuracy": 0.8977515478474963, |
|
"eval_loss": 0.29473039507865906, |
|
"eval_macro avg": { |
|
"f1-score": 0.7880913541910252, |
|
"precision": 0.8758807879928246, |
|
"recall": 0.7405361808621462, |
|
"support": 27619.0 |
|
}, |
|
"eval_runtime": 1.3384, |
|
"eval_samples_per_second": 59.772, |
|
"eval_steps_per_second": 7.472, |
|
"eval_weighted avg": { |
|
"f1-score": 0.8932184128068332, |
|
"precision": 0.8987766886849552, |
|
"recall": 0.8977515478474963, |
|
"support": 27619.0 |
|
}, |
|
"step": 41 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_B": { |
|
"f1-score": 0.8396183552930486, |
|
"precision": 0.7979274611398963, |
|
"recall": 0.8859060402684564, |
|
"support": 1043.0 |
|
}, |
|
"eval_I": { |
|
"f1-score": 0.9529475085691623, |
|
"precision": 0.9369951534733441, |
|
"recall": 0.9694524495677234, |
|
"support": 17350.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.9060667568786648, |
|
"precision": 0.9441833137485312, |
|
"recall": 0.8709083026230219, |
|
"support": 9226.0 |
|
}, |
|
"eval_accuracy": 0.9333791954813715, |
|
"eval_loss": 0.19544227421283722, |
|
"eval_macro avg": { |
|
"f1-score": 0.8995442069136251, |
|
"precision": 0.8930353094539237, |
|
"recall": 0.9087555974864006, |
|
"support": 27619.0 |
|
}, |
|
"eval_runtime": 1.3427, |
|
"eval_samples_per_second": 59.582, |
|
"eval_steps_per_second": 7.448, |
|
"eval_weighted avg": { |
|
"f1-score": 0.933007462877301, |
|
"precision": 0.9341445927577168, |
|
"recall": 0.9333791954813715, |
|
"support": 27619.0 |
|
}, |
|
"step": 82 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_B": { |
|
"f1-score": 0.8647365923113433, |
|
"precision": 0.856203007518797, |
|
"recall": 0.8734419942473634, |
|
"support": 1043.0 |
|
}, |
|
"eval_I": { |
|
"f1-score": 0.9557367501456028, |
|
"precision": 0.9658622719246616, |
|
"recall": 0.945821325648415, |
|
"support": 17350.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.9184183917833005, |
|
"precision": 0.9021432305279665, |
|
"recall": 0.9352915673097767, |
|
"support": 9226.0 |
|
}, |
|
"eval_accuracy": 0.9395705854665267, |
|
"eval_loss": 0.17375266551971436, |
|
"eval_macro avg": { |
|
"f1-score": 0.9129639114134155, |
|
"precision": 0.9080695033238083, |
|
"recall": 0.9181849624018517, |
|
"support": 27619.0 |
|
}, |
|
"eval_runtime": 1.344, |
|
"eval_samples_per_second": 59.525, |
|
"eval_steps_per_second": 7.441, |
|
"eval_weighted avg": { |
|
"f1-score": 0.9398342070096555, |
|
"precision": 0.940436062116152, |
|
"recall": 0.9395705854665267, |
|
"support": 27619.0 |
|
}, |
|
"step": 123 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_B": { |
|
"f1-score": 0.862493839329719, |
|
"precision": 0.8874239350912779, |
|
"recall": 0.8389261744966443, |
|
"support": 1043.0 |
|
}, |
|
"eval_I": { |
|
"f1-score": 0.9584169773444221, |
|
"precision": 0.9537671232876712, |
|
"recall": 0.9631123919308358, |
|
"support": 17350.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.9205518294345384, |
|
"precision": 0.926259190167892, |
|
"recall": 0.9149143724257534, |
|
"support": 9226.0 |
|
}, |
|
"eval_accuracy": 0.9423223143488179, |
|
"eval_loss": 0.17503595352172852, |
|
"eval_macro avg": { |
|
"f1-score": 0.9138208820362266, |
|
"precision": 0.9224834161822804, |
|
"recall": 0.9056509796177444, |
|
"support": 27619.0 |
|
}, |
|
"eval_runtime": 1.3496, |
|
"eval_samples_per_second": 59.277, |
|
"eval_steps_per_second": 7.41, |
|
"eval_weighted avg": { |
|
"f1-score": 0.9421458709478862, |
|
"precision": 0.9420728499160095, |
|
"recall": 0.9423223143488179, |
|
"support": 27619.0 |
|
}, |
|
"step": 164 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_B": { |
|
"f1-score": 0.8739573679332716, |
|
"precision": 0.8457399103139014, |
|
"recall": 0.9041227229146692, |
|
"support": 1043.0 |
|
}, |
|
"eval_I": { |
|
"f1-score": 0.954658525554048, |
|
"precision": 0.9367580161988239, |
|
"recall": 0.9732564841498559, |
|
"support": 17350.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.9086082241301401, |
|
"precision": 0.948690728945506, |
|
"recall": 0.8717754172989378, |
|
"support": 9226.0 |
|
}, |
|
"eval_accuracy": 0.9367464426662805, |
|
"eval_loss": 0.20350226759910583, |
|
"eval_macro avg": { |
|
"f1-score": 0.9124080392058199, |
|
"precision": 0.9103962184860771, |
|
"recall": 0.916384874787821, |
|
"support": 27619.0 |
|
}, |
|
"eval_runtime": 1.3385, |
|
"eval_samples_per_second": 59.767, |
|
"eval_steps_per_second": 7.471, |
|
"eval_weighted avg": { |
|
"f1-score": 0.9362280469583188, |
|
"precision": 0.9373068891979518, |
|
"recall": 0.9367464426662805, |
|
"support": 27619.0 |
|
}, |
|
"step": 205 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_B": { |
|
"f1-score": 0.8744710860366715, |
|
"precision": 0.8579335793357934, |
|
"recall": 0.8916586768935763, |
|
"support": 1043.0 |
|
}, |
|
"eval_I": { |
|
"f1-score": 0.9548456588905582, |
|
"precision": 0.9394277427631212, |
|
"recall": 0.970778097982709, |
|
"support": 17350.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.9091520861372813, |
|
"precision": 0.941900999302812, |
|
"recall": 0.8786039453717754, |
|
"support": 9226.0 |
|
}, |
|
"eval_accuracy": 0.9369998913791231, |
|
"eval_loss": 0.18961849808692932, |
|
"eval_macro avg": { |
|
"f1-score": 0.9128229436881702, |
|
"precision": 0.9130874404672422, |
|
"recall": 0.9136802400826869, |
|
"support": 27619.0 |
|
}, |
|
"eval_runtime": 1.3446, |
|
"eval_samples_per_second": 59.497, |
|
"eval_steps_per_second": 7.437, |
|
"eval_weighted avg": { |
|
"f1-score": 0.9365466769683909, |
|
"precision": 0.9371763887090455, |
|
"recall": 0.9369998913791231, |
|
"support": 27619.0 |
|
}, |
|
"step": 246 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_B": { |
|
"f1-score": 0.8734770384254921, |
|
"precision": 0.854262144821265, |
|
"recall": 0.8935762224352828, |
|
"support": 1043.0 |
|
}, |
|
"eval_I": { |
|
"f1-score": 0.9571367703451216, |
|
"precision": 0.9436012321478577, |
|
"recall": 0.9710662824207493, |
|
"support": 17350.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.9144644952231968, |
|
"precision": 0.9436181252161882, |
|
"recall": 0.8870583134619553, |
|
"support": 9226.0 |
|
}, |
|
"eval_accuracy": 0.9400774828922119, |
|
"eval_loss": 0.19739200174808502, |
|
"eval_macro avg": { |
|
"f1-score": 0.9150261013312702, |
|
"precision": 0.9138271673951035, |
|
"recall": 0.9172336061059957, |
|
"support": 27619.0 |
|
}, |
|
"eval_runtime": 1.3403, |
|
"eval_samples_per_second": 59.69, |
|
"eval_steps_per_second": 7.461, |
|
"eval_weighted avg": { |
|
"f1-score": 0.9397229787282255, |
|
"precision": 0.9402330865729558, |
|
"recall": 0.9400774828922119, |
|
"support": 27619.0 |
|
}, |
|
"step": 287 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_B": { |
|
"f1-score": 0.875, |
|
"precision": 0.851952770208901, |
|
"recall": 0.8993288590604027, |
|
"support": 1043.0 |
|
}, |
|
"eval_I": { |
|
"f1-score": 0.9546683185043361, |
|
"precision": 0.9332269074094462, |
|
"recall": 0.9771181556195966, |
|
"support": 17350.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.90670155876664, |
|
"precision": 0.9541427203065134, |
|
"recall": 0.8637546065467158, |
|
"support": 9226.0 |
|
}, |
|
"eval_accuracy": 0.9363119591585503, |
|
"eval_loss": 0.2391989678144455, |
|
"eval_macro avg": { |
|
"f1-score": 0.9121232924236587, |
|
"precision": 0.9131074659749535, |
|
"recall": 0.913400540408905, |
|
"support": 27619.0 |
|
}, |
|
"eval_runtime": 1.3469, |
|
"eval_samples_per_second": 59.396, |
|
"eval_steps_per_second": 7.424, |
|
"eval_weighted avg": { |
|
"f1-score": 0.9356366598077863, |
|
"precision": 0.937144513575063, |
|
"recall": 0.9363119591585503, |
|
"support": 27619.0 |
|
}, |
|
"step": 328 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_B": { |
|
"f1-score": 0.8698850574712644, |
|
"precision": 0.8356890459363958, |
|
"recall": 0.9069990412272292, |
|
"support": 1043.0 |
|
}, |
|
"eval_I": { |
|
"f1-score": 0.9540004482294935, |
|
"precision": 0.9281042189033032, |
|
"recall": 0.9813832853025937, |
|
"support": 17350.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.9027465883572292, |
|
"precision": 0.9629038201695124, |
|
"recall": 0.8496639930630826, |
|
"support": 9226.0 |
|
}, |
|
"eval_accuracy": 0.9345740251276295, |
|
"eval_loss": 0.25876709818840027, |
|
"eval_macro avg": { |
|
"f1-score": 0.9088773646859957, |
|
"precision": 0.9088990283364038, |
|
"recall": 0.9126821065309684, |
|
"support": 27619.0 |
|
}, |
|
"eval_runtime": 1.3397, |
|
"eval_samples_per_second": 59.713, |
|
"eval_steps_per_second": 7.464, |
|
"eval_weighted avg": { |
|
"f1-score": 0.9337028102359982, |
|
"precision": 0.9362389122621345, |
|
"recall": 0.9345740251276295, |
|
"support": 27619.0 |
|
}, |
|
"step": 369 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_B": { |
|
"f1-score": 0.8675496688741721, |
|
"precision": 0.8562091503267973, |
|
"recall": 0.8791946308724832, |
|
"support": 1043.0 |
|
}, |
|
"eval_I": { |
|
"f1-score": 0.9541242937853106, |
|
"precision": 0.9356232686980609, |
|
"recall": 0.973371757925072, |
|
"support": 17350.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.9069058903182126, |
|
"precision": 0.9457519416333255, |
|
"recall": 0.8711250812920008, |
|
"support": 9226.0 |
|
}, |
|
"eval_accuracy": 0.935660233896955, |
|
"eval_loss": 0.2737439274787903, |
|
"eval_macro avg": { |
|
"f1-score": 0.9095266176592318, |
|
"precision": 0.9125281202193946, |
|
"recall": 0.9078971566965187, |
|
"support": 27619.0 |
|
}, |
|
"eval_runtime": 1.3436, |
|
"eval_samples_per_second": 59.54, |
|
"eval_steps_per_second": 7.443, |
|
"eval_weighted avg": { |
|
"f1-score": 0.9350818112852286, |
|
"precision": 0.9360077218295835, |
|
"recall": 0.935660233896955, |
|
"support": 27619.0 |
|
}, |
|
"step": 410 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_B": { |
|
"f1-score": 0.8654028436018957, |
|
"precision": 0.8556701030927835, |
|
"recall": 0.87535953978907, |
|
"support": 1043.0 |
|
}, |
|
"eval_I": { |
|
"f1-score": 0.9553462854557281, |
|
"precision": 0.9378157792460163, |
|
"recall": 0.9735446685878962, |
|
"support": 17350.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.9094388473011763, |
|
"precision": 0.9459079733052336, |
|
"recall": 0.8756774333405593, |
|
"support": 9226.0 |
|
}, |
|
"eval_accuracy": 0.9371447192150332, |
|
"eval_loss": 0.27220794558525085, |
|
"eval_macro avg": { |
|
"f1-score": 0.9100626587862667, |
|
"precision": 0.9131312852146779, |
|
"recall": 0.9081938805725085, |
|
"support": 27619.0 |
|
}, |
|
"eval_runtime": 1.3435, |
|
"eval_samples_per_second": 59.547, |
|
"eval_steps_per_second": 7.443, |
|
"eval_weighted avg": { |
|
"f1-score": 0.9366145053671137, |
|
"precision": 0.937416801808836, |
|
"recall": 0.9371447192150332, |
|
"support": 27619.0 |
|
}, |
|
"step": 451 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_B": { |
|
"f1-score": 0.8710900473933649, |
|
"precision": 0.8612933458294283, |
|
"recall": 0.8811121764141898, |
|
"support": 1043.0 |
|
}, |
|
"eval_I": { |
|
"f1-score": 0.9563688940549427, |
|
"precision": 0.9410812921943871, |
|
"recall": 0.9721613832853025, |
|
"support": 17350.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.9124614953794455, |
|
"precision": 0.9440259589755475, |
|
"recall": 0.8829395187513549, |
|
"support": 9226.0 |
|
}, |
|
"eval_accuracy": 0.9389188602049314, |
|
"eval_loss": 0.27493152022361755, |
|
"eval_macro avg": { |
|
"f1-score": 0.9133068122759177, |
|
"precision": 0.9154668656664544, |
|
"recall": 0.9120710261502823, |
|
"support": 27619.0 |
|
}, |
|
"eval_runtime": 1.3368, |
|
"eval_samples_per_second": 59.844, |
|
"eval_steps_per_second": 7.48, |
|
"eval_weighted avg": { |
|
"f1-score": 0.938481371072642, |
|
"precision": 0.9390518439038746, |
|
"recall": 0.9389188602049314, |
|
"support": 27619.0 |
|
}, |
|
"step": 492 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 656, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 16, |
|
"save_steps": 500, |
|
"total_flos": 1725439832827200.0, |
|
"train_batch_size": 8, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|