{ "best_metric": null, "best_model_checkpoint": null, "epoch": 2.0, "eval_steps": 500, "global_step": 10940, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 1.9998171846435103e-05, "loss": 3.4748, "step": 1 }, { "epoch": 0.23, "learning_rate": 1.7714808043875687e-05, "loss": 0.3223, "step": 1250 }, { "epoch": 0.46, "learning_rate": 1.5429616087751372e-05, "loss": 0.1466, "step": 2500 }, { "epoch": 0.69, "learning_rate": 1.3144424131627058e-05, "loss": 0.1219, "step": 3750 }, { "epoch": 0.91, "learning_rate": 1.0859232175502743e-05, "loss": 0.1025, "step": 5000 }, { "epoch": 1.0, "eval_ANIM": { "f1": 0.6988922457200403, "number": 3208, "precision": 0.5861486486486487, "recall": 0.8653366583541147 }, "eval_BIO": { "f1": 0.5263157894736842, "number": 16, "precision": 0.45454545454545453, "recall": 0.625 }, "eval_CEL": { "f1": 0.7659574468085106, "number": 82, "precision": 0.6792452830188679, "recall": 0.8780487804878049 }, "eval_DIS": { "f1": 0.6575342465753424, "number": 1518, "precision": 0.5229571984435798, "recall": 0.8853754940711462 }, "eval_EVE": { "f1": 0.958100558659218, "number": 704, "precision": 0.9423076923076923, "recall": 0.9744318181818182 }, "eval_FOOD": { "f1": 0.53125, "number": 1132, "precision": 0.38825448613376834, "recall": 0.8409893992932862 }, "eval_INST": { "f1": 0.5454545454545454, "number": 24, "precision": 0.42857142857142855, "recall": 0.75 }, "eval_LOC": { "f1": 0.9938849369774116, "number": 24048, "precision": 0.9942571785268415, "recall": 0.9935129740518962 }, "eval_MEDIA": { "f1": 0.9480381760339343, "number": 916, "precision": 0.9216494845360824, "recall": 0.9759825327510917 }, "eval_MYTH": { "f1": 0.6987951807228915, "number": 64, "precision": 0.5686274509803921, "recall": 0.90625 }, "eval_ORG": { "f1": 0.9804511278195489, "number": 6618, "precision": 0.9757557617479796, "recall": 0.9851919008763977 }, "eval_PER": { "f1": 0.9935385784872672, "number": 10530, "precision": 0.9941053432211447, "recall": 0.9929724596391263 }, "eval_PLANT": { "f1": 0.56656346749226, "number": 1788, "precision": 0.4331360946745562, "recall": 0.8187919463087249 }, "eval_TIME": { "f1": 0.7452830188679245, "number": 578, "precision": 0.6829971181556196, "recall": 0.8200692041522492 }, "eval_VEHI": { "f1": 0.8571428571428572, "number": 64, "precision": 0.7894736842105263, "recall": 0.9375 }, "eval_loss": 0.09848607331514359, "eval_overall_accuracy": 0.9839002953677689, "eval_overall_f1": 0.9165482757984463, "eval_overall_precision": 0.8698606149751348, "eval_overall_recall": 0.9685318775589784, "eval_runtime": 95.1985, "eval_samples_per_second": 345.678, "eval_steps_per_second": 7.206, "step": 5470 }, { "epoch": 1.14, "learning_rate": 8.574040219378429e-06, "loss": 0.0791, "step": 6250 }, { "epoch": 1.37, "learning_rate": 6.288848263254113e-06, "loss": 0.0668, "step": 7500 }, { "epoch": 1.6, "learning_rate": 4.003656307129799e-06, "loss": 0.0584, "step": 8750 }, { "epoch": 1.83, "learning_rate": 1.7184643510054846e-06, "loss": 0.0526, "step": 10000 }, { "epoch": 2.0, "eval_ANIM": { "f1": 0.7314670813893208, "number": 3208, "precision": 0.6259982253771074, "recall": 0.8796758104738155 }, "eval_BIO": { "f1": 0.6363636363636364, "number": 16, "precision": 0.5, "recall": 0.875 }, "eval_CEL": { "f1": 0.7835051546391752, "number": 82, "precision": 0.6785714285714286, "recall": 0.926829268292683 }, "eval_DIS": { "f1": 0.6950578338590956, "number": 1518, "precision": 0.5783027121609798, "recall": 0.8708827404479579 }, "eval_EVE": { "f1": 0.9678321678321677, "number": 704, "precision": 0.953168044077135, "recall": 0.9829545454545454 }, "eval_FOOD": { "f1": 0.5880893300248139, "number": 1132, "precision": 0.45315487571701724, "recall": 0.8374558303886925 }, "eval_INST": { "f1": 0.5625000000000001, "number": 24, "precision": 0.45, "recall": 0.75 }, "eval_LOC": { "f1": 0.9941398944349777, "number": 24048, "precision": 0.9936030572401762, "recall": 0.9946773120425815 }, "eval_MEDIA": { "f1": 0.9540106951871657, "number": 916, "precision": 0.9350104821802935, "recall": 0.9737991266375546 }, "eval_MYTH": { "f1": 0.8055555555555555, "number": 64, "precision": 0.725, "recall": 0.90625 }, "eval_ORG": { "f1": 0.9806938159879336, "number": 6618, "precision": 0.9789220114423366, "recall": 0.9824720459353279 }, "eval_PER": { "f1": 0.9945915172217479, "number": 10530, "precision": 0.9937428896473265, "recall": 0.9954415954415955 }, "eval_PLANT": { "f1": 0.6153232242617718, "number": 1788, "precision": 0.478287841191067, "recall": 0.8624161073825504 }, "eval_TIME": { "f1": 0.7310030395136778, "number": 578, "precision": 0.6517615176151762, "recall": 0.8321799307958477 }, "eval_VEHI": { "f1": 0.8571428571428572, "number": 64, "precision": 0.7894736842105263, "recall": 0.9375 }, "eval_loss": 0.11049605160951614, "eval_overall_accuracy": 0.9861263597723507, "eval_overall_f1": 0.9277588486101026, "eval_overall_precision": 0.8877743728620296, "eval_overall_recall": 0.9715149151881458, "eval_runtime": 94.1134, "eval_samples_per_second": 349.663, "eval_steps_per_second": 7.289, "step": 10940 }, { "epoch": 2.0, "step": 10940, "total_flos": 1.929975843125117e+16, "train_loss": 0.1132796828881914, "train_runtime": 2485.5568, "train_samples_per_second": 211.269, "train_steps_per_second": 4.401 } ], "logging_steps": 1250, "max_steps": 10940, "num_train_epochs": 2, "save_steps": 500, "total_flos": 1.929975843125117e+16, "trial_name": null, "trial_params": null }