|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 2.0, |
|
"eval_steps": 500, |
|
"global_step": 10940, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.0, |
|
"learning_rate": 1.9998171846435103e-05, |
|
"loss": 3.4748, |
|
"step": 1 |
|
}, |
|
{ |
|
"epoch": 0.23, |
|
"learning_rate": 1.7714808043875687e-05, |
|
"loss": 0.3223, |
|
"step": 1250 |
|
}, |
|
{ |
|
"epoch": 0.46, |
|
"learning_rate": 1.5429616087751372e-05, |
|
"loss": 0.1466, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 0.69, |
|
"learning_rate": 1.3144424131627058e-05, |
|
"loss": 0.1219, |
|
"step": 3750 |
|
}, |
|
{ |
|
"epoch": 0.91, |
|
"learning_rate": 1.0859232175502743e-05, |
|
"loss": 0.1025, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_ANIM": { |
|
"f1": 0.6988922457200403, |
|
"number": 3208, |
|
"precision": 0.5861486486486487, |
|
"recall": 0.8653366583541147 |
|
}, |
|
"eval_BIO": { |
|
"f1": 0.5263157894736842, |
|
"number": 16, |
|
"precision": 0.45454545454545453, |
|
"recall": 0.625 |
|
}, |
|
"eval_CEL": { |
|
"f1": 0.7659574468085106, |
|
"number": 82, |
|
"precision": 0.6792452830188679, |
|
"recall": 0.8780487804878049 |
|
}, |
|
"eval_DIS": { |
|
"f1": 0.6575342465753424, |
|
"number": 1518, |
|
"precision": 0.5229571984435798, |
|
"recall": 0.8853754940711462 |
|
}, |
|
"eval_EVE": { |
|
"f1": 0.958100558659218, |
|
"number": 704, |
|
"precision": 0.9423076923076923, |
|
"recall": 0.9744318181818182 |
|
}, |
|
"eval_FOOD": { |
|
"f1": 0.53125, |
|
"number": 1132, |
|
"precision": 0.38825448613376834, |
|
"recall": 0.8409893992932862 |
|
}, |
|
"eval_INST": { |
|
"f1": 0.5454545454545454, |
|
"number": 24, |
|
"precision": 0.42857142857142855, |
|
"recall": 0.75 |
|
}, |
|
"eval_LOC": { |
|
"f1": 0.9938849369774116, |
|
"number": 24048, |
|
"precision": 0.9942571785268415, |
|
"recall": 0.9935129740518962 |
|
}, |
|
"eval_MEDIA": { |
|
"f1": 0.9480381760339343, |
|
"number": 916, |
|
"precision": 0.9216494845360824, |
|
"recall": 0.9759825327510917 |
|
}, |
|
"eval_MYTH": { |
|
"f1": 0.6987951807228915, |
|
"number": 64, |
|
"precision": 0.5686274509803921, |
|
"recall": 0.90625 |
|
}, |
|
"eval_ORG": { |
|
"f1": 0.9804511278195489, |
|
"number": 6618, |
|
"precision": 0.9757557617479796, |
|
"recall": 0.9851919008763977 |
|
}, |
|
"eval_PER": { |
|
"f1": 0.9935385784872672, |
|
"number": 10530, |
|
"precision": 0.9941053432211447, |
|
"recall": 0.9929724596391263 |
|
}, |
|
"eval_PLANT": { |
|
"f1": 0.56656346749226, |
|
"number": 1788, |
|
"precision": 0.4331360946745562, |
|
"recall": 0.8187919463087249 |
|
}, |
|
"eval_TIME": { |
|
"f1": 0.7452830188679245, |
|
"number": 578, |
|
"precision": 0.6829971181556196, |
|
"recall": 0.8200692041522492 |
|
}, |
|
"eval_VEHI": { |
|
"f1": 0.8571428571428572, |
|
"number": 64, |
|
"precision": 0.7894736842105263, |
|
"recall": 0.9375 |
|
}, |
|
"eval_loss": 0.09848607331514359, |
|
"eval_overall_accuracy": 0.9839002953677689, |
|
"eval_overall_f1": 0.9165482757984463, |
|
"eval_overall_precision": 0.8698606149751348, |
|
"eval_overall_recall": 0.9685318775589784, |
|
"eval_runtime": 95.1985, |
|
"eval_samples_per_second": 345.678, |
|
"eval_steps_per_second": 7.206, |
|
"step": 5470 |
|
}, |
|
{ |
|
"epoch": 1.14, |
|
"learning_rate": 8.574040219378429e-06, |
|
"loss": 0.0791, |
|
"step": 6250 |
|
}, |
|
{ |
|
"epoch": 1.37, |
|
"learning_rate": 6.288848263254113e-06, |
|
"loss": 0.0668, |
|
"step": 7500 |
|
}, |
|
{ |
|
"epoch": 1.6, |
|
"learning_rate": 4.003656307129799e-06, |
|
"loss": 0.0584, |
|
"step": 8750 |
|
}, |
|
{ |
|
"epoch": 1.83, |
|
"learning_rate": 1.7184643510054846e-06, |
|
"loss": 0.0526, |
|
"step": 10000 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_ANIM": { |
|
"f1": 0.7314670813893208, |
|
"number": 3208, |
|
"precision": 0.6259982253771074, |
|
"recall": 0.8796758104738155 |
|
}, |
|
"eval_BIO": { |
|
"f1": 0.6363636363636364, |
|
"number": 16, |
|
"precision": 0.5, |
|
"recall": 0.875 |
|
}, |
|
"eval_CEL": { |
|
"f1": 0.7835051546391752, |
|
"number": 82, |
|
"precision": 0.6785714285714286, |
|
"recall": 0.926829268292683 |
|
}, |
|
"eval_DIS": { |
|
"f1": 0.6950578338590956, |
|
"number": 1518, |
|
"precision": 0.5783027121609798, |
|
"recall": 0.8708827404479579 |
|
}, |
|
"eval_EVE": { |
|
"f1": 0.9678321678321677, |
|
"number": 704, |
|
"precision": 0.953168044077135, |
|
"recall": 0.9829545454545454 |
|
}, |
|
"eval_FOOD": { |
|
"f1": 0.5880893300248139, |
|
"number": 1132, |
|
"precision": 0.45315487571701724, |
|
"recall": 0.8374558303886925 |
|
}, |
|
"eval_INST": { |
|
"f1": 0.5625000000000001, |
|
"number": 24, |
|
"precision": 0.45, |
|
"recall": 0.75 |
|
}, |
|
"eval_LOC": { |
|
"f1": 0.9941398944349777, |
|
"number": 24048, |
|
"precision": 0.9936030572401762, |
|
"recall": 0.9946773120425815 |
|
}, |
|
"eval_MEDIA": { |
|
"f1": 0.9540106951871657, |
|
"number": 916, |
|
"precision": 0.9350104821802935, |
|
"recall": 0.9737991266375546 |
|
}, |
|
"eval_MYTH": { |
|
"f1": 0.8055555555555555, |
|
"number": 64, |
|
"precision": 0.725, |
|
"recall": 0.90625 |
|
}, |
|
"eval_ORG": { |
|
"f1": 0.9806938159879336, |
|
"number": 6618, |
|
"precision": 0.9789220114423366, |
|
"recall": 0.9824720459353279 |
|
}, |
|
"eval_PER": { |
|
"f1": 0.9945915172217479, |
|
"number": 10530, |
|
"precision": 0.9937428896473265, |
|
"recall": 0.9954415954415955 |
|
}, |
|
"eval_PLANT": { |
|
"f1": 0.6153232242617718, |
|
"number": 1788, |
|
"precision": 0.478287841191067, |
|
"recall": 0.8624161073825504 |
|
}, |
|
"eval_TIME": { |
|
"f1": 0.7310030395136778, |
|
"number": 578, |
|
"precision": 0.6517615176151762, |
|
"recall": 0.8321799307958477 |
|
}, |
|
"eval_VEHI": { |
|
"f1": 0.8571428571428572, |
|
"number": 64, |
|
"precision": 0.7894736842105263, |
|
"recall": 0.9375 |
|
}, |
|
"eval_loss": 0.11049605160951614, |
|
"eval_overall_accuracy": 0.9861263597723507, |
|
"eval_overall_f1": 0.9277588486101026, |
|
"eval_overall_precision": 0.8877743728620296, |
|
"eval_overall_recall": 0.9715149151881458, |
|
"eval_runtime": 94.1134, |
|
"eval_samples_per_second": 349.663, |
|
"eval_steps_per_second": 7.289, |
|
"step": 10940 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"step": 10940, |
|
"total_flos": 1.929975843125117e+16, |
|
"train_loss": 0.1132796828881914, |
|
"train_runtime": 2485.5568, |
|
"train_samples_per_second": 211.269, |
|
"train_steps_per_second": 4.401 |
|
} |
|
], |
|
"logging_steps": 1250, |
|
"max_steps": 10940, |
|
"num_train_epochs": 2, |
|
"save_steps": 500, |
|
"total_flos": 1.929975843125117e+16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|