|
{ |
|
"best_metric": 0.5486067787470349, |
|
"best_model_checkpoint": "InLegalBERT-lora/checkpoint-1125", |
|
"epoch": 8.0, |
|
"eval_steps": 500, |
|
"global_step": 1286, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.6553059643687065, |
|
"eval_f1_macro": 0.34196434919671853, |
|
"eval_f1_micro": 0.6553059643687065, |
|
"eval_f1_weighted": 0.6146575775654787, |
|
"eval_loss": 1.2012524604797363, |
|
"eval_macro_fpr": 0.036531607457408626, |
|
"eval_macro_sensitivity": 0.39029268516816945, |
|
"eval_macro_specificity": 0.9740627875145957, |
|
"eval_precision": 0.6007307052856502, |
|
"eval_precision_macro": 0.32788772117271575, |
|
"eval_recall": 0.6553059643687065, |
|
"eval_recall_macro": 0.39029268516816945, |
|
"eval_runtime": 30.3344, |
|
"eval_samples_per_second": 42.559, |
|
"eval_steps_per_second": 5.34, |
|
"eval_weighted_fpr": 0.03621124582960371, |
|
"eval_weighted_sensitivity": 0.6553059643687065, |
|
"eval_weighted_specificity": 0.9556358483502301, |
|
"step": 160 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.7381874515879163, |
|
"eval_f1_macro": 0.4250111578260666, |
|
"eval_f1_micro": 0.7381874515879164, |
|
"eval_f1_weighted": 0.7236865886821344, |
|
"eval_loss": 0.8278939127922058, |
|
"eval_macro_fpr": 0.024763530819684316, |
|
"eval_macro_sensitivity": 0.46578072689552413, |
|
"eval_macro_specificity": 0.9806295017830671, |
|
"eval_precision": 0.7211273477007717, |
|
"eval_precision_macro": 0.40923635739063985, |
|
"eval_recall": 0.7381874515879163, |
|
"eval_recall_macro": 0.46578072689552413, |
|
"eval_runtime": 34.091, |
|
"eval_samples_per_second": 37.869, |
|
"eval_steps_per_second": 4.752, |
|
"eval_weighted_fpr": 0.024707602339181286, |
|
"eval_weighted_sensitivity": 0.7381874515879163, |
|
"eval_weighted_specificity": 0.9712550751580882, |
|
"step": 321 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.7544539116963594, |
|
"eval_f1_macro": 0.44305220236653187, |
|
"eval_f1_micro": 0.7544539116963594, |
|
"eval_f1_weighted": 0.7304902543811719, |
|
"eval_loss": 0.713018000125885, |
|
"eval_macro_fpr": 0.0233195243156939, |
|
"eval_macro_sensitivity": 0.4769897256873969, |
|
"eval_macro_specificity": 0.9816367201302573, |
|
"eval_precision": 0.7255238407846915, |
|
"eval_precision_macro": 0.4800443784048848, |
|
"eval_recall": 0.7544539116963594, |
|
"eval_recall_macro": 0.4769897256873969, |
|
"eval_runtime": 32.6151, |
|
"eval_samples_per_second": 39.583, |
|
"eval_steps_per_second": 4.967, |
|
"eval_weighted_fpr": 0.02271912850283093, |
|
"eval_weighted_sensitivity": 0.7544539116963594, |
|
"eval_weighted_specificity": 0.9700968902575, |
|
"step": 482 |
|
}, |
|
{ |
|
"epoch": 3.11, |
|
"learning_rate": 3.958333333333333e-05, |
|
"loss": 1.1985, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.7823392718822618, |
|
"eval_f1_macro": 0.5047859025633034, |
|
"eval_f1_micro": 0.7823392718822618, |
|
"eval_f1_weighted": 0.766027283346833, |
|
"eval_loss": 0.6922410726547241, |
|
"eval_macro_fpr": 0.02001637486004151, |
|
"eval_macro_sensitivity": 0.528327896933921, |
|
"eval_macro_specificity": 0.9837585704961105, |
|
"eval_precision": 0.7594430092765442, |
|
"eval_precision_macro": 0.5188076394331661, |
|
"eval_recall": 0.7823392718822618, |
|
"eval_recall_macro": 0.528327896933921, |
|
"eval_runtime": 32.5532, |
|
"eval_samples_per_second": 39.658, |
|
"eval_steps_per_second": 4.976, |
|
"eval_weighted_fpr": 0.019485472574717427, |
|
"eval_weighted_sensitivity": 0.7823392718822618, |
|
"eval_weighted_specificity": 0.9740392855593933, |
|
"step": 643 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.7939581719597212, |
|
"eval_f1_macro": 0.5257108179174788, |
|
"eval_f1_micro": 0.7939581719597211, |
|
"eval_f1_weighted": 0.7717932414170925, |
|
"eval_loss": 0.6710420846939087, |
|
"eval_macro_fpr": 0.018964580711785816, |
|
"eval_macro_sensitivity": 0.5571328425020213, |
|
"eval_macro_specificity": 0.9845265708178329, |
|
"eval_precision": 0.7734327517428056, |
|
"eval_precision_macro": 0.5449998556573111, |
|
"eval_recall": 0.7939581719597212, |
|
"eval_recall_macro": 0.5571328425020213, |
|
"eval_runtime": 33.235, |
|
"eval_samples_per_second": 38.845, |
|
"eval_steps_per_second": 4.874, |
|
"eval_weighted_fpr": 0.018199233716475097, |
|
"eval_weighted_sensitivity": 0.7939581719597212, |
|
"eval_weighted_specificity": 0.9739403903077732, |
|
"step": 803 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.7970565453137103, |
|
"eval_f1_macro": 0.5316254099721903, |
|
"eval_f1_micro": 0.7970565453137104, |
|
"eval_f1_weighted": 0.7789523196246046, |
|
"eval_loss": 0.6454855799674988, |
|
"eval_macro_fpr": 0.018368947118040532, |
|
"eval_macro_sensitivity": 0.5622105847462606, |
|
"eval_macro_specificity": 0.9848273693754934, |
|
"eval_precision": 0.7756987894676903, |
|
"eval_precision_macro": 0.5353415355904975, |
|
"eval_recall": 0.7970565453137103, |
|
"eval_recall_macro": 0.5622105847462606, |
|
"eval_runtime": 33.0425, |
|
"eval_samples_per_second": 39.071, |
|
"eval_steps_per_second": 4.903, |
|
"eval_weighted_fpr": 0.017862012544314153, |
|
"eval_weighted_sensitivity": 0.7970565453137103, |
|
"eval_weighted_specificity": 0.9753539953186898, |
|
"step": 964 |
|
}, |
|
{ |
|
"epoch": 6.22, |
|
"learning_rate": 2.916666666666667e-05, |
|
"loss": 0.5721, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_accuracy": 0.8001549186676995, |
|
"eval_f1_macro": 0.5486067787470349, |
|
"eval_f1_micro": 0.8001549186676995, |
|
"eval_f1_weighted": 0.7845126172395842, |
|
"eval_loss": 0.6394562721252441, |
|
"eval_macro_fpr": 0.01807650265580631, |
|
"eval_macro_sensitivity": 0.5784319115133939, |
|
"eval_macro_specificity": 0.9850891561725063, |
|
"eval_precision": 0.7801018097427485, |
|
"eval_precision_macro": 0.5442815357986059, |
|
"eval_recall": 0.8001549186676995, |
|
"eval_recall_macro": 0.5784319115133939, |
|
"eval_runtime": 32.9727, |
|
"eval_samples_per_second": 39.154, |
|
"eval_steps_per_second": 4.913, |
|
"eval_weighted_fpr": 0.017527173913043478, |
|
"eval_weighted_sensitivity": 0.8001549186676995, |
|
"eval_weighted_specificity": 0.9761824239198935, |
|
"step": 1125 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.8024786986831913, |
|
"eval_f1_macro": 0.5474570084709011, |
|
"eval_f1_micro": 0.8024786986831914, |
|
"eval_f1_weighted": 0.787386582262622, |
|
"eval_loss": 0.6317066550254822, |
|
"eval_macro_fpr": 0.017822080148589308, |
|
"eval_macro_sensitivity": 0.5773035410379497, |
|
"eval_macro_specificity": 0.9852623885220758, |
|
"eval_precision": 0.783268466071204, |
|
"eval_precision_macro": 0.5438628735250125, |
|
"eval_recall": 0.8024786986831913, |
|
"eval_recall_macro": 0.5773035410379497, |
|
"eval_runtime": 33.0187, |
|
"eval_samples_per_second": 39.099, |
|
"eval_steps_per_second": 4.906, |
|
"eval_weighted_fpr": 0.017277593332881633, |
|
"eval_weighted_sensitivity": 0.8024786986831913, |
|
"eval_weighted_specificity": 0.9764571291479465, |
|
"step": 1286 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 2400, |
|
"num_train_epochs": 15, |
|
"save_steps": 500, |
|
"total_flos": 1.1155889738907648e+16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|