|
{ |
|
"best_metric": 0.6261172643852387, |
|
"best_model_checkpoint": "bart-base-lora/checkpoint-2250", |
|
"epoch": 13.996889580093313, |
|
"eval_steps": 500, |
|
"global_step": 2250, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.611154144074361, |
|
"eval_f1_macro": 0.28705545756004525, |
|
"eval_f1_micro": 0.611154144074361, |
|
"eval_f1_weighted": 0.5574695078229231, |
|
"eval_loss": 1.3204560279846191, |
|
"eval_macro_fpr": 0.046390243375546196, |
|
"eval_macro_sensitivity": 0.302378554842108, |
|
"eval_macro_specificity": 0.9691815961629444, |
|
"eval_precision": 0.5321554731456403, |
|
"eval_precision_macro": 0.2887439395071009, |
|
"eval_recall": 0.611154144074361, |
|
"eval_recall_macro": 0.302378554842108, |
|
"eval_runtime": 45.1674, |
|
"eval_samples_per_second": 28.583, |
|
"eval_steps_per_second": 3.587, |
|
"eval_weighted_fpr": 0.04347073086248701, |
|
"eval_weighted_sensitivity": 0.611154144074361, |
|
"eval_weighted_specificity": 0.9265697983698051, |
|
"step": 160 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.6994577846630519, |
|
"eval_f1_macro": 0.3947617401663212, |
|
"eval_f1_micro": 0.6994577846630519, |
|
"eval_f1_weighted": 0.6807748226338182, |
|
"eval_loss": 0.887535810470581, |
|
"eval_macro_fpr": 0.03062685085400977, |
|
"eval_macro_sensitivity": 0.4253981018601158, |
|
"eval_macro_specificity": 0.977359054380045, |
|
"eval_precision": 0.6728416067370143, |
|
"eval_precision_macro": 0.3822291983692299, |
|
"eval_recall": 0.6994577846630519, |
|
"eval_recall_macro": 0.4253981018601158, |
|
"eval_runtime": 44.0045, |
|
"eval_samples_per_second": 29.338, |
|
"eval_steps_per_second": 3.681, |
|
"eval_weighted_fpr": 0.02977743668457406, |
|
"eval_weighted_sensitivity": 0.6994577846630519, |
|
"eval_weighted_specificity": 0.9609280310376243, |
|
"step": 321 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.7064291247095275, |
|
"eval_f1_macro": 0.39687975393644837, |
|
"eval_f1_micro": 0.7064291247095275, |
|
"eval_f1_weighted": 0.6751887743731854, |
|
"eval_loss": 0.842707633972168, |
|
"eval_macro_fpr": 0.029525759570689643, |
|
"eval_macro_sensitivity": 0.44418263304043937, |
|
"eval_macro_specificity": 0.9780349023882488, |
|
"eval_precision": 0.6951917464608133, |
|
"eval_precision_macro": 0.4131313886422618, |
|
"eval_recall": 0.7064291247095275, |
|
"eval_recall_macro": 0.44418263304043937, |
|
"eval_runtime": 44.2756, |
|
"eval_samples_per_second": 29.158, |
|
"eval_steps_per_second": 3.659, |
|
"eval_weighted_fpr": 0.02882786947592607, |
|
"eval_weighted_sensitivity": 0.7064291247095275, |
|
"eval_weighted_specificity": 0.9640944111142056, |
|
"step": 482 |
|
}, |
|
{ |
|
"epoch": 3.11, |
|
"learning_rate": 3.958333333333333e-05, |
|
"loss": 1.2895, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.7273431448489543, |
|
"eval_f1_macro": 0.42839565617146974, |
|
"eval_f1_micro": 0.7273431448489543, |
|
"eval_f1_weighted": 0.7166656051521775, |
|
"eval_loss": 0.7718679904937744, |
|
"eval_macro_fpr": 0.026373610346420835, |
|
"eval_macro_sensitivity": 0.4597947061276887, |
|
"eval_macro_specificity": 0.9797578098165848, |
|
"eval_precision": 0.7132141916978711, |
|
"eval_precision_macro": 0.41981312370683244, |
|
"eval_recall": 0.7273431448489543, |
|
"eval_recall_macro": 0.4597947061276887, |
|
"eval_runtime": 44.0471, |
|
"eval_samples_per_second": 29.31, |
|
"eval_steps_per_second": 3.678, |
|
"eval_weighted_fpr": 0.026077937472218107, |
|
"eval_weighted_sensitivity": 0.7273431448489543, |
|
"eval_weighted_specificity": 0.9690240023998159, |
|
"step": 643 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.750580945003873, |
|
"eval_f1_macro": 0.5071625387211971, |
|
"eval_f1_micro": 0.750580945003873, |
|
"eval_f1_weighted": 0.7368350875727435, |
|
"eval_loss": 0.7387559413909912, |
|
"eval_macro_fpr": 0.02390193870216418, |
|
"eval_macro_sensitivity": 0.5165232292614671, |
|
"eval_macro_specificity": 0.9813510652812688, |
|
"eval_precision": 0.739991301984922, |
|
"eval_precision_macro": 0.5733174750951799, |
|
"eval_recall": 0.750580945003873, |
|
"eval_recall_macro": 0.5165232292614671, |
|
"eval_runtime": 43.5191, |
|
"eval_samples_per_second": 29.665, |
|
"eval_steps_per_second": 3.723, |
|
"eval_weighted_fpr": 0.023185483870967742, |
|
"eval_weighted_sensitivity": 0.750580945003873, |
|
"eval_weighted_specificity": 0.9696850342151593, |
|
"step": 803 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.7443841982958946, |
|
"eval_f1_macro": 0.508766573370445, |
|
"eval_f1_micro": 0.7443841982958946, |
|
"eval_f1_weighted": 0.726841801268282, |
|
"eval_loss": 0.7526118755340576, |
|
"eval_macro_fpr": 0.024741953499129225, |
|
"eval_macro_sensitivity": 0.5229557335240369, |
|
"eval_macro_specificity": 0.980899976318631, |
|
"eval_precision": 0.7337183019873953, |
|
"eval_precision_macro": 0.5703412270657953, |
|
"eval_recall": 0.7443841982958946, |
|
"eval_recall_macro": 0.5229557335240369, |
|
"eval_runtime": 43.7116, |
|
"eval_samples_per_second": 29.534, |
|
"eval_steps_per_second": 3.706, |
|
"eval_weighted_fpr": 0.023940800928612886, |
|
"eval_weighted_sensitivity": 0.7443841982958946, |
|
"eval_weighted_specificity": 0.9691154464835722, |
|
"step": 964 |
|
}, |
|
{ |
|
"epoch": 6.22, |
|
"learning_rate": 2.916666666666667e-05, |
|
"loss": 0.7332, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_accuracy": 0.7552285050348567, |
|
"eval_f1_macro": 0.5608894910772386, |
|
"eval_f1_micro": 0.7552285050348567, |
|
"eval_f1_weighted": 0.7460771491633669, |
|
"eval_loss": 0.7082085609436035, |
|
"eval_macro_fpr": 0.02329269548734161, |
|
"eval_macro_sensitivity": 0.5727565701904757, |
|
"eval_macro_specificity": 0.9817624646436656, |
|
"eval_precision": 0.7436383222975608, |
|
"eval_precision_macro": 0.5665418243254761, |
|
"eval_recall": 0.7552285050348567, |
|
"eval_recall_macro": 0.5727565701904757, |
|
"eval_runtime": 43.8592, |
|
"eval_samples_per_second": 29.435, |
|
"eval_steps_per_second": 3.694, |
|
"eval_weighted_fpr": 0.02262637834741515, |
|
"eval_weighted_sensitivity": 0.7552285050348567, |
|
"eval_weighted_specificity": 0.9712084646201266, |
|
"step": 1125 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.7583268783888458, |
|
"eval_f1_macro": 0.5755845408528306, |
|
"eval_f1_micro": 0.7583268783888458, |
|
"eval_f1_weighted": 0.7502605827076951, |
|
"eval_loss": 0.7160602807998657, |
|
"eval_macro_fpr": 0.022834923601538912, |
|
"eval_macro_sensitivity": 0.5974764193374731, |
|
"eval_macro_specificity": 0.9820281006961107, |
|
"eval_precision": 0.7489019370925815, |
|
"eval_precision_macro": 0.5641453776326693, |
|
"eval_recall": 0.7583268783888458, |
|
"eval_recall_macro": 0.5974764193374731, |
|
"eval_runtime": 47.4544, |
|
"eval_samples_per_second": 27.205, |
|
"eval_steps_per_second": 3.414, |
|
"eval_weighted_fpr": 0.022257098016835498, |
|
"eval_weighted_sensitivity": 0.7583268783888458, |
|
"eval_weighted_specificity": 0.9720946320528147, |
|
"step": 1286 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_accuracy": 0.7776917118512781, |
|
"eval_f1_macro": 0.5874833340927881, |
|
"eval_f1_micro": 0.7776917118512781, |
|
"eval_f1_weighted": 0.7653015782806978, |
|
"eval_loss": 0.683149516582489, |
|
"eval_macro_fpr": 0.020831516213897273, |
|
"eval_macro_sensitivity": 0.606896137249408, |
|
"eval_macro_specificity": 0.9832816294136357, |
|
"eval_precision": 0.7586915140412427, |
|
"eval_precision_macro": 0.5780981033617572, |
|
"eval_recall": 0.7776917118512781, |
|
"eval_recall_macro": 0.606896137249408, |
|
"eval_runtime": 50.31, |
|
"eval_samples_per_second": 25.661, |
|
"eval_steps_per_second": 3.22, |
|
"eval_weighted_fpr": 0.02000976085895559, |
|
"eval_weighted_sensitivity": 0.7776917118512781, |
|
"eval_weighted_specificity": 0.9715327293532582, |
|
"step": 1446 |
|
}, |
|
{ |
|
"epoch": 9.33, |
|
"learning_rate": 1.8750000000000002e-05, |
|
"loss": 0.6167, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_accuracy": 0.7862122385747483, |
|
"eval_f1_macro": 0.5987413950993845, |
|
"eval_f1_micro": 0.7862122385747482, |
|
"eval_f1_weighted": 0.7753590541094936, |
|
"eval_loss": 0.6683156490325928, |
|
"eval_macro_fpr": 0.019819293314469463, |
|
"eval_macro_sensitivity": 0.617364154098103, |
|
"eval_macro_specificity": 0.9839313497952282, |
|
"eval_precision": 0.7714272913975577, |
|
"eval_precision_macro": 0.5916700769971839, |
|
"eval_recall": 0.7862122385747483, |
|
"eval_recall_macro": 0.617364154098103, |
|
"eval_runtime": 46.3094, |
|
"eval_samples_per_second": 27.878, |
|
"eval_steps_per_second": 3.498, |
|
"eval_weighted_fpr": 0.019052878641446915, |
|
"eval_weighted_sensitivity": 0.7862122385747483, |
|
"eval_weighted_specificity": 0.972758008353676, |
|
"step": 1607 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_accuracy": 0.7761425251742835, |
|
"eval_f1_macro": 0.5945805235654043, |
|
"eval_f1_micro": 0.7761425251742835, |
|
"eval_f1_weighted": 0.7642426809512617, |
|
"eval_loss": 0.6884666085243225, |
|
"eval_macro_fpr": 0.020959556505082782, |
|
"eval_macro_sensitivity": 0.6219516621776988, |
|
"eval_macro_specificity": 0.9832325403042509, |
|
"eval_precision": 0.762752032263232, |
|
"eval_precision_macro": 0.581742682634886, |
|
"eval_recall": 0.7761425251742835, |
|
"eval_recall_macro": 0.6219516621776988, |
|
"eval_runtime": 44.4944, |
|
"eval_samples_per_second": 29.015, |
|
"eval_steps_per_second": 3.641, |
|
"eval_weighted_fpr": 0.02018579311308235, |
|
"eval_weighted_sensitivity": 0.7761425251742835, |
|
"eval_weighted_specificity": 0.9723455793894815, |
|
"step": 1768 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_accuracy": 0.7869868319132456, |
|
"eval_f1_macro": 0.6214234200731922, |
|
"eval_f1_micro": 0.7869868319132455, |
|
"eval_f1_weighted": 0.7764436224395941, |
|
"eval_loss": 0.6829659938812256, |
|
"eval_macro_fpr": 0.01971781574074696, |
|
"eval_macro_sensitivity": 0.6463770170214457, |
|
"eval_macro_specificity": 0.9840270123264785, |
|
"eval_precision": 0.7826408792667282, |
|
"eval_precision_macro": 0.6626773170335125, |
|
"eval_recall": 0.7869868319132456, |
|
"eval_recall_macro": 0.6463770170214457, |
|
"eval_runtime": 43.9944, |
|
"eval_samples_per_second": 29.345, |
|
"eval_steps_per_second": 3.682, |
|
"eval_weighted_fpr": 0.018966825298296436, |
|
"eval_weighted_sensitivity": 0.7869868319132456, |
|
"eval_weighted_specificity": 0.9734183529839338, |
|
"step": 1929 |
|
}, |
|
{ |
|
"epoch": 12.44, |
|
"learning_rate": 8.333333333333334e-06, |
|
"loss": 0.5314, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_accuracy": 0.7916343919442292, |
|
"eval_f1_macro": 0.6110606025775643, |
|
"eval_f1_micro": 0.7916343919442292, |
|
"eval_f1_weighted": 0.7817623460591858, |
|
"eval_loss": 0.660524845123291, |
|
"eval_macro_fpr": 0.01915789146680066, |
|
"eval_macro_sensitivity": 0.6358134270226833, |
|
"eval_macro_specificity": 0.984380207900859, |
|
"eval_precision": 0.7769679723590022, |
|
"eval_precision_macro": 0.5964718375735727, |
|
"eval_recall": 0.7916343919442292, |
|
"eval_recall_macro": 0.6358134270226833, |
|
"eval_runtime": 44.1283, |
|
"eval_samples_per_second": 29.256, |
|
"eval_steps_per_second": 3.671, |
|
"eval_weighted_fpr": 0.01845372847636688, |
|
"eval_weighted_sensitivity": 0.7916343919442292, |
|
"eval_weighted_specificity": 0.9740687265686558, |
|
"step": 2089 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_accuracy": 0.790859798605732, |
|
"eval_f1_macro": 0.6261172643852387, |
|
"eval_f1_micro": 0.790859798605732, |
|
"eval_f1_weighted": 0.780302820536599, |
|
"eval_loss": 0.6614473462104797, |
|
"eval_macro_fpr": 0.019344545099537428, |
|
"eval_macro_sensitivity": 0.6477733385910524, |
|
"eval_macro_specificity": 0.9842490309995476, |
|
"eval_precision": 0.7794397894982683, |
|
"eval_precision_macro": 0.6367821774875876, |
|
"eval_recall": 0.790859798605732, |
|
"eval_recall_macro": 0.6477733385910524, |
|
"eval_runtime": 52.6504, |
|
"eval_samples_per_second": 24.52, |
|
"eval_steps_per_second": 3.077, |
|
"eval_weighted_fpr": 0.018538862949739082, |
|
"eval_weighted_sensitivity": 0.790859798605732, |
|
"eval_weighted_specificity": 0.9728756663874838, |
|
"step": 2250 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 2400, |
|
"num_train_epochs": 15, |
|
"save_steps": 500, |
|
"total_flos": 2.278788590234419e+16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|