|
{ |
|
"best_metric": 0.1276090443134308, |
|
"best_model_checkpoint": "/home1/datawork/mcontini/models/multilabel/huggingface/dinov2-giant-2024_01_02-kornia_img-size518_batch-size32_epochs20_freeze/checkpoint-5360", |
|
"epoch": 20.0, |
|
"eval_steps": 500, |
|
"global_step": 5360, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.4055019649874955, |
|
"eval_f1_macro": 0.5114163498644834, |
|
"eval_f1_micro": 0.6258493771234429, |
|
"eval_loss": 0.22310702502727509, |
|
"eval_roc_auc": 0.7462668565240048, |
|
"eval_runtime": 1321.1574, |
|
"eval_samples_per_second": 2.119, |
|
"eval_steps_per_second": 0.067, |
|
"learning_rate": 0.01, |
|
"step": 268 |
|
}, |
|
{ |
|
"epoch": 1.87, |
|
"learning_rate": 0.01, |
|
"loss": 0.2273, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.38120757413361916, |
|
"eval_f1_macro": 0.45109440187622923, |
|
"eval_f1_micro": 0.6105779637780503, |
|
"eval_loss": 0.25052765011787415, |
|
"eval_roc_auc": 0.7359905994056075, |
|
"eval_runtime": 1321.0391, |
|
"eval_samples_per_second": 2.119, |
|
"eval_steps_per_second": 0.067, |
|
"learning_rate": 0.01, |
|
"step": 536 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.41764916041443373, |
|
"eval_f1_macro": 0.6951782991070653, |
|
"eval_f1_micro": 0.7531037857011804, |
|
"eval_loss": 0.17819169163703918, |
|
"eval_roc_auc": 0.8424985182786072, |
|
"eval_runtime": 1324.6672, |
|
"eval_samples_per_second": 2.113, |
|
"eval_steps_per_second": 0.066, |
|
"learning_rate": 0.01, |
|
"step": 804 |
|
}, |
|
{ |
|
"epoch": 3.73, |
|
"learning_rate": 0.01, |
|
"loss": 0.196, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.4240800285816363, |
|
"eval_f1_macro": 0.6667105102591024, |
|
"eval_f1_micro": 0.7645973453961074, |
|
"eval_loss": 0.15775558352470398, |
|
"eval_roc_auc": 0.8561540860224954, |
|
"eval_runtime": 1324.5164, |
|
"eval_samples_per_second": 2.113, |
|
"eval_steps_per_second": 0.066, |
|
"learning_rate": 0.01, |
|
"step": 1072 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.3551268310110754, |
|
"eval_f1_macro": 0.6462786847563172, |
|
"eval_f1_micro": 0.7289891034631567, |
|
"eval_loss": 0.1978054791688919, |
|
"eval_roc_auc": 0.8616257579280331, |
|
"eval_runtime": 1318.8019, |
|
"eval_samples_per_second": 2.122, |
|
"eval_steps_per_second": 0.067, |
|
"learning_rate": 0.01, |
|
"step": 1340 |
|
}, |
|
{ |
|
"epoch": 5.6, |
|
"learning_rate": 0.01, |
|
"loss": 0.1916, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.45480528760271527, |
|
"eval_f1_macro": 0.6154722345590861, |
|
"eval_f1_micro": 0.7533968253968253, |
|
"eval_loss": 0.1570044308900833, |
|
"eval_roc_auc": 0.8332111249225472, |
|
"eval_runtime": 1322.0736, |
|
"eval_samples_per_second": 2.117, |
|
"eval_steps_per_second": 0.067, |
|
"learning_rate": 0.01, |
|
"step": 1608 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_accuracy": 0.4076455877098964, |
|
"eval_f1_macro": 0.7033703129441511, |
|
"eval_f1_micro": 0.7711244893571275, |
|
"eval_loss": 0.17040091753005981, |
|
"eval_roc_auc": 0.8893350315039463, |
|
"eval_runtime": 1321.072, |
|
"eval_samples_per_second": 2.119, |
|
"eval_steps_per_second": 0.067, |
|
"learning_rate": 0.01, |
|
"step": 1876 |
|
}, |
|
{ |
|
"epoch": 7.46, |
|
"learning_rate": 0.01, |
|
"loss": 0.1935, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.44873168988924617, |
|
"eval_f1_macro": 0.7240467456541528, |
|
"eval_f1_micro": 0.7782660807031561, |
|
"eval_loss": 0.1583939492702484, |
|
"eval_roc_auc": 0.87591640182751, |
|
"eval_runtime": 1324.3647, |
|
"eval_samples_per_second": 2.113, |
|
"eval_steps_per_second": 0.066, |
|
"learning_rate": 0.01, |
|
"step": 2144 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_accuracy": 0.44337263308324404, |
|
"eval_f1_macro": 0.7026377863872897, |
|
"eval_f1_micro": 0.7724530831099197, |
|
"eval_loss": 0.16136306524276733, |
|
"eval_roc_auc": 0.878715414884403, |
|
"eval_runtime": 1334.0015, |
|
"eval_samples_per_second": 2.098, |
|
"eval_steps_per_second": 0.066, |
|
"learning_rate": 0.01, |
|
"step": 2412 |
|
}, |
|
{ |
|
"epoch": 9.33, |
|
"learning_rate": 0.01, |
|
"loss": 0.1945, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_accuracy": 0.43658449446230796, |
|
"eval_f1_macro": 0.6244582432023046, |
|
"eval_f1_micro": 0.743831546311846, |
|
"eval_loss": 0.1569277048110962, |
|
"eval_roc_auc": 0.8239477455598103, |
|
"eval_runtime": 1341.7823, |
|
"eval_samples_per_second": 2.086, |
|
"eval_steps_per_second": 0.066, |
|
"learning_rate": 0.01, |
|
"step": 2680 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_accuracy": 0.42979635584137194, |
|
"eval_f1_macro": 0.6986025660751581, |
|
"eval_f1_micro": 0.763875932835821, |
|
"eval_loss": 0.1665951907634735, |
|
"eval_roc_auc": 0.8613857432852049, |
|
"eval_runtime": 1333.2352, |
|
"eval_samples_per_second": 2.099, |
|
"eval_steps_per_second": 0.066, |
|
"learning_rate": 0.01, |
|
"step": 2948 |
|
}, |
|
{ |
|
"epoch": 11.19, |
|
"learning_rate": 0.01, |
|
"loss": 0.1951, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_accuracy": 0.44765987852804573, |
|
"eval_f1_macro": 0.6291100964373895, |
|
"eval_f1_micro": 0.744811534234176, |
|
"eval_loss": 0.15847544372081757, |
|
"eval_roc_auc": 0.8242335503635296, |
|
"eval_runtime": 1336.9094, |
|
"eval_samples_per_second": 2.094, |
|
"eval_steps_per_second": 0.066, |
|
"learning_rate": 0.01, |
|
"step": 3216 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_accuracy": 0.43801357627724186, |
|
"eval_f1_macro": 0.6650314316976844, |
|
"eval_f1_micro": 0.7623590633130962, |
|
"eval_loss": 0.15646952390670776, |
|
"eval_roc_auc": 0.844307766178341, |
|
"eval_runtime": 1326.5168, |
|
"eval_samples_per_second": 2.11, |
|
"eval_steps_per_second": 0.066, |
|
"learning_rate": 0.01, |
|
"step": 3484 |
|
}, |
|
{ |
|
"epoch": 13.06, |
|
"learning_rate": 0.01, |
|
"loss": 0.1953, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_accuracy": 0.4465880671668453, |
|
"eval_f1_macro": 0.5021716379213181, |
|
"eval_f1_micro": 0.6728278270994033, |
|
"eval_loss": 0.17276929318904877, |
|
"eval_roc_auc": 0.7638863294586612, |
|
"eval_runtime": 1334.5311, |
|
"eval_samples_per_second": 2.097, |
|
"eval_steps_per_second": 0.066, |
|
"learning_rate": 0.01, |
|
"step": 3752 |
|
}, |
|
{ |
|
"epoch": 14.93, |
|
"learning_rate": 0.01, |
|
"loss": 0.1945, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_accuracy": 0.4555198285101822, |
|
"eval_f1_macro": 0.6523865470596933, |
|
"eval_f1_micro": 0.7441088615997346, |
|
"eval_loss": 0.15650007128715515, |
|
"eval_roc_auc": 0.8176688310877148, |
|
"eval_runtime": 1329.7371, |
|
"eval_samples_per_second": 2.105, |
|
"eval_steps_per_second": 0.066, |
|
"learning_rate": 0.01, |
|
"step": 4020 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_accuracy": 0.4580207216863165, |
|
"eval_f1_macro": 0.643940672540041, |
|
"eval_f1_micro": 0.7514664626370825, |
|
"eval_loss": 0.15759296715259552, |
|
"eval_roc_auc": 0.8311410282106092, |
|
"eval_runtime": 1337.597, |
|
"eval_samples_per_second": 2.093, |
|
"eval_steps_per_second": 0.066, |
|
"learning_rate": 0.01, |
|
"step": 4288 |
|
}, |
|
{ |
|
"epoch": 16.79, |
|
"learning_rate": 0.01, |
|
"loss": 0.1929, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_accuracy": 0.43122543765630583, |
|
"eval_f1_macro": 0.5707187678300992, |
|
"eval_f1_micro": 0.7358732093873818, |
|
"eval_loss": 0.17005115747451782, |
|
"eval_roc_auc": 0.833709678625855, |
|
"eval_runtime": 1326.7318, |
|
"eval_samples_per_second": 2.11, |
|
"eval_steps_per_second": 0.066, |
|
"learning_rate": 0.01, |
|
"step": 4556 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_accuracy": 0.42300821722043586, |
|
"eval_f1_macro": 0.6533638646137062, |
|
"eval_f1_micro": 0.7531492248062015, |
|
"eval_loss": 0.15990640223026276, |
|
"eval_roc_auc": 0.8450542243393845, |
|
"eval_runtime": 1329.7371, |
|
"eval_samples_per_second": 2.105, |
|
"eval_steps_per_second": 0.066, |
|
"learning_rate": 0.01, |
|
"step": 4824 |
|
}, |
|
{ |
|
"epoch": 18.66, |
|
"learning_rate": 0.01, |
|
"loss": 0.1952, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_accuracy": 0.45480528760271527, |
|
"eval_f1_macro": 0.6657705432619248, |
|
"eval_f1_micro": 0.7347428800106717, |
|
"eval_loss": 0.16034173965454102, |
|
"eval_roc_auc": 0.8117717147474299, |
|
"eval_runtime": 1328.0617, |
|
"eval_samples_per_second": 2.108, |
|
"eval_steps_per_second": 0.066, |
|
"learning_rate": 0.01, |
|
"step": 5092 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_accuracy": 0.5262593783494105, |
|
"eval_f1_macro": 0.7676828961065644, |
|
"eval_f1_micro": 0.8133643372904173, |
|
"eval_loss": 0.1276090443134308, |
|
"eval_roc_auc": 0.8759327417838362, |
|
"eval_runtime": 1330.6724, |
|
"eval_samples_per_second": 2.103, |
|
"eval_steps_per_second": 0.066, |
|
"learning_rate": 0.001, |
|
"step": 5360 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"learning_rate": 0.001, |
|
"step": 5360, |
|
"total_flos": 9.454976615476292e+20, |
|
"train_loss": 0.07645123254007367, |
|
"train_runtime": 44768.9701, |
|
"train_samples_per_second": 3.828, |
|
"train_steps_per_second": 0.12 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 5360, |
|
"num_train_epochs": 20, |
|
"save_steps": 500, |
|
"total_flos": 9.454976615476292e+20, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|