{ "best_metric": 0.11592021584510803, "best_model_checkpoint": "/home1/datawork/mcontini/models/multilabel/huggingface/dino-large-2023_12_19-kornia_img-size518_batch-size16_epochs20/checkpoint-9112", "epoch": 20.0, "eval_steps": 500, "global_step": 10720, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.93, "learning_rate": 0.01, "loss": 0.2545, "step": 500 }, { "epoch": 1.0, "eval_accuracy": 0.41336191496963204, "eval_f1_macro": 0.5552795713944485, "eval_f1_micro": 0.7016183870529035, "eval_loss": 0.19357216358184814, "eval_roc_auc": 0.7908326703460342, "eval_runtime": 669.1996, "eval_samples_per_second": 4.183, "eval_steps_per_second": 0.262, "learning_rate": 0.01, "step": 536 }, { "epoch": 1.87, "learning_rate": 0.01, "loss": 0.2163, "step": 1000 }, { "epoch": 2.0, "eval_accuracy": 0.4240800285816363, "eval_f1_macro": 0.6939559668202788, "eval_f1_micro": 0.7671674437345306, "eval_loss": 0.16442517936229706, "eval_roc_auc": 0.8668895881413139, "eval_runtime": 667.4861, "eval_samples_per_second": 4.193, "eval_steps_per_second": 0.262, "learning_rate": 0.01, "step": 1072 }, { "epoch": 2.8, "learning_rate": 0.01, "loss": 0.2142, "step": 1500 }, { "epoch": 3.0, "eval_accuracy": 0.4258663808503037, "eval_f1_macro": 0.6226385110394398, "eval_f1_micro": 0.7264495032071437, "eval_loss": 0.17197823524475098, "eval_roc_auc": 0.8209912192682602, "eval_runtime": 671.4241, "eval_samples_per_second": 4.169, "eval_steps_per_second": 0.261, "learning_rate": 0.01, "step": 1608 }, { "epoch": 3.73, "learning_rate": 0.01, "loss": 0.2107, "step": 2000 }, { "epoch": 4.0, "eval_accuracy": 0.40192926045016075, "eval_f1_macro": 0.60556232845899, "eval_f1_micro": 0.7311342592592591, "eval_loss": 0.17794817686080933, "eval_roc_auc": 0.844154343443223, "eval_runtime": 669.3476, "eval_samples_per_second": 4.182, "eval_steps_per_second": 0.261, "learning_rate": 0.01, "step": 2144 }, { "epoch": 4.66, "learning_rate": 0.01, "loss": 0.2117, "step": 2500 }, { "epoch": 5.0, "eval_accuracy": 0.38335119685602, "eval_f1_macro": 0.674484878286151, "eval_f1_micro": 0.754215411654858, "eval_loss": 0.1834840625524521, "eval_roc_auc": 0.8723557298678095, "eval_runtime": 667.4497, "eval_samples_per_second": 4.194, "eval_steps_per_second": 0.262, "learning_rate": 0.01, "step": 2680 }, { "epoch": 5.6, "learning_rate": 0.01, "loss": 0.2171, "step": 3000 }, { "epoch": 6.0, "eval_accuracy": 0.42086459449803504, "eval_f1_macro": 0.595946612091723, "eval_f1_micro": 0.7347275031685679, "eval_loss": 0.1732301414012909, "eval_roc_auc": 0.8236385276926494, "eval_runtime": 665.3111, "eval_samples_per_second": 4.207, "eval_steps_per_second": 0.263, "learning_rate": 0.01, "step": 3216 }, { "epoch": 6.53, "learning_rate": 0.01, "loss": 0.2178, "step": 3500 }, { "epoch": 7.0, "eval_accuracy": 0.3904966059306895, "eval_f1_macro": 0.5932113008464752, "eval_f1_micro": 0.7253084446717382, "eval_loss": 0.2698315978050232, "eval_roc_auc": 0.8165478137957464, "eval_runtime": 666.3656, "eval_samples_per_second": 4.2, "eval_steps_per_second": 0.263, "learning_rate": 0.01, "step": 3752 }, { "epoch": 7.46, "learning_rate": 0.01, "loss": 0.2177, "step": 4000 }, { "epoch": 8.0, "eval_accuracy": 0.4119328331546981, "eval_f1_macro": 0.6280317383192718, "eval_f1_micro": 0.7360358677377172, "eval_loss": 0.19401037693023682, "eval_roc_auc": 0.828564591229026, "eval_runtime": 671.4879, "eval_samples_per_second": 4.168, "eval_steps_per_second": 0.261, "learning_rate": 0.01, "step": 4288 }, { "epoch": 8.4, "learning_rate": 0.001, "loss": 0.212, "step": 4500 }, { "epoch": 9.0, "eval_accuracy": 0.48981779206859594, "eval_f1_macro": 0.7491476401858057, "eval_f1_micro": 0.7992611571232794, "eval_loss": 0.1454659402370453, "eval_roc_auc": 0.8756991587148717, "eval_runtime": 673.1035, "eval_samples_per_second": 4.158, "eval_steps_per_second": 0.26, "learning_rate": 0.001, "step": 4824 }, { "epoch": 9.33, "learning_rate": 0.001, "loss": 0.1761, "step": 5000 }, { "epoch": 10.0, "eval_accuracy": 0.5123258306538049, "eval_f1_macro": 0.7661404438716006, "eval_f1_micro": 0.8116191765647116, "eval_loss": 0.13573050498962402, "eval_roc_auc": 0.8733133406359384, "eval_runtime": 691.4938, "eval_samples_per_second": 4.048, "eval_steps_per_second": 0.253, "learning_rate": 0.001, "step": 5360 }, { "epoch": 10.26, "learning_rate": 0.001, "loss": 0.1681, "step": 5500 }, { "epoch": 11.0, "eval_accuracy": 0.5166130760986066, "eval_f1_macro": 0.7752662433951194, "eval_f1_micro": 0.8151612707282998, "eval_loss": 0.1386074423789978, "eval_roc_auc": 0.8790914856208012, "eval_runtime": 689.8939, "eval_samples_per_second": 4.057, "eval_steps_per_second": 0.254, "learning_rate": 0.001, "step": 5896 }, { "epoch": 11.19, "learning_rate": 0.001, "loss": 0.1579, "step": 6000 }, { "epoch": 12.0, "eval_accuracy": 0.5162558056448732, "eval_f1_macro": 0.7826923679681995, "eval_f1_micro": 0.8219824282092104, "eval_loss": 0.1820007711648941, "eval_roc_auc": 0.8918796772066396, "eval_runtime": 692.3943, "eval_samples_per_second": 4.042, "eval_steps_per_second": 0.253, "learning_rate": 0.001, "step": 6432 }, { "epoch": 12.13, "learning_rate": 0.001, "loss": 0.1553, "step": 6500 }, { "epoch": 13.0, "eval_accuracy": 0.5326902465166131, "eval_f1_macro": 0.7907678649401602, "eval_f1_micro": 0.8296795952782462, "eval_loss": 0.1227828711271286, "eval_roc_auc": 0.8898245747393245, "eval_runtime": 691.2613, "eval_samples_per_second": 4.049, "eval_steps_per_second": 0.253, "learning_rate": 0.001, "step": 6968 }, { "epoch": 13.06, "learning_rate": 0.001, "loss": 0.1517, "step": 7000 }, { "epoch": 13.99, "learning_rate": 0.001, "loss": 0.1512, "step": 7500 }, { "epoch": 14.0, "eval_accuracy": 0.5301893533404788, "eval_f1_macro": 0.7815063263088662, "eval_f1_micro": 0.8257773991358852, "eval_loss": 0.12334247678518295, "eval_roc_auc": 0.8845045355403204, "eval_runtime": 684.2138, "eval_samples_per_second": 4.091, "eval_steps_per_second": 0.256, "learning_rate": 0.001, "step": 7504 }, { "epoch": 14.93, "learning_rate": 0.001, "loss": 0.1508, "step": 8000 }, { "epoch": 15.0, "eval_accuracy": 0.5305466237942122, "eval_f1_macro": 0.7681866841890026, "eval_f1_micro": 0.817921948794432, "eval_loss": 0.12476785480976105, "eval_roc_auc": 0.8739908739957604, "eval_runtime": 690.4773, "eval_samples_per_second": 4.054, "eval_steps_per_second": 0.253, "learning_rate": 0.001, "step": 8040 }, { "epoch": 15.86, "learning_rate": 0.001, "loss": 0.1499, "step": 8500 }, { "epoch": 16.0, "eval_accuracy": 0.5394783851375491, "eval_f1_macro": 0.7902552675483185, "eval_f1_micro": 0.8276715549780336, "eval_loss": 0.11932893097400665, "eval_roc_auc": 0.8805997685784225, "eval_runtime": 690.469, "eval_samples_per_second": 4.054, "eval_steps_per_second": 0.253, "learning_rate": 0.001, "step": 8576 }, { "epoch": 16.79, "learning_rate": 0.001, "loss": 0.1435, "step": 9000 }, { "epoch": 17.0, "eval_accuracy": 0.5380493033226152, "eval_f1_macro": 0.7995743847858905, "eval_f1_micro": 0.8381208681916574, "eval_loss": 0.11592021584510803, "eval_roc_auc": 0.9037053380559585, "eval_runtime": 685.0697, "eval_samples_per_second": 4.086, "eval_steps_per_second": 0.255, "learning_rate": 0.001, "step": 9112 }, { "epoch": 17.72, "learning_rate": 0.001, "loss": 0.1463, "step": 9500 }, { "epoch": 18.0, "eval_accuracy": 0.5480528760271526, "eval_f1_macro": 0.803284244956481, "eval_f1_micro": 0.8392878623842175, "eval_loss": 0.11661119759082794, "eval_roc_auc": 0.8956742640228449, "eval_runtime": 684.4351, "eval_samples_per_second": 4.09, "eval_steps_per_second": 0.256, "learning_rate": 0.001, "step": 9648 }, { "epoch": 18.66, "learning_rate": 0.001, "loss": 0.1423, "step": 10000 }, { "epoch": 19.0, "eval_accuracy": 0.5459092533047517, "eval_f1_macro": 0.8008505005735617, "eval_f1_micro": 0.8327005511328843, "eval_loss": 0.1216365247964859, "eval_roc_auc": 0.8864852456725716, "eval_runtime": 683.4387, "eval_samples_per_second": 4.095, "eval_steps_per_second": 0.256, "learning_rate": 0.001, "step": 10184 }, { "epoch": 19.59, "learning_rate": 0.001, "loss": 0.1444, "step": 10500 }, { "epoch": 20.0, "eval_accuracy": 0.5509110396570204, "eval_f1_macro": 0.801973744395412, "eval_f1_micro": 0.8382846336851095, "eval_loss": 0.1171422228217125, "eval_roc_auc": 0.8907672852306303, "eval_runtime": 675.9942, "eval_samples_per_second": 4.141, "eval_steps_per_second": 0.259, "learning_rate": 0.001, "step": 10720 }, { "epoch": 20.0, "learning_rate": 0.001, "step": 10720, "total_flos": 2.5409000327874334e+20, "train_loss": 0.18060117693089728, "train_runtime": 57213.4657, "train_samples_per_second": 2.995, "train_steps_per_second": 0.187 } ], "logging_steps": 500, "max_steps": 10720, "num_train_epochs": 20, "save_steps": 500, "total_flos": 2.5409000327874334e+20, "trial_name": null, "trial_params": null }