{ "best_metric": 0.8242820390801596, "best_model_checkpoint": "turkish_multilabel_intent_bert-base-turkish-128k-uncased/checkpoint-384", "epoch": 2.887218045112782, "global_step": 384, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.24, "learning_rate": 4.7987362585716124e-05, "loss": 0.0139, "step": 32 }, { "epoch": 0.24, "eval_loss": 0.009882427752017975, "eval_macro f1": 0.3392960248919277, "eval_micro f1": 0.7193911317008603, "eval_runtime": 2.3212, "eval_samples_per_second": 461.408, "eval_steps_per_second": 7.324, "step": 32 }, { "epoch": 0.48, "learning_rate": 4.491617138023029e-05, "loss": 0.0082, "step": 64 }, { "epoch": 0.48, "eval_loss": 0.00571652315557003, "eval_macro f1": 0.5888766985486856, "eval_micro f1": 0.8291472868217056, "eval_runtime": 2.3143, "eval_samples_per_second": 462.783, "eval_steps_per_second": 7.346, "step": 64 }, { "epoch": 0.72, "learning_rate": 4.184498017474446e-05, "loss": 0.0062, "step": 96 }, { "epoch": 0.72, "eval_loss": 0.004936754237860441, "eval_macro f1": 0.6479513036422692, "eval_micro f1": 0.8529040404040404, "eval_runtime": 2.335, "eval_samples_per_second": 458.676, "eval_steps_per_second": 7.281, "step": 96 }, { "epoch": 0.96, "learning_rate": 3.877378896925863e-05, "loss": 0.0046, "step": 128 }, { "epoch": 0.96, "eval_loss": 0.0039069755002856255, "eval_macro f1": 0.7036941962393284, "eval_micro f1": 0.8735053492762743, "eval_runtime": 2.3196, "eval_samples_per_second": 461.727, "eval_steps_per_second": 7.329, "step": 128 }, { "epoch": 1.2, "learning_rate": 3.57025977637728e-05, "loss": 0.0035, "step": 160 }, { "epoch": 1.2, "eval_loss": 0.003501879284158349, "eval_macro f1": 0.7315796800388726, "eval_micro f1": 0.8865718799368089, "eval_runtime": 2.316, "eval_samples_per_second": 462.435, "eval_steps_per_second": 7.34, "step": 160 }, { "epoch": 1.44, "learning_rate": 3.263140655828696e-05, "loss": 0.0037, "step": 192 }, { "epoch": 1.44, "eval_loss": 0.0034342026337981224, "eval_macro f1": 0.7462213705474623, "eval_micro f1": 0.8902361199744736, "eval_runtime": 2.392, "eval_samples_per_second": 447.74, "eval_steps_per_second": 7.107, "step": 192 }, { "epoch": 1.68, "learning_rate": 2.956021535280113e-05, "loss": 0.0032, "step": 224 }, { "epoch": 1.68, "eval_loss": 0.0032742032781243324, "eval_macro f1": 0.7279673266730304, "eval_micro f1": 0.8998085513720486, "eval_runtime": 2.3105, "eval_samples_per_second": 463.546, "eval_steps_per_second": 7.358, "step": 224 }, { "epoch": 1.92, "learning_rate": 2.64890241473153e-05, "loss": 0.0033, "step": 256 }, { "epoch": 1.92, "eval_loss": 0.003130522323772311, "eval_macro f1": 0.7717739019762423, "eval_micro f1": 0.912258064516129, "eval_runtime": 2.3, "eval_samples_per_second": 465.662, "eval_steps_per_second": 7.391, "step": 256 }, { "epoch": 2.17, "learning_rate": 2.3417832941829465e-05, "loss": 0.0025, "step": 288 }, { "epoch": 2.17, "eval_loss": 0.0031702849082648754, "eval_macro f1": 0.7845634595933292, "eval_micro f1": 0.9168036829990136, "eval_runtime": 2.3461, "eval_samples_per_second": 456.499, "eval_steps_per_second": 7.246, "step": 288 }, { "epoch": 2.41, "learning_rate": 2.0346641736343635e-05, "loss": 0.0022, "step": 320 }, { "epoch": 2.41, "eval_loss": 0.0030924060847610235, "eval_macro f1": 0.7838887334413882, "eval_micro f1": 0.9131561892417368, "eval_runtime": 2.2918, "eval_samples_per_second": 467.308, "eval_steps_per_second": 7.418, "step": 320 }, { "epoch": 2.65, "learning_rate": 1.7275450530857802e-05, "loss": 0.0022, "step": 352 }, { "epoch": 2.65, "eval_loss": 0.0030099288560450077, "eval_macro f1": 0.7712848231573721, "eval_micro f1": 0.908565928777671, "eval_runtime": 2.3124, "eval_samples_per_second": 463.146, "eval_steps_per_second": 7.352, "step": 352 }, { "epoch": 2.89, "learning_rate": 1.420425932537197e-05, "loss": 0.0022, "step": 384 }, { "epoch": 2.89, "eval_loss": 0.0029520909301936626, "eval_macro f1": 0.8242820390801596, "eval_micro f1": 0.913988964621876, "eval_runtime": 2.3289, "eval_samples_per_second": 459.872, "eval_steps_per_second": 7.3, "step": 384 } ], "max_steps": 532, "num_train_epochs": 4, "total_flos": 630598146840000.0, "trial_name": null, "trial_params": null }