{ "best_metric": 0.3130991458892822, "best_model_checkpoint": "/gdrive/MyDrive/Marefa/Tebyan/models/huggingface/model-xlm-roberta-large/checkpoint-13000", "epoch": 9.0, "global_step": 58500, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "learning_rate": 1.8e-05, "loss": 0.4403, "step": 6500 }, { "epoch": 1.0, "eval_accuracy": 0.900120719929763, "eval_f1": 0.7773765268189059, "eval_loss": 0.3497047424316406, "eval_precision": 0.7735151130839146, "eval_recall": 0.7812766865926558, "eval_runtime": 26.5811, "eval_samples_per_second": 70.99, "eval_steps_per_second": 35.514, "step": 6500 }, { "epoch": 2.0, "learning_rate": 1.6000000000000003e-05, "loss": 0.307, "step": 13000 }, { "epoch": 2.0, "eval_accuracy": 0.904587357330992, "eval_f1": 0.7846807172066689, "eval_loss": 0.3130991458892822, "eval_precision": 0.7710179270554296, "eval_recall": 0.798836464560205, "eval_runtime": 26.8623, "eval_samples_per_second": 70.247, "eval_steps_per_second": 35.142, "step": 13000 }, { "epoch": 3.0, "learning_rate": 1.4e-05, "loss": 0.2386, "step": 19500 }, { "epoch": 3.0, "eval_accuracy": 0.9074187884108867, "eval_f1": 0.7895801055644548, "eval_loss": 0.348012775182724, "eval_precision": 0.7771517187903851, "eval_recall": 0.8024124679760888, "eval_runtime": 26.5101, "eval_samples_per_second": 71.18, "eval_steps_per_second": 35.609, "step": 19500 }, { "epoch": 4.0, "learning_rate": 1.2e-05, "loss": 0.1883, "step": 26000 }, { "epoch": 4.0, "eval_accuracy": 0.9088235294117647, "eval_f1": 0.7946725265301746, "eval_loss": 0.3668019771575928, "eval_precision": 0.7980086114101184, "eval_recall": 0.791364218616567, "eval_runtime": 26.9144, "eval_samples_per_second": 70.111, "eval_steps_per_second": 35.074, "step": 26000 }, { "epoch": 5.0, "learning_rate": 1e-05, "loss": 0.1439, "step": 32500 }, { "epoch": 5.0, "eval_accuracy": 0.9110074626865672, "eval_f1": 0.801425039215165, "eval_loss": 0.40606749057769775, "eval_precision": 0.7984319542300153, "eval_recall": 0.8044406490179334, "eval_runtime": 26.8012, "eval_samples_per_second": 70.407, "eval_steps_per_second": 35.222, "step": 32500 }, { "epoch": 6.0, "learning_rate": 8.000000000000001e-06, "loss": 0.1108, "step": 39000 }, { "epoch": 6.0, "eval_accuracy": 0.9115561896400352, "eval_f1": 0.8033741926980361, "eval_loss": 0.46604597568511963, "eval_precision": 0.7936871712068337, "eval_recall": 0.8133005977796754, "eval_runtime": 26.6526, "eval_samples_per_second": 70.8, "eval_steps_per_second": 35.419, "step": 39000 }, { "epoch": 7.0, "learning_rate": 6e-06, "loss": 0.0825, "step": 45500 }, { "epoch": 7.0, "eval_accuracy": 0.9102502194907814, "eval_f1": 0.8003274619061452, "eval_loss": 0.5183274149894714, "eval_precision": 0.7920652344362553, "eval_recall": 0.8087638770281811, "eval_runtime": 26.7116, "eval_samples_per_second": 70.643, "eval_steps_per_second": 35.34, "step": 45500 }, { "epoch": 8.0, "learning_rate": 4.000000000000001e-06, "loss": 0.0601, "step": 52000 }, { "epoch": 8.0, "eval_accuracy": 0.9106014047410009, "eval_f1": 0.8013862969874699, "eval_loss": 0.5683603882789612, "eval_precision": 0.800575263662512, "eval_recall": 0.802198975234842, "eval_runtime": 26.5594, "eval_samples_per_second": 71.048, "eval_steps_per_second": 35.543, "step": 52000 }, { "epoch": 9.0, "learning_rate": 2.0000000000000003e-06, "loss": 0.0431, "step": 58500 }, { "epoch": 9.0, "eval_accuracy": 0.91078797190518, "eval_f1": 0.8022889236230693, "eval_loss": 0.6140836477279663, "eval_precision": 0.7964862448056388, "eval_recall": 0.8081767719897524, "eval_runtime": 26.6356, "eval_samples_per_second": 70.845, "eval_steps_per_second": 35.441, "step": 58500 } ], "max_steps": 65000, "num_train_epochs": 10, "total_flos": 2.5323970171833972e+16, "trial_name": null, "trial_params": null }