{ "best_metric": null, "best_model_checkpoint": null, "epoch": 20.13422818791946, "global_step": 3000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 3.36, "eval_accuracy": 0.9206798866855525, "eval_f1": 0.9303482587064678, "eval_loss": 0.2345595508813858, "eval_precision": 0.919672131147541, "eval_recall": 0.9412751677852349, "eval_report": " precision recall f1-score support\n\n 0 0.92 0.89 0.91 463\n 1 0.92 0.94 0.93 596\n\n accuracy 0.92 1059\n macro avg 0.92 0.92 0.92 1059\nweighted avg 0.92 0.92 0.92 1059\n", "eval_runtime": 8.0364, "eval_samples_per_second": 131.775, "eval_steps_per_second": 8.337, "step": 500 }, { "epoch": 6.71, "learning_rate": 4e-05, "loss": 0.2212, "step": 1000 }, { "epoch": 6.71, "eval_accuracy": 0.9046270066100094, "eval_f1": 0.9141886151231945, "eval_loss": 0.31608325242996216, "eval_precision": 0.9259896729776248, "eval_recall": 0.9026845637583892, "eval_report": " precision recall f1-score support\n\n 0 0.88 0.91 0.89 463\n 1 0.93 0.90 0.91 596\n\n accuracy 0.90 1059\n macro avg 0.90 0.90 0.90 1059\nweighted avg 0.91 0.90 0.90 1059\n", "eval_runtime": 8.0054, "eval_samples_per_second": 132.285, "eval_steps_per_second": 8.369, "step": 1000 }, { "epoch": 10.07, "eval_accuracy": 0.9065155807365439, "eval_f1": 0.9167367535744324, "eval_loss": 0.43374723196029663, "eval_precision": 0.9190556492411467, "eval_recall": 0.9144295302013423, "eval_report": " precision recall f1-score support\n\n 0 0.89 0.90 0.89 463\n 1 0.92 0.91 0.92 596\n\n accuracy 0.91 1059\n macro avg 0.90 0.91 0.91 1059\nweighted avg 0.91 0.91 0.91 1059\n", "eval_runtime": 8.0154, "eval_samples_per_second": 132.12, "eval_steps_per_second": 8.359, "step": 1500 }, { "epoch": 13.42, "learning_rate": 2e-05, "loss": 0.0651, "step": 2000 }, { "epoch": 13.42, "eval_accuracy": 0.9178470254957507, "eval_f1": 0.9271966527196652, "eval_loss": 0.47431105375289917, "eval_precision": 0.9248747913188647, "eval_recall": 0.9295302013422819, "eval_report": " precision recall f1-score support\n\n 0 0.91 0.90 0.91 463\n 1 0.92 0.93 0.93 596\n\n accuracy 0.92 1059\n macro avg 0.92 0.92 0.92 1059\nweighted avg 0.92 0.92 0.92 1059\n", "eval_runtime": 8.0135, "eval_samples_per_second": 132.152, "eval_steps_per_second": 8.361, "step": 2000 }, { "epoch": 16.78, "eval_accuracy": 0.9102927289896129, "eval_f1": 0.9203688181056161, "eval_loss": 0.5537705421447754, "eval_precision": 0.9195979899497487, "eval_recall": 0.9211409395973155, "eval_report": " precision recall f1-score support\n\n 0 0.90 0.90 0.90 463\n 1 0.92 0.92 0.92 596\n\n accuracy 0.91 1059\n macro avg 0.91 0.91 0.91 1059\nweighted avg 0.91 0.91 0.91 1059\n", "eval_runtime": 8.0263, "eval_samples_per_second": 131.941, "eval_steps_per_second": 8.348, "step": 2500 }, { "epoch": 20.13, "learning_rate": 0.0, "loss": 0.0296, "step": 3000 }, { "epoch": 20.13, "eval_accuracy": 0.9102927289896129, "eval_f1": 0.9199663016006739, "eval_loss": 0.6190621256828308, "eval_precision": 0.9238578680203046, "eval_recall": 0.9161073825503355, "eval_report": " precision recall f1-score support\n\n 0 0.89 0.90 0.90 463\n 1 0.92 0.92 0.92 596\n\n accuracy 0.91 1059\n macro avg 0.91 0.91 0.91 1059\nweighted avg 0.91 0.91 0.91 1059\n", "eval_runtime": 8.0249, "eval_samples_per_second": 131.965, "eval_steps_per_second": 8.349, "step": 3000 }, { "epoch": 20.13, "step": 3000, "total_flos": 5.04436515336192e+16, "train_loss": 0.10527635129292806, "train_runtime": 3964.4436, "train_samples_per_second": 48.431, "train_steps_per_second": 0.757 } ], "max_steps": 3000, "num_train_epochs": 21, "total_flos": 5.04436515336192e+16, "trial_name": null, "trial_params": null }