{ "best_metric": null, "best_model_checkpoint": null, "epoch": 4.998331664998331, "global_step": 1870, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "learning_rate": 2.8126709206927986e-06, "loss": 1.792, "step": 374 }, { "epoch": 1.0, "eval_accuracy": 0.2750904902928595, "eval_f1_score": 0.17558198955755575, "eval_loss": 1.792249083518982, "eval_runtime": 351.3884, "eval_samples_per_second": 8.649, "eval_steps_per_second": 2.163, "step": 374 }, { "epoch": 2.0, "learning_rate": 2.5569735642661806e-06, "loss": 1.7923, "step": 748 }, { "epoch": 2.0, "eval_accuracy": 0.2750904902928595, "eval_f1_score": 0.15209869477487561, "eval_loss": 1.7973285913467407, "eval_runtime": 349.7493, "eval_samples_per_second": 8.689, "eval_steps_per_second": 2.173, "step": 748 }, { "epoch": 3.0, "learning_rate": 2.3012762078395626e-06, "loss": 1.7867, "step": 1122 }, { "epoch": 3.0, "eval_accuracy": 0.39486673247778875, "eval_f1_score": 0.1978644849001168, "eval_loss": 1.773677110671997, "eval_runtime": 345.3478, "eval_samples_per_second": 8.8, "eval_steps_per_second": 2.201, "step": 1122 }, { "epoch": 4.0, "learning_rate": 2.0455788514129442e-06, "loss": 1.7681, "step": 1496 }, { "epoch": 4.0, "eval_accuracy": 0.49950641658440276, "eval_f1_score": 0.21909607145469126, "eval_loss": 1.751068115234375, "eval_runtime": 344.7764, "eval_samples_per_second": 8.814, "eval_steps_per_second": 2.204, "step": 1496 }, { "epoch": 5.0, "learning_rate": 1.7898814949863265e-06, "loss": 1.7286, "step": 1870 } ], "max_steps": 4488, "num_train_epochs": 12, "total_flos": 9.102887348352e+18, "trial_name": null, "trial_params": null }