{ "best_metric": null, "best_model_checkpoint": null, "epoch": 4.0, "global_step": 4992, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.4, "learning_rate": 2.4750000000000002e-05, "loss": 1.0323, "step": 500 }, { "epoch": 0.8, "learning_rate": 4.975e-05, "loss": 0.8721, "step": 1000 }, { "epoch": 1.0, "eval_accuracy": 0.6721768379211426, "eval_loss": 0.8143573999404907, "eval_runtime": 184.4068, "eval_samples_per_second": 54.456, "step": 1248 }, { "epoch": 1.2, "learning_rate": 4.38001002004008e-05, "loss": 0.7668, "step": 1500 }, { "epoch": 1.6, "learning_rate": 3.7537575150300605e-05, "loss": 0.6107, "step": 2000 }, { "epoch": 2.0, "eval_accuracy": 0.7067317366600037, "eval_loss": 0.8285614252090454, "eval_runtime": 184.2958, "eval_samples_per_second": 54.488, "step": 2496 }, { "epoch": 2.0, "learning_rate": 3.12875751503006e-05, "loss": 0.5935, "step": 2500 }, { "epoch": 2.4, "learning_rate": 2.5025050100200405e-05, "loss": 0.2335, "step": 3000 }, { "epoch": 2.8, "learning_rate": 1.8762525050100204e-05, "loss": 0.2216, "step": 3500 }, { "epoch": 3.0, "eval_accuracy": 0.731925904750824, "eval_loss": 1.0460597276687622, "eval_runtime": 184.6236, "eval_samples_per_second": 54.392, "step": 3744 }, { "epoch": 3.21, "learning_rate": 1.25e-05, "loss": 0.1372, "step": 4000 }, { "epoch": 3.61, "learning_rate": 6.2374749498998e-06, "loss": 0.0771, "step": 4500 }, { "epoch": 4.0, "eval_accuracy": 0.7498506307601929, "eval_loss": 1.6021397113800049, "eval_runtime": 184.1793, "eval_samples_per_second": 54.523, "step": 4992 }, { "epoch": 4.0, "step": 4992, "total_flos": 0, "train_runtime": 4895.7804, "train_samples_per_second": 1.02 } ], "max_steps": 4992, "num_train_epochs": 4, "total_flos": 0, "trial_name": null, "trial_params": null }