{ "best_metric": 0.7736625514403291, "best_model_checkpoint": "OS_OUT/harish/PT-UP-xlmR-FalseFalse-0_0_BEST/FalseFalse-0/2/checkpoint-40", "epoch": 8.0, "global_step": 40, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_accuracy": 0.6300366520881653, "eval_f1": 0.597609561752988, "eval_loss": 0.6447749137878418, "eval_runtime": 0.7675, "eval_samples_per_second": 355.702, "eval_steps_per_second": 45.603, "step": 5 }, { "epoch": 2.0, "eval_accuracy": 0.6813187003135681, "eval_f1": 0.6200873362445415, "eval_loss": 0.5641180872917175, "eval_runtime": 0.7675, "eval_samples_per_second": 355.721, "eval_steps_per_second": 45.605, "step": 10 }, { "epoch": 3.0, "eval_accuracy": 0.7289377450942993, "eval_f1": 0.6372549019607843, "eval_loss": 0.5698391795158386, "eval_runtime": 0.7673, "eval_samples_per_second": 355.789, "eval_steps_per_second": 45.614, "step": 15 }, { "epoch": 4.0, "eval_accuracy": 0.7289377450942993, "eval_f1": 0.7153846153846154, "eval_loss": 0.5229743719100952, "eval_runtime": 0.7688, "eval_samples_per_second": 355.082, "eval_steps_per_second": 45.523, "step": 20 }, { "epoch": 5.0, "eval_accuracy": 0.7582417726516724, "eval_f1": 0.7421875, "eval_loss": 0.5236229300498962, "eval_runtime": 0.7675, "eval_samples_per_second": 355.716, "eval_steps_per_second": 45.605, "step": 25 }, { "epoch": 6.0, "eval_accuracy": 0.7655677795410156, "eval_f1": 0.719298245614035, "eval_loss": 0.5164700150489807, "eval_runtime": 0.7779, "eval_samples_per_second": 350.939, "eval_steps_per_second": 44.992, "step": 30 }, { "epoch": 7.0, "eval_accuracy": 0.791208803653717, "eval_f1": 0.7673469387755103, "eval_loss": 0.5138589143753052, "eval_runtime": 0.7778, "eval_samples_per_second": 350.983, "eval_steps_per_second": 44.998, "step": 35 }, { "epoch": 8.0, "eval_accuracy": 0.7985348105430603, "eval_f1": 0.7736625514403291, "eval_loss": 0.5282412767410278, "eval_runtime": 0.7588, "eval_samples_per_second": 359.786, "eval_steps_per_second": 46.126, "step": 40 } ], "max_steps": 45, "num_train_epochs": 9, "total_flos": 82090649272320.0, "trial_name": null, "trial_params": null }