{ "best_metric": 0.4894636273384094, "best_model_checkpoint": "autotrain-sentiment-analyzer-reddit/checkpoint-691", "epoch": 1.0, "eval_steps": 500, "global_step": 691, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.05, "grad_norm": 10.44394588470459, "learning_rate": 8.173076923076923e-06, "loss": 0.3149, "step": 34 }, { "epoch": 0.1, "grad_norm": 12.510290145874023, "learning_rate": 1.6346153846153847e-05, "loss": 0.3768, "step": 68 }, { "epoch": 0.15, "grad_norm": 10.982364654541016, "learning_rate": 2.4519230769230768e-05, "loss": 0.3113, "step": 102 }, { "epoch": 0.2, "grad_norm": 14.942676544189453, "learning_rate": 3.269230769230769e-05, "loss": 0.4581, "step": 136 }, { "epoch": 0.25, "grad_norm": 15.461087226867676, "learning_rate": 4.0865384615384615e-05, "loss": 0.5979, "step": 170 }, { "epoch": 0.3, "grad_norm": 51.596256256103516, "learning_rate": 4.9038461538461536e-05, "loss": 0.548, "step": 204 }, { "epoch": 0.34, "grad_norm": 21.773590087890625, "learning_rate": 4.9195710455764076e-05, "loss": 0.5489, "step": 238 }, { "epoch": 0.39, "grad_norm": 11.456461906433105, "learning_rate": 4.8284182305630025e-05, "loss": 0.6068, "step": 272 }, { "epoch": 0.44, "grad_norm": 15.925763130187988, "learning_rate": 4.737265415549598e-05, "loss": 0.5067, "step": 306 }, { "epoch": 0.49, "grad_norm": 15.808685302734375, "learning_rate": 4.6461126005361935e-05, "loss": 0.5312, "step": 340 }, { "epoch": 0.54, "grad_norm": 53.43648910522461, "learning_rate": 4.554959785522788e-05, "loss": 0.4574, "step": 374 }, { "epoch": 0.59, "grad_norm": 4.778822898864746, "learning_rate": 4.463806970509384e-05, "loss": 0.6492, "step": 408 }, { "epoch": 0.64, "grad_norm": 9.234722137451172, "learning_rate": 4.3726541554959786e-05, "loss": 0.6046, "step": 442 }, { "epoch": 0.69, "grad_norm": 8.603498458862305, "learning_rate": 4.281501340482574e-05, "loss": 0.5429, "step": 476 }, { "epoch": 0.74, "grad_norm": 23.032926559448242, "learning_rate": 4.1903485254691696e-05, "loss": 0.5069, "step": 510 }, { "epoch": 0.79, "grad_norm": 3.559593915939331, "learning_rate": 4.0991957104557644e-05, "loss": 0.5562, "step": 544 }, { "epoch": 0.84, "grad_norm": 14.31966495513916, "learning_rate": 4.008042895442359e-05, "loss": 0.4328, "step": 578 }, { "epoch": 0.89, "grad_norm": 16.031381607055664, "learning_rate": 3.916890080428954e-05, "loss": 0.5084, "step": 612 }, { "epoch": 0.93, "grad_norm": 6.348935127258301, "learning_rate": 3.8257372654155496e-05, "loss": 0.5242, "step": 646 }, { "epoch": 0.98, "grad_norm": 20.074831008911133, "learning_rate": 3.734584450402145e-05, "loss": 0.5023, "step": 680 }, { "epoch": 1.0, "eval_accuracy": 0.8096960926193922, "eval_f1_macro": 0.7895193987806856, "eval_f1_micro": 0.8096960926193921, "eval_f1_weighted": 0.8045465713974906, "eval_loss": 0.4894636273384094, "eval_precision_macro": 0.814875613105015, "eval_precision_micro": 0.8096960926193922, "eval_precision_weighted": 0.8193628961020867, "eval_recall_macro": 0.7801134533159866, "eval_recall_micro": 0.8096960926193922, "eval_recall_weighted": 0.8096960926193922, "eval_runtime": 321.1321, "eval_samples_per_second": 4.304, "eval_steps_per_second": 0.271, "step": 691 } ], "logging_steps": 34, "max_steps": 2073, "num_input_tokens_seen": 0, "num_train_epochs": 3, "save_steps": 500, "total_flos": 363491186591232.0, "train_batch_size": 8, "trial_name": null, "trial_params": null }