{ "best_metric": 0.14741940796375275, "best_model_checkpoint": "./trained_models/twitter-emotion-deberta-v3-base/checkpoint-500", "epoch": 6.0, "global_step": 1200, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.5, "eval_accuracy": 0.8405, "eval_loss": 0.5359936952590942, "eval_runtime": 4.1757, "eval_samples_per_second": 478.965, "eval_steps_per_second": 5.987, "step": 100 }, { "epoch": 1.0, "eval_accuracy": 0.915, "eval_loss": 0.28240880370140076, "eval_runtime": 4.2049, "eval_samples_per_second": 475.638, "eval_steps_per_second": 5.945, "step": 200 }, { "epoch": 1.5, "eval_accuracy": 0.93, "eval_loss": 0.19999809563159943, "eval_runtime": 4.2283, "eval_samples_per_second": 473.002, "eval_steps_per_second": 5.913, "step": 300 }, { "epoch": 2.0, "eval_accuracy": 0.936, "eval_loss": 0.13397051393985748, "eval_runtime": 4.2488, "eval_samples_per_second": 470.716, "eval_steps_per_second": 5.884, "step": 400 }, { "epoch": 2.5, "learning_rate": 2.916666666666667e-05, "loss": 0.4142, "step": 500 }, { "epoch": 2.5, "eval_accuracy": 0.937, "eval_loss": 0.14741940796375275, "eval_runtime": 4.2278, "eval_samples_per_second": 473.054, "eval_steps_per_second": 5.913, "step": 500 }, { "epoch": 3.0, "eval_accuracy": 0.936, "eval_loss": 0.15366272628307343, "eval_runtime": 4.2318, "eval_samples_per_second": 472.612, "eval_steps_per_second": 5.908, "step": 600 }, { "epoch": 3.5, "eval_accuracy": 0.939, "eval_loss": 0.13712549209594727, "eval_runtime": 4.2434, "eval_samples_per_second": 471.315, "eval_steps_per_second": 5.891, "step": 700 }, { "epoch": 4.0, "eval_accuracy": 0.941, "eval_loss": 0.13440823554992676, "eval_runtime": 4.2389, "eval_samples_per_second": 471.816, "eval_steps_per_second": 5.898, "step": 800 }, { "epoch": 4.5, "eval_accuracy": 0.939, "eval_loss": 0.13154806196689606, "eval_runtime": 4.244, "eval_samples_per_second": 471.257, "eval_steps_per_second": 5.891, "step": 900 }, { "epoch": 5.0, "learning_rate": 8.333333333333334e-06, "loss": 0.1013, "step": 1000 }, { "epoch": 5.0, "eval_accuracy": 0.936, "eval_loss": 0.15716207027435303, "eval_runtime": 4.2453, "eval_samples_per_second": 471.109, "eval_steps_per_second": 5.889, "step": 1000 }, { "epoch": 5.5, "eval_accuracy": 0.938, "eval_loss": 0.15671509504318237, "eval_runtime": 4.2362, "eval_samples_per_second": 472.124, "eval_steps_per_second": 5.902, "step": 1100 }, { "epoch": 6.0, "eval_accuracy": 0.939, "eval_loss": 0.15347838401794434, "eval_runtime": 4.2428, "eval_samples_per_second": 471.385, "eval_steps_per_second": 5.892, "step": 1200 }, { "epoch": 6.0, "step": 1200, "total_flos": 6907037114880000.0, "train_loss": 0.2273927664756775, "train_runtime": 627.7316, "train_samples_per_second": 152.932, "train_steps_per_second": 1.912 } ], "max_steps": 1200, "num_train_epochs": 6, "total_flos": 6907037114880000.0, "trial_name": null, "trial_params": null }