{ "best_metric": 0.6570678460213344, "best_model_checkpoint": "FS_OUT/harish/PT-UP-xlmR-ContextIncluded_IdiomExcluded-4_BEST/TrueFalse-0/4/checkpoint-45", "epoch": 9.0, "global_step": 45, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_accuracy": 0.5567765831947327, "eval_f1": 0.5578118336364079, "eval_loss": 0.6907439827919006, "eval_runtime": 0.7876, "eval_samples_per_second": 346.644, "eval_steps_per_second": 44.442, "step": 5 }, { "epoch": 2.0, "eval_accuracy": 0.5787546038627625, "eval_f1": 0.4448845849320908, "eval_loss": 0.665475606918335, "eval_runtime": 0.7917, "eval_samples_per_second": 344.817, "eval_steps_per_second": 44.207, "step": 10 }, { "epoch": 3.0, "eval_accuracy": 0.622710645198822, "eval_f1": 0.5963622262791237, "eval_loss": 0.6525125503540039, "eval_runtime": 0.7838, "eval_samples_per_second": 348.295, "eval_steps_per_second": 44.653, "step": 15 }, { "epoch": 4.0, "eval_accuracy": 0.5970696210861206, "eval_f1": 0.5985724185724186, "eval_loss": 0.6665695309638977, "eval_runtime": 0.7871, "eval_samples_per_second": 346.827, "eval_steps_per_second": 44.465, "step": 20 }, { "epoch": 5.0, "eval_accuracy": 0.593406617641449, "eval_f1": 0.5940832214099966, "eval_loss": 0.6762897372245789, "eval_runtime": 0.7899, "eval_samples_per_second": 345.632, "eval_steps_per_second": 44.312, "step": 25 }, { "epoch": 6.0, "eval_accuracy": 0.6336996555328369, "eval_f1": 0.6314261706515927, "eval_loss": 0.6941685676574707, "eval_runtime": 0.7926, "eval_samples_per_second": 344.418, "eval_steps_per_second": 44.156, "step": 30 }, { "epoch": 7.0, "eval_accuracy": 0.6446886658668518, "eval_f1": 0.645882102061817, "eval_loss": 0.754807710647583, "eval_runtime": 0.7972, "eval_samples_per_second": 342.457, "eval_steps_per_second": 43.905, "step": 35 }, { "epoch": 8.0, "eval_accuracy": 0.6446886658668518, "eval_f1": 0.645882102061817, "eval_loss": 0.7887275815010071, "eval_runtime": 0.7852, "eval_samples_per_second": 347.667, "eval_steps_per_second": 44.573, "step": 40 }, { "epoch": 9.0, "eval_accuracy": 0.6556776762008667, "eval_f1": 0.6570678460213344, "eval_loss": 0.7924347519874573, "eval_runtime": 0.7913, "eval_samples_per_second": 345.022, "eval_steps_per_second": 44.234, "step": 45 } ], "max_steps": 45, "num_train_epochs": 9, "total_flos": 92351980431360.0, "trial_name": null, "trial_params": null }