{ "best_metric": 0.27679798007011414, "best_model_checkpoint": "spa_en_mBERT/checkpoint-4480", "epoch": 6.0, "global_step": 5376, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.56, "learning_rate": 1.988839285714286e-05, "loss": 1.015, "step": 500 }, { "epoch": 1.0, "eval_accuracy": 0.8975234842015372, "eval_f1": 0.7030225599300675, "eval_loss": 0.40301570296287537, "eval_precision": 0.7149695684879983, "eval_recall": 0.691468253968254, "eval_runtime": 5.8245, "eval_samples_per_second": 283.973, "eval_steps_per_second": 17.856, "step": 896 }, { "epoch": 1.12, "learning_rate": 1.9776785714285716e-05, "loss": 0.466, "step": 1000 }, { "epoch": 1.67, "learning_rate": 1.9665178571428575e-05, "loss": 0.3444, "step": 1500 }, { "epoch": 2.0, "eval_accuracy": 0.9197465890810875, "eval_f1": 0.772121694173792, "eval_loss": 0.30006563663482666, "eval_precision": 0.7738142686329215, "eval_recall": 0.770436507936508, "eval_runtime": 5.9225, "eval_samples_per_second": 279.276, "eval_steps_per_second": 17.56, "step": 1792 }, { "epoch": 2.23, "learning_rate": 1.955357142857143e-05, "loss": 0.2916, "step": 2000 }, { "epoch": 2.79, "learning_rate": 1.944196428571429e-05, "loss": 0.2491, "step": 2500 }, { "epoch": 3.0, "eval_accuracy": 0.9214545310110619, "eval_f1": 0.7768938768773725, "eval_loss": 0.2882336974143982, "eval_precision": 0.7754859967051071, "eval_recall": 0.7783068783068783, "eval_runtime": 5.8599, "eval_samples_per_second": 282.259, "eval_steps_per_second": 17.748, "step": 2688 }, { "epoch": 3.35, "learning_rate": 1.9330357142857144e-05, "loss": 0.2111, "step": 3000 }, { "epoch": 3.91, "learning_rate": 1.9218750000000003e-05, "loss": 0.1889, "step": 3500 }, { "epoch": 4.0, "eval_accuracy": 0.9311659682640557, "eval_f1": 0.8087478559176673, "eval_loss": 0.279913067817688, "eval_precision": 0.8067254540668597, "eval_recall": 0.8107804232804233, "eval_runtime": 5.8665, "eval_samples_per_second": 281.939, "eval_steps_per_second": 17.728, "step": 3584 }, { "epoch": 4.46, "learning_rate": 1.910714285714286e-05, "loss": 0.1683, "step": 4000 }, { "epoch": 5.0, "eval_accuracy": 0.9332115266220483, "eval_f1": 0.8155864706270193, "eval_loss": 0.27679798007011414, "eval_precision": 0.8130669120546865, "eval_recall": 0.8181216931216931, "eval_runtime": 6.0326, "eval_samples_per_second": 274.178, "eval_steps_per_second": 17.24, "step": 4480 }, { "epoch": 5.02, "learning_rate": 1.8995535714285717e-05, "loss": 0.1568, "step": 4500 }, { "epoch": 5.58, "learning_rate": 1.8883928571428573e-05, "loss": 0.1313, "step": 5000 }, { "epoch": 6.0, "eval_accuracy": 0.9282068595714257, "eval_f1": 0.7986634908032288, "eval_loss": 0.30244389176368713, "eval_precision": 0.7989806724913953, "eval_recall": 0.7983465608465609, "eval_runtime": 5.8739, "eval_samples_per_second": 281.583, "eval_steps_per_second": 17.705, "step": 5376 } ], "max_steps": 89600, "num_train_epochs": 100, "total_flos": 3919265715030336.0, "trial_name": null, "trial_params": null }