{ "best_metric": 0.9597055019401054, "best_model_checkpoint": "/scratch/mrahma45/pixel/finetuned_models/mbert/mbert-base-finetuned-masakhaner-conll_2003_en/checkpoint-2000", "epoch": 6.83371298405467, "global_step": 3000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.46, "eval_accuracy_score": 0.9880261672053269, "eval_f1": 0.9325536848472628, "eval_loss": 0.05282844603061676, "eval_precision": 0.9440702184119208, "eval_recall": 0.9213147410358565, "eval_runtime": 45.1558, "eval_samples_per_second": 71.973, "eval_steps_per_second": 9.013, "step": 200 }, { "epoch": 0.91, "eval_accuracy_score": 0.9911218410498034, "eval_f1": 0.9478570017776022, "eval_loss": 0.03281404450535774, "eval_precision": 0.9398746572659616, "eval_recall": 0.9559760956175298, "eval_runtime": 45.2247, "eval_samples_per_second": 71.863, "eval_steps_per_second": 9.0, "step": 400 }, { "epoch": 1.14, "learning_rate": 4.865771812080537e-05, "loss": 0.1432, "step": 500 }, { "epoch": 1.37, "eval_accuracy_score": 0.9911607803434446, "eval_f1": 0.9469395866454691, "eval_loss": 0.03454526141285896, "eval_precision": 0.9446867565424266, "eval_recall": 0.9492031872509961, "eval_runtime": 45.0931, "eval_samples_per_second": 72.073, "eval_steps_per_second": 9.026, "step": 600 }, { "epoch": 1.82, "eval_accuracy_score": 0.9924457770336046, "eval_f1": 0.9525887720690339, "eval_loss": 0.03193691000342369, "eval_precision": 0.9486369024101146, "eval_recall": 0.9565737051792829, "eval_runtime": 45.1422, "eval_samples_per_second": 71.995, "eval_steps_per_second": 9.016, "step": 800 }, { "epoch": 2.28, "learning_rate": 4.697986577181208e-05, "loss": 0.0248, "step": 1000 }, { "epoch": 2.28, "eval_accuracy_score": 0.9919979751567306, "eval_f1": 0.9510281116519319, "eval_loss": 0.03897447884082794, "eval_precision": 0.9484842480681593, "eval_recall": 0.9535856573705179, "eval_runtime": 45.33, "eval_samples_per_second": 71.696, "eval_steps_per_second": 8.979, "step": 1000 }, { "epoch": 2.73, "eval_accuracy_score": 0.9928741092636579, "eval_f1": 0.955820895522388, "eval_loss": 0.03231716528534889, "eval_precision": 0.9548707753479125, "eval_recall": 0.9567729083665338, "eval_runtime": 45.1734, "eval_samples_per_second": 71.945, "eval_steps_per_second": 9.01, "step": 1200 }, { "epoch": 3.19, "eval_accuracy_score": 0.9924068377399634, "eval_f1": 0.9529388403494836, "eval_loss": 0.03496513515710831, "eval_precision": 0.9499208234362628, "eval_recall": 0.9559760956175298, "eval_runtime": 45.4093, "eval_samples_per_second": 71.571, "eval_steps_per_second": 8.963, "step": 1400 }, { "epoch": 3.42, "learning_rate": 4.530201342281879e-05, "loss": 0.0137, "step": 1500 }, { "epoch": 3.64, "eval_accuracy_score": 0.9919395662162689, "eval_f1": 0.9535965172652617, "eval_loss": 0.035889387130737305, "eval_precision": 0.9473166896009436, "eval_recall": 0.9599601593625497, "eval_runtime": 45.1155, "eval_samples_per_second": 72.037, "eval_steps_per_second": 9.021, "step": 1600 }, { "epoch": 4.1, "eval_accuracy_score": 0.9932245629064289, "eval_f1": 0.9622116149562451, "eval_loss": 0.03680919110774994, "eval_precision": 0.9606830818109611, "eval_recall": 0.9637450199203187, "eval_runtime": 45.2409, "eval_samples_per_second": 71.838, "eval_steps_per_second": 8.996, "step": 1800 }, { "epoch": 4.56, "learning_rate": 4.36241610738255e-05, "loss": 0.009, "step": 2000 }, { "epoch": 4.56, "eval_accuracy_score": 0.9931272146723259, "eval_f1": 0.9597055019401054, "eval_loss": 0.03970629721879959, "eval_precision": 0.958656330749354, "eval_recall": 0.9607569721115538, "eval_runtime": 45.2082, "eval_samples_per_second": 71.89, "eval_steps_per_second": 9.003, "step": 2000 }, { "epoch": 5.01, "eval_accuracy_score": 0.9928157003231961, "eval_f1": 0.9558970265416085, "eval_loss": 0.034936945885419846, "eval_precision": 0.9576169532187125, "eval_recall": 0.954183266932271, "eval_runtime": 45.2011, "eval_samples_per_second": 71.901, "eval_steps_per_second": 9.004, "step": 2200 }, { "epoch": 5.47, "eval_accuracy_score": 0.9927378217359137, "eval_f1": 0.9555819948443386, "eval_loss": 0.04039572924375534, "eval_precision": 0.951243584682195, "eval_recall": 0.9599601593625497, "eval_runtime": 45.1221, "eval_samples_per_second": 72.027, "eval_steps_per_second": 9.02, "step": 2400 }, { "epoch": 5.69, "learning_rate": 4.194630872483222e-05, "loss": 0.0068, "step": 2500 }, { "epoch": 5.92, "eval_accuracy_score": 0.9922900198590398, "eval_f1": 0.9525325903074933, "eval_loss": 0.037243932485580444, "eval_precision": 0.9516802545237621, "eval_recall": 0.953386454183267, "eval_runtime": 110.5281, "eval_samples_per_second": 29.404, "eval_steps_per_second": 3.682, "step": 2600 }, { "epoch": 6.38, "eval_accuracy_score": 0.9928157003231961, "eval_f1": 0.9561569959053231, "eval_loss": 0.045760806649923325, "eval_precision": 0.9587422391347887, "eval_recall": 0.9535856573705179, "eval_runtime": 45.0678, "eval_samples_per_second": 72.114, "eval_steps_per_second": 9.031, "step": 2800 }, { "epoch": 6.83, "learning_rate": 4.026845637583892e-05, "loss": 0.0058, "step": 3000 }, { "epoch": 6.83, "eval_accuracy_score": 0.9929909271445816, "eval_f1": 0.957639788697299, "eval_loss": 0.04067611321806908, "eval_precision": 0.9583083981647716, "eval_recall": 0.9569721115537848, "eval_runtime": 45.0199, "eval_samples_per_second": 72.19, "eval_steps_per_second": 9.04, "step": 3000 }, { "epoch": 6.83, "step": 3000, "total_flos": 1.2538334439696384e+16, "train_loss": 0.03388593363761902, "train_runtime": 6160.4656, "train_samples_per_second": 77.916, "train_steps_per_second": 2.435 } ], "max_steps": 15000, "num_train_epochs": 35, "total_flos": 1.2538334439696384e+16, "trial_name": null, "trial_params": null }