{ "best_metric": null, "best_model_checkpoint": null, "epoch": 10.0, "global_step": 910, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_accuracy": 0.9533894011551323, "eval_f1": 0.6969990319457888, "eval_loss": 0.20486080646514893, "eval_precision": 0.6617647058823529, "eval_recall": 0.7361963190184049, "eval_runtime": 1.2373, "eval_samples_per_second": 130.123, "eval_steps_per_second": 33.137, "step": 91 }, { "epoch": 1.1, "learning_rate": 4.4505494505494504e-05, "loss": 0.5036, "step": 100 }, { "epoch": 2.0, "eval_accuracy": 0.9722362954706657, "eval_f1": 0.8234146341463414, "eval_loss": 0.11564752459526062, "eval_precision": 0.7873134328358209, "eval_recall": 0.8629856850715747, "eval_runtime": 1.2367, "eval_samples_per_second": 130.181, "eval_steps_per_second": 33.152, "step": 182 }, { "epoch": 2.2, "learning_rate": 3.901098901098901e-05, "loss": 0.1442, "step": 200 }, { "epoch": 3.0, "eval_accuracy": 0.9771000101327388, "eval_f1": 0.8632812499999999, "eval_loss": 0.10779214650392532, "eval_precision": 0.8261682242990654, "eval_recall": 0.9038854805725971, "eval_runtime": 1.2508, "eval_samples_per_second": 128.715, "eval_steps_per_second": 32.778, "step": 273 }, { "epoch": 3.3, "learning_rate": 3.3516483516483513e-05, "loss": 0.0757, "step": 300 }, { "epoch": 4.0, "eval_accuracy": 0.9780119566318776, "eval_f1": 0.8851148851148851, "eval_loss": 0.1178947389125824, "eval_precision": 0.865234375, "eval_recall": 0.9059304703476483, "eval_runtime": 1.2453, "eval_samples_per_second": 129.288, "eval_steps_per_second": 32.924, "step": 364 }, { "epoch": 4.4, "learning_rate": 2.8021978021978025e-05, "loss": 0.0526, "step": 400 }, { "epoch": 5.0, "eval_accuracy": 0.9836862904042962, "eval_f1": 0.897876643073812, "eval_loss": 0.0906740128993988, "eval_precision": 0.888, "eval_recall": 0.9079754601226994, "eval_runtime": 1.2584, "eval_samples_per_second": 127.94, "eval_steps_per_second": 32.581, "step": 455 }, { "epoch": 5.49, "learning_rate": 2.252747252747253e-05, "loss": 0.0342, "step": 500 }, { "epoch": 6.0, "eval_accuracy": 0.9831796534603303, "eval_f1": 0.9130869130869131, "eval_loss": 0.0972292423248291, "eval_precision": 0.892578125, "eval_recall": 0.934560327198364, "eval_runtime": 1.2748, "eval_samples_per_second": 126.296, "eval_steps_per_second": 32.162, "step": 546 }, { "epoch": 6.59, "learning_rate": 1.7032967032967035e-05, "loss": 0.0245, "step": 600 }, { "epoch": 7.0, "eval_accuracy": 0.9833823082379167, "eval_f1": 0.9107321965897693, "eval_loss": 0.10643576085567474, "eval_precision": 0.8937007874015748, "eval_recall": 0.9284253578732107, "eval_runtime": 1.2478, "eval_samples_per_second": 129.031, "eval_steps_per_second": 32.859, "step": 637 }, { "epoch": 7.69, "learning_rate": 1.153846153846154e-05, "loss": 0.0188, "step": 700 }, { "epoch": 8.0, "eval_accuracy": 0.9850035464586078, "eval_f1": 0.9169169169169169, "eval_loss": 0.09653466939926147, "eval_precision": 0.8980392156862745, "eval_recall": 0.9366053169734151, "eval_runtime": 1.2451, "eval_samples_per_second": 129.306, "eval_steps_per_second": 32.929, "step": 728 }, { "epoch": 8.79, "learning_rate": 6.043956043956044e-06, "loss": 0.0159, "step": 800 }, { "epoch": 9.0, "eval_accuracy": 0.984598236903435, "eval_f1": 0.9201213346814965, "eval_loss": 0.09986742585897446, "eval_precision": 0.91, "eval_recall": 0.9304703476482618, "eval_runtime": 1.2461, "eval_samples_per_second": 129.208, "eval_steps_per_second": 32.904, "step": 819 }, { "epoch": 9.89, "learning_rate": 5.494505494505495e-07, "loss": 0.0141, "step": 900 }, { "epoch": 10.0, "eval_accuracy": 0.985104873847401, "eval_f1": 0.911088911088911, "eval_loss": 0.09563781321048737, "eval_precision": 0.890625, "eval_recall": 0.9325153374233128, "eval_runtime": 1.2493, "eval_samples_per_second": 128.877, "eval_steps_per_second": 32.819, "step": 910 }, { "epoch": 10.0, "step": 910, "total_flos": 1883034567828480.0, "train_loss": 0.09724931471295409, "train_runtime": 322.9196, "train_samples_per_second": 44.624, "train_steps_per_second": 2.818 } ], "max_steps": 910, "num_train_epochs": 10, "total_flos": 1883034567828480.0, "trial_name": null, "trial_params": null }