{ "best_metric": 0.7565779291131405, "best_model_checkpoint": "output-no-git/EN-OUTPUT/distilbert-base-cased/FalseTrue-0/2/checkpoint-520", "epoch": 5.0, "global_step": 520, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_accuracy": 0.7446351647377014, "eval_f1": 0.7378445712448767, "eval_f1_binary": 0.7800369685767097, "eval_f1_weighted": 0.7470798170127886, "eval_loss": 0.7295559048652649, "eval_runtime": 0.9453, "eval_samples_per_second": 492.97, "eval_steps_per_second": 62.415, "step": 104 }, { "epoch": 2.0, "eval_accuracy": 0.7424892783164978, "eval_f1": 0.7401728463897408, "eval_f1_binary": 0.7647058823529411, "eval_f1_weighted": 0.7455427383816858, "eval_loss": 0.9534124732017517, "eval_runtime": 0.7364, "eval_samples_per_second": 632.823, "eval_steps_per_second": 80.121, "step": 208 }, { "epoch": 3.0, "eval_accuracy": 0.7618025541305542, "eval_f1": 0.7543816329922364, "eval_f1_binary": 0.7970749542961609, "eval_f1_weighted": 0.7637265230630523, "eval_loss": 1.0867007970809937, "eval_runtime": 0.736, "eval_samples_per_second": 633.169, "eval_steps_per_second": 80.165, "step": 312 }, { "epoch": 4.0, "eval_accuracy": 0.7532188892364502, "eval_f1": 0.7470105321795617, "eval_f1_binary": 0.7866419294990724, "eval_f1_weighted": 0.7556852157130167, "eval_loss": 1.2413438558578491, "eval_runtime": 0.7367, "eval_samples_per_second": 632.508, "eval_steps_per_second": 80.082, "step": 416 }, { "epoch": 4.81, "learning_rate": 9.316239316239318e-06, "loss": 0.1347, "step": 500 }, { "epoch": 5.0, "eval_accuracy": 0.7682403326034546, "eval_f1": 0.7565779291131405, "eval_f1_binary": 0.8098591549295775, "eval_f1_weighted": 0.7682403433476395, "eval_loss": 1.2424249649047852, "eval_runtime": 0.7359, "eval_samples_per_second": 633.202, "eval_steps_per_second": 80.169, "step": 520 } ], "max_steps": 936, "num_train_epochs": 9, "total_flos": 550898794160640.0, "trial_name": null, "trial_params": null }