{ "best_metric": 0.688748846434271, "best_model_checkpoint": "output-no-git/EN-OUTPUT/ON_FS_OUT/XLNetFalseTrue-0-1/TrueFalse-0/train_from_dev_and_test_short.csv/1/checkpoint-18", "epoch": 6.0, "global_step": 18, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_accuracy": 0.7060086131095886, "eval_f1": 0.6763806868584463, "eval_f1_binary": 0.7742998352553541, "eval_f1_weighted": 0.697813633503263, "eval_loss": 0.6087642312049866, "eval_runtime": 1.8252, "eval_samples_per_second": 255.31, "eval_steps_per_second": 32.325, "step": 3 }, { "epoch": 2.0, "eval_accuracy": 0.7038626670837402, "eval_f1": 0.6863881086142323, "eval_f1_binary": 0.7604166666666667, "eval_f1_weighted": 0.702591784411117, "eval_loss": 0.5733329057693481, "eval_runtime": 1.8207, "eval_samples_per_second": 255.939, "eval_steps_per_second": 32.404, "step": 6 }, { "epoch": 3.0, "eval_accuracy": 0.7145922780036926, "eval_f1": 0.6748046823760278, "eval_f1_binary": 0.7885532591414944, "eval_f1_weighted": 0.6997024395221171, "eval_loss": 0.5822879672050476, "eval_runtime": 1.8268, "eval_samples_per_second": 255.088, "eval_steps_per_second": 32.297, "step": 9 }, { "epoch": 4.0, "eval_accuracy": 0.6995708346366882, "eval_f1": 0.6317370001580527, "eval_f1_binary": 0.7897897897897898, "eval_f1_weighted": 0.6663322459572741, "eval_loss": 0.652556300163269, "eval_runtime": 1.8238, "eval_samples_per_second": 255.509, "eval_steps_per_second": 32.35, "step": 12 }, { "epoch": 5.0, "eval_accuracy": 0.725321888923645, "eval_f1": 0.6831548529661737, "eval_f1_binary": 0.7987421383647799, "eval_f1_weighted": 0.7084550742336797, "eval_loss": 0.6597227454185486, "eval_runtime": 1.8184, "eval_samples_per_second": 256.267, "eval_steps_per_second": 32.446, "step": 15 }, { "epoch": 6.0, "eval_accuracy": 0.7188841104507446, "eval_f1": 0.688748846434271, "eval_f1_binary": 0.7855973813420623, "eval_f1_weighted": 0.7099474527874785, "eval_loss": 0.6554996371269226, "eval_runtime": 1.8291, "eval_samples_per_second": 254.774, "eval_steps_per_second": 32.257, "step": 18 } ], "max_steps": 27, "num_train_epochs": 9, "total_flos": 37176876481536.0, "trial_name": null, "trial_params": null }