Harish Tayyar Madabushi
added model
8977b8e
{
"best_metric": 0.688748846434271,
"best_model_checkpoint": "output-no-git/EN-OUTPUT/ON_FS_OUT/XLNetFalseTrue-0-1/TrueFalse-0/train_from_dev_and_test_short.csv/1/checkpoint-18",
"epoch": 6.0,
"global_step": 18,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_accuracy": 0.7060086131095886,
"eval_f1": 0.6763806868584463,
"eval_f1_binary": 0.7742998352553541,
"eval_f1_weighted": 0.697813633503263,
"eval_loss": 0.6087642312049866,
"eval_runtime": 1.8252,
"eval_samples_per_second": 255.31,
"eval_steps_per_second": 32.325,
"step": 3
},
{
"epoch": 2.0,
"eval_accuracy": 0.7038626670837402,
"eval_f1": 0.6863881086142323,
"eval_f1_binary": 0.7604166666666667,
"eval_f1_weighted": 0.702591784411117,
"eval_loss": 0.5733329057693481,
"eval_runtime": 1.8207,
"eval_samples_per_second": 255.939,
"eval_steps_per_second": 32.404,
"step": 6
},
{
"epoch": 3.0,
"eval_accuracy": 0.7145922780036926,
"eval_f1": 0.6748046823760278,
"eval_f1_binary": 0.7885532591414944,
"eval_f1_weighted": 0.6997024395221171,
"eval_loss": 0.5822879672050476,
"eval_runtime": 1.8268,
"eval_samples_per_second": 255.088,
"eval_steps_per_second": 32.297,
"step": 9
},
{
"epoch": 4.0,
"eval_accuracy": 0.6995708346366882,
"eval_f1": 0.6317370001580527,
"eval_f1_binary": 0.7897897897897898,
"eval_f1_weighted": 0.6663322459572741,
"eval_loss": 0.652556300163269,
"eval_runtime": 1.8238,
"eval_samples_per_second": 255.509,
"eval_steps_per_second": 32.35,
"step": 12
},
{
"epoch": 5.0,
"eval_accuracy": 0.725321888923645,
"eval_f1": 0.6831548529661737,
"eval_f1_binary": 0.7987421383647799,
"eval_f1_weighted": 0.7084550742336797,
"eval_loss": 0.6597227454185486,
"eval_runtime": 1.8184,
"eval_samples_per_second": 256.267,
"eval_steps_per_second": 32.446,
"step": 15
},
{
"epoch": 6.0,
"eval_accuracy": 0.7188841104507446,
"eval_f1": 0.688748846434271,
"eval_f1_binary": 0.7855973813420623,
"eval_f1_weighted": 0.7099474527874785,
"eval_loss": 0.6554996371269226,
"eval_runtime": 1.8291,
"eval_samples_per_second": 254.774,
"eval_steps_per_second": 32.257,
"step": 18
}
],
"max_steps": 27,
"num_train_epochs": 9,
"total_flos": 37176876481536.0,
"trial_name": null,
"trial_params": null
}