Harish Tayyar Madabushi
added model
b9616c4
{
"best_metric": 0.8225606853879106,
"best_model_checkpoint": "output-no-git/EN-OUTPUT/xlnet-base-cased/FalseTrue-0/1/checkpoint-312",
"epoch": 3.0,
"global_step": 312,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_accuracy": 0.7875536680221558,
"eval_f1": 0.7775119963347881,
"eval_f1_binary": 0.8247787610619469,
"eval_f1_weighted": 0.7878579405454538,
"eval_loss": 0.5327664017677307,
"eval_runtime": 1.8369,
"eval_samples_per_second": 253.685,
"eval_steps_per_second": 32.119,
"step": 104
},
{
"epoch": 2.0,
"eval_accuracy": 0.7982832789421082,
"eval_f1": 0.7889492753623188,
"eval_f1_binary": 0.8333333333333334,
"eval_f1_weighted": 0.7986642408409529,
"eval_loss": 1.0078827142715454,
"eval_runtime": 1.83,
"eval_samples_per_second": 254.641,
"eval_steps_per_second": 32.24,
"step": 208
},
{
"epoch": 3.0,
"eval_accuracy": 0.8283261656761169,
"eval_f1": 0.8225606853879106,
"eval_f1_binary": 0.8545454545454546,
"eval_f1_weighted": 0.8295616434438536,
"eval_loss": 0.77229905128479,
"eval_runtime": 1.8293,
"eval_samples_per_second": 254.742,
"eval_steps_per_second": 32.253,
"step": 312
}
],
"max_steps": 936,
"num_train_epochs": 9,
"total_flos": 710847517552128.0,
"trial_name": null,
"trial_params": null
}