File size: 2,653 Bytes
04378e2 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 |
{
"best_metric": 0.7140781182094741,
"best_model_checkpoint": "OUTPUT/xlm-roberta-base/FalseTrue-0/0/checkpoint-296",
"epoch": 8.0,
"global_step": 296,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_accuracy": 0.5641025900840759,
"eval_f1": 0.4068936527952921,
"eval_loss": 0.6925989985466003,
"eval_runtime": 0.8159,
"eval_samples_per_second": 334.599,
"eval_steps_per_second": 42.897,
"step": 37
},
{
"epoch": 2.0,
"eval_accuracy": 0.5641025900840759,
"eval_f1": 0.4068936527952921,
"eval_loss": 0.7125938534736633,
"eval_runtime": 0.8146,
"eval_samples_per_second": 335.145,
"eval_steps_per_second": 42.967,
"step": 74
},
{
"epoch": 3.0,
"eval_accuracy": 0.5604395866394043,
"eval_f1": 0.4052004333694475,
"eval_loss": 0.7705000042915344,
"eval_runtime": 0.8132,
"eval_samples_per_second": 335.709,
"eval_steps_per_second": 43.04,
"step": 111
},
{
"epoch": 4.0,
"eval_accuracy": 0.7142857313156128,
"eval_f1": 0.7028323699421966,
"eval_loss": 0.8162457346916199,
"eval_runtime": 0.814,
"eval_samples_per_second": 335.389,
"eval_steps_per_second": 42.999,
"step": 148
},
{
"epoch": 5.0,
"eval_accuracy": 0.7069597244262695,
"eval_f1": 0.6908952629291613,
"eval_loss": 1.4020615816116333,
"eval_runtime": 0.8166,
"eval_samples_per_second": 334.305,
"eval_steps_per_second": 42.86,
"step": 185
},
{
"epoch": 6.0,
"eval_accuracy": 0.721611738204956,
"eval_f1": 0.7063504997827033,
"eval_loss": 1.4205191135406494,
"eval_runtime": 0.8137,
"eval_samples_per_second": 335.499,
"eval_steps_per_second": 43.013,
"step": 222
},
{
"epoch": 7.0,
"eval_accuracy": 0.7252747416496277,
"eval_f1": 0.7118124041200964,
"eval_loss": 1.5443077087402344,
"eval_runtime": 0.8137,
"eval_samples_per_second": 335.506,
"eval_steps_per_second": 43.014,
"step": 259
},
{
"epoch": 8.0,
"eval_accuracy": 0.7289377450942993,
"eval_f1": 0.7140781182094741,
"eval_loss": 1.6495815515518188,
"eval_runtime": 0.8093,
"eval_samples_per_second": 337.346,
"eval_steps_per_second": 43.249,
"step": 296
}
],
"max_steps": 333,
"num_train_epochs": 9,
"total_flos": 1988472400920576.0,
"trial_name": null,
"trial_params": null
}
|