PT-UP-xlmR-TrueTrue-0_4_BEST / trainer_state.json
Harish Tayyar Madabushi
added model
81e97e0
{
"best_metric": 0.7055396916047973,
"best_model_checkpoint": "OUTPUT/xlm-roberta-base/TrueTrue-0/4/checkpoint-185",
"epoch": 5.0,
"global_step": 185,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_accuracy": 0.5641025900840759,
"eval_f1": 0.4068936527952921,
"eval_loss": 0.6910404562950134,
"eval_runtime": 0.8157,
"eval_samples_per_second": 334.668,
"eval_steps_per_second": 42.906,
"step": 37
},
{
"epoch": 2.0,
"eval_accuracy": 0.5641025900840759,
"eval_f1": 0.4068936527952921,
"eval_loss": 0.7116556763648987,
"eval_runtime": 0.8152,
"eval_samples_per_second": 334.895,
"eval_steps_per_second": 42.935,
"step": 74
},
{
"epoch": 3.0,
"eval_accuracy": 0.5641025900840759,
"eval_f1": 0.4068936527952921,
"eval_loss": 0.7275816798210144,
"eval_runtime": 0.8189,
"eval_samples_per_second": 333.376,
"eval_steps_per_second": 42.74,
"step": 111
},
{
"epoch": 4.0,
"eval_accuracy": 0.6410256624221802,
"eval_f1": 0.6183577308621883,
"eval_loss": 0.8214528560638428,
"eval_runtime": 0.8151,
"eval_samples_per_second": 334.93,
"eval_steps_per_second": 42.94,
"step": 148
},
{
"epoch": 5.0,
"eval_accuracy": 0.7142857313156128,
"eval_f1": 0.7055396916047973,
"eval_loss": 1.0689555406570435,
"eval_runtime": 0.8147,
"eval_samples_per_second": 335.111,
"eval_steps_per_second": 42.963,
"step": 185
}
],
"max_steps": 333,
"num_train_epochs": 9,
"total_flos": 1242795250575360.0,
"trial_name": null,
"trial_params": null
}