PT-UP-xlmR-FalseFalse-0_0_BEST / trainer_state.json
Harish Tayyar Madabushi
added modle
2b0f74d
{
"best_metric": 0.6019402643037202,
"best_model_checkpoint": "OUTPUT/xlm-roberta-base/FalseFalse-0/0/checkpoint-185",
"epoch": 5.0,
"global_step": 185,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_accuracy": 0.5641025900840759,
"eval_f1": 0.4068936527952921,
"eval_loss": 0.7115342617034912,
"eval_runtime": 0.8107,
"eval_samples_per_second": 336.765,
"eval_steps_per_second": 43.175,
"step": 37
},
{
"epoch": 2.0,
"eval_accuracy": 0.5641025900840759,
"eval_f1": 0.4068936527952921,
"eval_loss": 0.7905893921852112,
"eval_runtime": 0.8099,
"eval_samples_per_second": 337.067,
"eval_steps_per_second": 43.214,
"step": 74
},
{
"epoch": 3.0,
"eval_accuracy": 0.553113579750061,
"eval_f1": 0.547169190727473,
"eval_loss": 0.7051942944526672,
"eval_runtime": 0.8079,
"eval_samples_per_second": 337.926,
"eval_steps_per_second": 43.324,
"step": 111
},
{
"epoch": 4.0,
"eval_accuracy": 0.5897436141967773,
"eval_f1": 0.5815671023417899,
"eval_loss": 1.058557391166687,
"eval_runtime": 0.8079,
"eval_samples_per_second": 337.916,
"eval_steps_per_second": 43.323,
"step": 148
},
{
"epoch": 5.0,
"eval_accuracy": 0.6043956279754639,
"eval_f1": 0.6019402643037202,
"eval_loss": 1.1202752590179443,
"eval_runtime": 0.8093,
"eval_samples_per_second": 337.327,
"eval_steps_per_second": 43.247,
"step": 185
}
],
"max_steps": 333,
"num_train_epochs": 9,
"total_flos": 1242795250575360.0,
"trial_name": null,
"trial_params": null
}