deberta-em-large / trainer_state.json
Kerem P
End of training
cb4b708
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 2.980891719745223,
"eval_steps": 500,
"global_step": 234,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 2.98,
"step": 234,
"total_flos": 1751693284868096.0,
"train_loss": 0.17317123087043437,
"train_runtime": 1075.8425,
"train_samples_per_second": 13.97,
"train_steps_per_second": 0.218
}
],
"logging_steps": 500,
"max_steps": 234,
"num_train_epochs": 3,
"save_steps": 500,
"total_flos": 1751693284868096.0,
"trial_name": null,
"trial_params": null
}