ThaiFood-Image-captioning / trainer_state.json
TeetouchQQ's picture
Upload trainer_state.json
e9c907c
raw history blame
No virus
2.53 kB
{
"best_metric": 0.976475715637207,
"best_model_checkpoint": "microsoft-swin-base-patch4-window7-224_bert-base-multilingual-cased_bert-base-multilingual-cased/checkpoint-3864",
"epoch": 6.0,
"global_step": 3864,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.78,
"learning_rate": 3.923136645962734e-05,
"loss": 2.2925,
"step": 500
},
{
"epoch": 1.0,
"eval_loss": 1.6365079879760742,
"eval_runtime": 232.7485,
"eval_samples_per_second": 11.068,
"eval_steps_per_second": 0.692,
"step": 644
},
{
"epoch": 1.55,
"learning_rate": 3.845496894409938e-05,
"loss": 1.4969,
"step": 1000
},
{
"epoch": 2.0,
"eval_loss": 1.3718241453170776,
"eval_runtime": 40.4125,
"eval_samples_per_second": 63.743,
"eval_steps_per_second": 3.984,
"step": 1288
},
{
"epoch": 2.33,
"learning_rate": 3.7678571428571433e-05,
"loss": 1.2926,
"step": 1500
},
{
"epoch": 3.0,
"eval_loss": 1.1062968969345093,
"eval_runtime": 40.4904,
"eval_samples_per_second": 63.62,
"eval_steps_per_second": 3.976,
"step": 1932
},
{
"epoch": 3.11,
"learning_rate": 3.690217391304348e-05,
"loss": 1.1515,
"step": 2000
},
{
"epoch": 3.88,
"learning_rate": 3.612577639751553e-05,
"loss": 1.0376,
"step": 2500
},
{
"epoch": 4.0,
"eval_loss": 1.0416237115859985,
"eval_runtime": 40.3883,
"eval_samples_per_second": 63.781,
"eval_steps_per_second": 3.986,
"step": 2576
},
{
"epoch": 4.66,
"learning_rate": 3.534937888198758e-05,
"loss": 0.9386,
"step": 3000
},
{
"epoch": 5.0,
"eval_loss": 1.0240283012390137,
"eval_runtime": 40.487,
"eval_samples_per_second": 63.625,
"eval_steps_per_second": 3.977,
"step": 3220
},
{
"epoch": 5.43,
"learning_rate": 3.4572981366459633e-05,
"loss": 0.867,
"step": 3500
},
{
"epoch": 6.0,
"eval_loss": 0.976475715637207,
"eval_runtime": 40.4063,
"eval_samples_per_second": 63.752,
"eval_steps_per_second": 3.985,
"step": 3864
}
],
"max_steps": 25760,
"num_train_epochs": 40,
"total_flos": 1.1256086855275315e+19,
"trial_name": null,
"trial_params": null
}