tyzhu's picture
Training in progress, epoch 2, checkpoint
31c4477 verified
raw
history blame
No virus
2.19 kB
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 2.0,
"eval_steps": 500,
"global_step": 1058,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.19,
"learning_rate": 3e-05,
"loss": 1.7194,
"step": 100
},
{
"epoch": 0.38,
"learning_rate": 3e-05,
"loss": 1.4369,
"step": 200
},
{
"epoch": 0.57,
"learning_rate": 3e-05,
"loss": 1.4257,
"step": 300
},
{
"epoch": 0.76,
"learning_rate": 3e-05,
"loss": 1.3947,
"step": 400
},
{
"epoch": 0.95,
"learning_rate": 3e-05,
"loss": 1.3948,
"step": 500
},
{
"epoch": 1.0,
"eval_accuracy": 0.6132307692307692,
"eval_loss": 1.3087366819381714,
"eval_runtime": 4.3553,
"eval_samples_per_second": 114.803,
"eval_steps_per_second": 14.465,
"step": 529
},
{
"epoch": 1.0,
"eval_exact_match": 24.4,
"eval_f1": 37.614420394420414,
"step": 529
},
{
"epoch": 1.13,
"learning_rate": 3e-05,
"loss": 1.3927,
"step": 600
},
{
"epoch": 1.32,
"learning_rate": 3e-05,
"loss": 1.3644,
"step": 700
},
{
"epoch": 1.51,
"learning_rate": 3e-05,
"loss": 1.3791,
"step": 800
},
{
"epoch": 1.7,
"learning_rate": 3e-05,
"loss": 1.3627,
"step": 900
},
{
"epoch": 1.89,
"learning_rate": 3e-05,
"loss": 1.3789,
"step": 1000
},
{
"epoch": 2.0,
"eval_accuracy": 0.6146153846153846,
"eval_loss": 1.289727807044983,
"eval_runtime": 4.4281,
"eval_samples_per_second": 112.915,
"eval_steps_per_second": 14.227,
"step": 1058
},
{
"epoch": 2.0,
"eval_exact_match": 23.2,
"eval_f1": 35.56775335775336,
"step": 1058
}
],
"logging_steps": 100,
"max_steps": 26450,
"num_train_epochs": 50,
"save_steps": 500,
"total_flos": 1.7853789925434982e+17,
"trial_name": null,
"trial_params": null
}