table_qa_1 / last-checkpoint /trainer_state.json
daydrill's picture
Training in progress, step 20000
31cd801
raw
history blame
1.99 kB
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 0.6515506906437321,
"global_step": 20000,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.16,
"learning_rate": 2.8373729476153247e-05,
"loss": 1.6126,
"step": 5000
},
{
"epoch": 0.16,
"eval_exact_match": 68.15336463223787,
"eval_f1": 73.98256617857639,
"eval_loss": 1.189887523651123,
"eval_runtime": 1542.7266,
"eval_samples_per_second": 7.463,
"eval_steps_per_second": 3.732,
"step": 5000
},
{
"epoch": 0.33,
"learning_rate": 2.674550430023456e-05,
"loss": 1.1965,
"step": 10000
},
{
"epoch": 0.33,
"eval_exact_match": 75.13475917231786,
"eval_f1": 79.95184555682803,
"eval_loss": 0.9056070446968079,
"eval_runtime": 1533.9546,
"eval_samples_per_second": 7.505,
"eval_steps_per_second": 3.753,
"step": 10000
},
{
"epoch": 0.49,
"learning_rate": 2.511695334897055e-05,
"loss": 1.0769,
"step": 15000
},
{
"epoch": 0.49,
"eval_exact_match": 77.56042427403929,
"eval_f1": 82.22503770504048,
"eval_loss": 0.9495312571525574,
"eval_runtime": 1533.818,
"eval_samples_per_second": 7.506,
"eval_steps_per_second": 3.753,
"step": 15000
},
{
"epoch": 0.65,
"learning_rate": 2.3488728173051864e-05,
"loss": 0.9992,
"step": 20000
},
{
"epoch": 0.65,
"eval_exact_match": 81.09024517475221,
"eval_f1": 85.49992934663945,
"eval_loss": 0.8323877453804016,
"eval_runtime": 1541.3611,
"eval_samples_per_second": 7.469,
"eval_steps_per_second": 3.735,
"step": 20000
}
],
"max_steps": 92088,
"num_train_epochs": 3,
"total_flos": 4.412940582912e+16,
"trial_name": null,
"trial_params": null
}