File size: 1,860 Bytes
51ebc81 9713d73 51ebc81 9713d73 51ebc81 9713d73 51ebc81 9713d73 51ebc81 9713d73 51ebc81 9713d73 51ebc81 9713d73 51ebc81 9713d73 51ebc81 9713d73 51ebc81 9713d73 51ebc81 9713d73 51ebc81 9713d73 51ebc81 9713d73 51ebc81 9713d73 51ebc81 9713d73 51ebc81 9713d73 51ebc81 9713d73 51ebc81 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 |
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 2.0,
"eval_steps": 500,
"global_step": 683,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.29,
"learning_rate": 0.0001,
"loss": 1.4842,
"step": 100
},
{
"epoch": 0.59,
"learning_rate": 0.0001,
"loss": 1.4016,
"step": 200
},
{
"epoch": 0.88,
"learning_rate": 0.0001,
"loss": 1.3892,
"step": 300
},
{
"epoch": 1.0,
"eval_accuracy": 0.4543589743589744,
"eval_loss": 3.4055869579315186,
"eval_runtime": 4.1688,
"eval_samples_per_second": 119.938,
"eval_steps_per_second": 15.112,
"step": 341
},
{
"epoch": 1.0,
"eval_bleu": 0.09711501224106496,
"eval_exact_match": 0.0,
"eval_prefix_exact_match": 0.054,
"step": 341
},
{
"epoch": 1.17,
"learning_rate": 0.0001,
"loss": 1.3608,
"step": 400
},
{
"epoch": 1.46,
"learning_rate": 0.0001,
"loss": 1.3456,
"step": 500
},
{
"epoch": 1.76,
"learning_rate": 0.0001,
"loss": 1.3499,
"step": 600
},
{
"epoch": 2.0,
"eval_accuracy": 0.4576923076923077,
"eval_loss": 3.453113317489624,
"eval_runtime": 4.4031,
"eval_samples_per_second": 113.556,
"eval_steps_per_second": 14.308,
"step": 683
},
{
"epoch": 2.0,
"eval_bleu": 0.1225593574040313,
"eval_exact_match": 0.0,
"eval_prefix_exact_match": 0.056,
"step": 683
}
],
"logging_steps": 100,
"max_steps": 17050,
"num_train_epochs": 50,
"save_steps": 500,
"total_flos": 1.3526659229967974e+17,
"trial_name": null,
"trial_params": null
}
|