File size: 1,979 Bytes
4bce82d |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 |
{
"best_metric": 0.8544235229492188,
"best_model_checkpoint": "beto-SDS-long-esp-mchoice/checkpoint-5547",
"epoch": 1.0,
"global_step": 5547,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.09,
"learning_rate": 4.774652965566974e-05,
"loss": 0.7789,
"step": 500
},
{
"epoch": 0.18,
"learning_rate": 4.549305931133946e-05,
"loss": 0.6927,
"step": 1000
},
{
"epoch": 0.27,
"learning_rate": 4.32395889670092e-05,
"loss": 0.6155,
"step": 1500
},
{
"epoch": 0.36,
"learning_rate": 4.0986118622678924e-05,
"loss": 0.6213,
"step": 2000
},
{
"epoch": 0.45,
"learning_rate": 3.873264827834866e-05,
"loss": 0.5896,
"step": 2500
},
{
"epoch": 0.54,
"learning_rate": 3.647917793401839e-05,
"loss": 0.5446,
"step": 3000
},
{
"epoch": 0.63,
"learning_rate": 3.422570758968812e-05,
"loss": 0.5276,
"step": 3500
},
{
"epoch": 0.72,
"learning_rate": 3.197223724535785e-05,
"loss": 0.5183,
"step": 4000
},
{
"epoch": 0.81,
"learning_rate": 2.9718766901027585e-05,
"loss": 0.5084,
"step": 4500
},
{
"epoch": 0.9,
"learning_rate": 2.746529655669732e-05,
"loss": 0.5032,
"step": 5000
},
{
"epoch": 0.99,
"learning_rate": 2.5211826212367046e-05,
"loss": 0.4839,
"step": 5500
},
{
"epoch": 1.0,
"eval_accuracy": 0.8544235229492188,
"eval_loss": 0.4278242290019989,
"eval_runtime": 63.6742,
"eval_samples_per_second": 72.604,
"eval_steps_per_second": 12.109,
"step": 5547
}
],
"max_steps": 11094,
"num_train_epochs": 2,
"total_flos": 4307533300198464.0,
"trial_name": null,
"trial_params": null
}
|