File size: 1,316 Bytes
2da217f e4aa0ab 6e1cd2e 2da217f e4aa0ab 6e1cd2e fc88da5 2da217f 6e1cd2e fc88da5 2da217f 6e1cd2e fc88da5 2da217f 153c95c 6e1cd2e fc88da5 2da217f 153c95c 6e1cd2e fc88da5 2da217f 6e1cd2e fc88da5 0cb8366 2da217f e4aa0ab 6e1cd2e 2da217f 6e1cd2e e4aa0ab 6e1cd2e 2da217f |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 |
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 1.0,
"global_step": 339,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.15,
"learning_rate": 4.262536873156342e-05,
"loss": 0.0544,
"step": 50
},
{
"epoch": 0.29,
"learning_rate": 3.5250737463126844e-05,
"loss": 0.0046,
"step": 100
},
{
"epoch": 0.44,
"learning_rate": 2.7876106194690264e-05,
"loss": 0.0017,
"step": 150
},
{
"epoch": 0.59,
"learning_rate": 2.0501474926253688e-05,
"loss": 0.0008,
"step": 200
},
{
"epoch": 0.74,
"learning_rate": 1.3126843657817109e-05,
"loss": 0.0003,
"step": 250
},
{
"epoch": 0.88,
"learning_rate": 5.752212389380531e-06,
"loss": 0.0005,
"step": 300
},
{
"epoch": 1.0,
"step": 339,
"total_flos": 2741653307243520.0,
"train_loss": 0.009268463998593412,
"train_runtime": 186.2906,
"train_samples_per_second": 116.34,
"train_steps_per_second": 1.82
}
],
"max_steps": 339,
"num_train_epochs": 1,
"total_flos": 2741653307243520.0,
"trial_name": null,
"trial_params": null
}
|