File size: 1,573 Bytes
afb21a1 54dca21 afb21a1 54dca21 afb21a1 86f875a 54dca21 afb21a1 86f875a 54dca21 afb21a1 86f875a 54dca21 afb21a1 86f875a 54dca21 afb21a1 86f875a 54dca21 a8ad4d2 86f875a 54dca21 a8ad4d2 86f875a 54dca21 a8ad4d2 86f875a 54dca21 a8ad4d2 54dca21 a8ad4d2 54dca21 afb21a1 54dca21 f16bf60 54dca21 afb21a1 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 |
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 0.9005276529216337,
"eval_steps": 500,
"global_step": 9,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.1,
"learning_rate": 0.001,
"loss": 2.3313,
"step": 1
},
{
"epoch": 0.2,
"learning_rate": 0.001,
"loss": 3.851,
"step": 2
},
{
"epoch": 0.3,
"learning_rate": 0.001,
"loss": 3.2287,
"step": 3
},
{
"epoch": 0.4,
"learning_rate": 0.001,
"loss": 2.7855,
"step": 4
},
{
"epoch": 0.5,
"learning_rate": 0.001,
"loss": 2.6085,
"step": 5
},
{
"epoch": 0.6,
"learning_rate": 0.001,
"loss": 2.4226,
"step": 6
},
{
"epoch": 0.7,
"learning_rate": 0.001,
"loss": 2.3728,
"step": 7
},
{
"epoch": 0.8,
"learning_rate": 0.001,
"loss": 2.3366,
"step": 8
},
{
"epoch": 0.9,
"learning_rate": 0.001,
"loss": 2.2684,
"step": 9
},
{
"epoch": 0.9,
"step": 9,
"total_flos": 9440754728435712.0,
"train_loss": 2.689473125669691,
"train_runtime": 118.9327,
"train_samples_per_second": 43.024,
"train_steps_per_second": 0.076
}
],
"logging_steps": 1.0,
"max_steps": 9,
"num_train_epochs": 1,
"save_steps": -9,
"total_flos": 9440754728435712.0,
"trial_name": null,
"trial_params": null
}
|