File size: 2,224 Bytes
68c0706 2cee2d4 50808b6 2cee2d4 68c0706 50808b6 68c0706 525d2ab 68c0706 50808b6 525d2ab 2cee2d4 68c0706 50808b6 2cee2d4 68c0706 525d2ab d7eb129 c537bc2 50808b6 2cee2d4 d7eb129 525d2ab 25946e5 16c8fbd 50808b6 2cee2d4 50808b6 4e8e0bb 2cee2d4 4e8e0bb 2cee2d4 4e8e0bb 2cee2d4 4e8e0bb 2cee2d4 4e8e0bb 2cee2d4 4e8e0bb 2cee2d4 4e8e0bb 2cee2d4 4e8e0bb 68c0706 50808b6 68c0706 50808b6 68c0706 6fc380d 68c0706 2cee2d4 68c0706 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 |
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 0.5,
"eval_steps": 3,
"global_step": 6,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.08333333333333333,
"grad_norm": NaN,
"learning_rate": 0.0,
"loss": 1.4927,
"step": 1
},
{
"epoch": 0.08333333333333333,
"eval_loss": 1.4977792501449585,
"eval_runtime": 0.2209,
"eval_samples_per_second": 13.579,
"eval_steps_per_second": 13.579,
"step": 1
},
{
"epoch": 0.16666666666666666,
"grad_norm": 4.962691783905029,
"learning_rate": 2e-05,
"loss": 1.307,
"step": 2
},
{
"epoch": 0.25,
"grad_norm": 5.919677734375,
"learning_rate": 4e-05,
"loss": 1.5735,
"step": 3
},
{
"epoch": 0.25,
"eval_loss": 1.4450377225875854,
"eval_runtime": 0.2257,
"eval_samples_per_second": 13.291,
"eval_steps_per_second": 13.291,
"step": 3
},
{
"epoch": 0.3333333333333333,
"grad_norm": 4.771228313446045,
"learning_rate": 6e-05,
"loss": 1.2789,
"step": 4
},
{
"epoch": 0.4166666666666667,
"grad_norm": 3.510233163833618,
"learning_rate": 8e-05,
"loss": 1.3015,
"step": 5
},
{
"epoch": 0.5,
"grad_norm": 2.8811535835266113,
"learning_rate": 0.0001,
"loss": 1.0788,
"step": 6
},
{
"epoch": 0.5,
"eval_loss": 0.8092367053031921,
"eval_runtime": 0.2418,
"eval_samples_per_second": 12.405,
"eval_steps_per_second": 12.405,
"step": 6
}
],
"logging_steps": 1,
"max_steps": 10,
"num_input_tokens_seen": 0,
"num_train_epochs": 1,
"save_steps": 3,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": false
},
"attributes": {}
}
},
"total_flos": 1109738548887552.0,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}
|