File size: 1,377 Bytes
bc841eb a320ff5 bc841eb 9e64091 bc841eb fc2a210 a320ff5 bc841eb fc2a210 a320ff5 fc2a210 a320ff5 fc2a210 a320ff5 fc2a210 a320ff5 fc2a210 bc841eb a320ff5 fc2a210 a320ff5 bc841eb a320ff5 9e64091 a320ff5 bc841eb fc2a210 9e64091 bc841eb a320ff5 bc841eb |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 |
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 0.0014344526845781992,
"eval_steps": 500,
"global_step": 100,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.0,
"learning_rate": 2e-05,
"loss": 0.0,
"step": 1
},
{
"epoch": 0.0,
"learning_rate": 0.00019396926207859084,
"loss": 0.0,
"step": 20
},
{
"epoch": 0.0,
"learning_rate": 0.00015000000000000001,
"loss": 0.0,
"step": 40
},
{
"epoch": 0.0,
"learning_rate": 8.263518223330697e-05,
"loss": 0.0,
"step": 60
},
{
"epoch": 0.0,
"learning_rate": 2.339555568810221e-05,
"loss": 0.0,
"step": 80
},
{
"epoch": 0.0,
"learning_rate": 0.0,
"loss": 0.0,
"step": 100
},
{
"epoch": 0.0,
"step": 100,
"total_flos": 1.768131718545408e+16,
"train_loss": 0.0,
"train_runtime": 501.823,
"train_samples_per_second": 0.399,
"train_steps_per_second": 0.199
}
],
"logging_steps": 20,
"max_steps": 100,
"num_input_tokens_seen": 0,
"num_train_epochs": 1,
"save_steps": 100,
"total_flos": 1.768131718545408e+16,
"train_batch_size": 2,
"trial_name": null,
"trial_params": null
}
|