kiranshivaraju's picture
End of training
2c8b233 verified
{
"best_metric": 0.7464788732394366,
"best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned-aug-pcb/checkpoint-15",
"epoch": 3.0,
"eval_steps": 500,
"global_step": 45,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.6666666666666666,
"grad_norm": 3.8551907539367676,
"learning_rate": 4.375e-05,
"loss": 0.5945,
"step": 10
},
{
"epoch": 1.0,
"eval_accuracy": 0.7464788732394366,
"eval_loss": 0.5191543698310852,
"eval_runtime": 3.2613,
"eval_samples_per_second": 65.311,
"eval_steps_per_second": 2.146,
"step": 15
},
{
"epoch": 1.3333333333333333,
"grad_norm": 2.4505937099456787,
"learning_rate": 3.125e-05,
"loss": 0.5456,
"step": 20
},
{
"epoch": 2.0,
"grad_norm": 3.593410015106201,
"learning_rate": 1.8750000000000002e-05,
"loss": 0.5435,
"step": 30
},
{
"epoch": 2.0,
"eval_accuracy": 0.7230046948356808,
"eval_loss": 0.4960363209247589,
"eval_runtime": 2.5999,
"eval_samples_per_second": 81.927,
"eval_steps_per_second": 2.692,
"step": 30
},
{
"epoch": 2.6666666666666665,
"grad_norm": 2.4927446842193604,
"learning_rate": 6.25e-06,
"loss": 0.5187,
"step": 40
},
{
"epoch": 3.0,
"eval_accuracy": 0.7417840375586855,
"eval_loss": 0.48202893137931824,
"eval_runtime": 2.9734,
"eval_samples_per_second": 71.635,
"eval_steps_per_second": 2.354,
"step": 45
},
{
"epoch": 3.0,
"step": 45,
"total_flos": 1.581835139059876e+17,
"train_loss": 0.5431705315907797,
"train_runtime": 137.9694,
"train_samples_per_second": 41.553,
"train_steps_per_second": 0.326
}
],
"logging_steps": 10,
"max_steps": 45,
"num_input_tokens_seen": 0,
"num_train_epochs": 3,
"save_steps": 500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 1.581835139059876e+17,
"train_batch_size": 32,
"trial_name": null,
"trial_params": null
}