b07611031's picture
End of training
0ab2ed6 verified
{
"best_metric": 0.9675324675324676,
"best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned-eurosat/checkpoint-70",
"epoch": 30.0,
"eval_steps": 500,
"global_step": 150,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_accuracy": 0.6298701298701299,
"eval_loss": 0.6615892648696899,
"eval_runtime": 5.9895,
"eval_samples_per_second": 25.712,
"eval_steps_per_second": 0.835,
"step": 5
},
{
"epoch": 2.0,
"grad_norm": 6.212774753570557,
"learning_rate": 3.3333333333333335e-05,
"loss": 0.6583,
"step": 10
},
{
"epoch": 2.0,
"eval_accuracy": 0.7597402597402597,
"eval_loss": 0.5232259631156921,
"eval_runtime": 5.5139,
"eval_samples_per_second": 27.929,
"eval_steps_per_second": 0.907,
"step": 10
},
{
"epoch": 3.0,
"eval_accuracy": 0.7857142857142857,
"eval_loss": 0.5042803287506104,
"eval_runtime": 5.8851,
"eval_samples_per_second": 26.168,
"eval_steps_per_second": 0.85,
"step": 15
},
{
"epoch": 4.0,
"grad_norm": 3.873718738555908,
"learning_rate": 4.814814814814815e-05,
"loss": 0.3346,
"step": 20
},
{
"epoch": 4.0,
"eval_accuracy": 0.8766233766233766,
"eval_loss": 0.287881076335907,
"eval_runtime": 5.8126,
"eval_samples_per_second": 26.494,
"eval_steps_per_second": 0.86,
"step": 20
},
{
"epoch": 5.0,
"eval_accuracy": 0.9090909090909091,
"eval_loss": 0.24241776764392853,
"eval_runtime": 5.8885,
"eval_samples_per_second": 26.152,
"eval_steps_per_second": 0.849,
"step": 25
},
{
"epoch": 6.0,
"grad_norm": 4.3201093673706055,
"learning_rate": 4.4444444444444447e-05,
"loss": 0.1544,
"step": 30
},
{
"epoch": 6.0,
"eval_accuracy": 0.8896103896103896,
"eval_loss": 0.22171010076999664,
"eval_runtime": 5.7903,
"eval_samples_per_second": 26.596,
"eval_steps_per_second": 0.864,
"step": 30
},
{
"epoch": 7.0,
"eval_accuracy": 0.922077922077922,
"eval_loss": 0.14658886194229126,
"eval_runtime": 5.8797,
"eval_samples_per_second": 26.192,
"eval_steps_per_second": 0.85,
"step": 35
},
{
"epoch": 8.0,
"grad_norm": 4.792673587799072,
"learning_rate": 4.074074074074074e-05,
"loss": 0.088,
"step": 40
},
{
"epoch": 8.0,
"eval_accuracy": 0.948051948051948,
"eval_loss": 0.12608817219734192,
"eval_runtime": 5.723,
"eval_samples_per_second": 26.909,
"eval_steps_per_second": 0.874,
"step": 40
},
{
"epoch": 9.0,
"eval_accuracy": 0.922077922077922,
"eval_loss": 0.16798314452171326,
"eval_runtime": 5.7613,
"eval_samples_per_second": 26.73,
"eval_steps_per_second": 0.868,
"step": 45
},
{
"epoch": 10.0,
"grad_norm": 6.038075923919678,
"learning_rate": 3.7037037037037037e-05,
"loss": 0.0977,
"step": 50
},
{
"epoch": 10.0,
"eval_accuracy": 0.935064935064935,
"eval_loss": 0.14464019238948822,
"eval_runtime": 5.8083,
"eval_samples_per_second": 26.514,
"eval_steps_per_second": 0.861,
"step": 50
},
{
"epoch": 11.0,
"eval_accuracy": 0.922077922077922,
"eval_loss": 0.18122775852680206,
"eval_runtime": 6.1597,
"eval_samples_per_second": 25.001,
"eval_steps_per_second": 0.812,
"step": 55
},
{
"epoch": 12.0,
"grad_norm": 4.068108558654785,
"learning_rate": 3.3333333333333335e-05,
"loss": 0.0719,
"step": 60
},
{
"epoch": 12.0,
"eval_accuracy": 0.9285714285714286,
"eval_loss": 0.17976221442222595,
"eval_runtime": 6.0227,
"eval_samples_per_second": 25.57,
"eval_steps_per_second": 0.83,
"step": 60
},
{
"epoch": 13.0,
"eval_accuracy": 0.961038961038961,
"eval_loss": 0.105579674243927,
"eval_runtime": 5.8224,
"eval_samples_per_second": 26.449,
"eval_steps_per_second": 0.859,
"step": 65
},
{
"epoch": 14.0,
"grad_norm": 3.0755834579467773,
"learning_rate": 2.962962962962963e-05,
"loss": 0.0629,
"step": 70
},
{
"epoch": 14.0,
"eval_accuracy": 0.9675324675324676,
"eval_loss": 0.10734522342681885,
"eval_runtime": 5.9253,
"eval_samples_per_second": 25.99,
"eval_steps_per_second": 0.844,
"step": 70
},
{
"epoch": 15.0,
"eval_accuracy": 0.9545454545454546,
"eval_loss": 0.11058878153562546,
"eval_runtime": 5.9322,
"eval_samples_per_second": 25.96,
"eval_steps_per_second": 0.843,
"step": 75
},
{
"epoch": 16.0,
"grad_norm": 1.3675538301467896,
"learning_rate": 2.5925925925925925e-05,
"loss": 0.0414,
"step": 80
},
{
"epoch": 16.0,
"eval_accuracy": 0.9415584415584416,
"eval_loss": 0.12863656878471375,
"eval_runtime": 5.8097,
"eval_samples_per_second": 26.508,
"eval_steps_per_second": 0.861,
"step": 80
},
{
"epoch": 17.0,
"eval_accuracy": 0.961038961038961,
"eval_loss": 0.07608745247125626,
"eval_runtime": 5.9871,
"eval_samples_per_second": 25.722,
"eval_steps_per_second": 0.835,
"step": 85
},
{
"epoch": 18.0,
"grad_norm": 3.8409650325775146,
"learning_rate": 2.2222222222222223e-05,
"loss": 0.0397,
"step": 90
},
{
"epoch": 18.0,
"eval_accuracy": 0.9675324675324676,
"eval_loss": 0.07851818948984146,
"eval_runtime": 5.9494,
"eval_samples_per_second": 25.885,
"eval_steps_per_second": 0.84,
"step": 90
},
{
"epoch": 19.0,
"eval_accuracy": 0.9675324675324676,
"eval_loss": 0.07459615916013718,
"eval_runtime": 5.5847,
"eval_samples_per_second": 27.575,
"eval_steps_per_second": 0.895,
"step": 95
},
{
"epoch": 20.0,
"grad_norm": 40.9788932800293,
"learning_rate": 1.8518518518518518e-05,
"loss": 0.0487,
"step": 100
},
{
"epoch": 20.0,
"eval_accuracy": 0.9675324675324676,
"eval_loss": 0.06842251867055893,
"eval_runtime": 5.7506,
"eval_samples_per_second": 26.78,
"eval_steps_per_second": 0.869,
"step": 100
},
{
"epoch": 21.0,
"eval_accuracy": 0.961038961038961,
"eval_loss": 0.06015988811850548,
"eval_runtime": 5.6354,
"eval_samples_per_second": 27.327,
"eval_steps_per_second": 0.887,
"step": 105
},
{
"epoch": 22.0,
"grad_norm": 0.32140201330184937,
"learning_rate": 1.4814814814814815e-05,
"loss": 0.0244,
"step": 110
},
{
"epoch": 22.0,
"eval_accuracy": 0.9675324675324676,
"eval_loss": 0.055138688534498215,
"eval_runtime": 5.6318,
"eval_samples_per_second": 27.344,
"eval_steps_per_second": 0.888,
"step": 110
},
{
"epoch": 23.0,
"eval_accuracy": 0.9675324675324676,
"eval_loss": 0.06390709429979324,
"eval_runtime": 5.9133,
"eval_samples_per_second": 26.043,
"eval_steps_per_second": 0.846,
"step": 115
},
{
"epoch": 24.0,
"grad_norm": 0.17090357840061188,
"learning_rate": 1.1111111111111112e-05,
"loss": 0.0214,
"step": 120
},
{
"epoch": 24.0,
"eval_accuracy": 0.9675324675324676,
"eval_loss": 0.05834332853555679,
"eval_runtime": 5.6237,
"eval_samples_per_second": 27.384,
"eval_steps_per_second": 0.889,
"step": 120
},
{
"epoch": 25.0,
"eval_accuracy": 0.9675324675324676,
"eval_loss": 0.06634216755628586,
"eval_runtime": 5.782,
"eval_samples_per_second": 26.634,
"eval_steps_per_second": 0.865,
"step": 125
},
{
"epoch": 26.0,
"grad_norm": 15.199660301208496,
"learning_rate": 7.4074074074074075e-06,
"loss": 0.0261,
"step": 130
},
{
"epoch": 26.0,
"eval_accuracy": 0.961038961038961,
"eval_loss": 0.10064199566841125,
"eval_runtime": 5.8966,
"eval_samples_per_second": 26.117,
"eval_steps_per_second": 0.848,
"step": 130
},
{
"epoch": 27.0,
"eval_accuracy": 0.9675324675324676,
"eval_loss": 0.07111012190580368,
"eval_runtime": 5.7198,
"eval_samples_per_second": 26.924,
"eval_steps_per_second": 0.874,
"step": 135
},
{
"epoch": 28.0,
"grad_norm": 0.7294249534606934,
"learning_rate": 3.7037037037037037e-06,
"loss": 0.019,
"step": 140
},
{
"epoch": 28.0,
"eval_accuracy": 0.9675324675324676,
"eval_loss": 0.06293747574090958,
"eval_runtime": 6.017,
"eval_samples_per_second": 25.594,
"eval_steps_per_second": 0.831,
"step": 140
},
{
"epoch": 29.0,
"eval_accuracy": 0.961038961038961,
"eval_loss": 0.07278253883123398,
"eval_runtime": 5.5819,
"eval_samples_per_second": 27.589,
"eval_steps_per_second": 0.896,
"step": 145
},
{
"epoch": 30.0,
"grad_norm": 0.9749196171760559,
"learning_rate": 0.0,
"loss": 0.0237,
"step": 150
},
{
"epoch": 30.0,
"eval_accuracy": 0.961038961038961,
"eval_loss": 0.07468711584806442,
"eval_runtime": 5.8121,
"eval_samples_per_second": 26.496,
"eval_steps_per_second": 0.86,
"step": 150
},
{
"epoch": 30.0,
"step": 150,
"total_flos": 4.548645984411648e+17,
"train_loss": 0.11414109120766322,
"train_runtime": 869.5797,
"train_samples_per_second": 21.045,
"train_steps_per_second": 0.172
}
],
"logging_steps": 10,
"max_steps": 150,
"num_input_tokens_seen": 0,
"num_train_epochs": 30,
"save_steps": 500,
"total_flos": 4.548645984411648e+17,
"train_batch_size": 32,
"trial_name": null,
"trial_params": null
}