Prachetas's picture
End of training
c5621a3
{
"best_metric": 0.7989690721649485,
"best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned-eurosat/checkpoint-56",
"epoch": 14.4,
"global_step": 90,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.96,
"eval_accuracy": 0.6701030927835051,
"eval_loss": 1.1081335544586182,
"eval_runtime": 3.5046,
"eval_samples_per_second": 55.356,
"eval_steps_per_second": 1.997,
"step": 6
},
{
"epoch": 1.6,
"learning_rate": 0.0009876543209876543,
"loss": 0.6578,
"step": 10
},
{
"epoch": 1.92,
"eval_accuracy": 0.6701030927835051,
"eval_loss": 0.7938751578330994,
"eval_runtime": 4.9264,
"eval_samples_per_second": 39.379,
"eval_steps_per_second": 1.421,
"step": 12
},
{
"epoch": 2.88,
"eval_accuracy": 0.7783505154639175,
"eval_loss": 0.7289248704910278,
"eval_runtime": 4.0288,
"eval_samples_per_second": 48.153,
"eval_steps_per_second": 1.737,
"step": 18
},
{
"epoch": 3.2,
"learning_rate": 0.0008641975308641975,
"loss": 0.8064,
"step": 20
},
{
"epoch": 4.0,
"eval_accuracy": 0.6804123711340206,
"eval_loss": 0.7616495490074158,
"eval_runtime": 3.5168,
"eval_samples_per_second": 55.164,
"eval_steps_per_second": 1.99,
"step": 25
},
{
"epoch": 4.8,
"learning_rate": 0.0007407407407407407,
"loss": 0.7259,
"step": 30
},
{
"epoch": 4.96,
"eval_accuracy": 0.7319587628865979,
"eval_loss": 0.627986490726471,
"eval_runtime": 3.5355,
"eval_samples_per_second": 54.872,
"eval_steps_per_second": 1.98,
"step": 31
},
{
"epoch": 5.92,
"eval_accuracy": 0.7474226804123711,
"eval_loss": 0.6325005888938904,
"eval_runtime": 4.6009,
"eval_samples_per_second": 42.166,
"eval_steps_per_second": 1.521,
"step": 37
},
{
"epoch": 6.4,
"learning_rate": 0.0006172839506172839,
"loss": 0.6316,
"step": 40
},
{
"epoch": 6.88,
"eval_accuracy": 0.7319587628865979,
"eval_loss": 0.6799241900444031,
"eval_runtime": 4.5386,
"eval_samples_per_second": 42.745,
"eval_steps_per_second": 1.542,
"step": 43
},
{
"epoch": 8.0,
"learning_rate": 0.0004938271604938272,
"loss": 0.607,
"step": 50
},
{
"epoch": 8.0,
"eval_accuracy": 0.788659793814433,
"eval_loss": 0.7443605661392212,
"eval_runtime": 3.543,
"eval_samples_per_second": 54.756,
"eval_steps_per_second": 1.976,
"step": 50
},
{
"epoch": 8.96,
"eval_accuracy": 0.7989690721649485,
"eval_loss": 0.6149767637252808,
"eval_runtime": 3.5088,
"eval_samples_per_second": 55.29,
"eval_steps_per_second": 1.995,
"step": 56
},
{
"epoch": 9.6,
"learning_rate": 0.00037037037037037035,
"loss": 0.5268,
"step": 60
},
{
"epoch": 9.92,
"eval_accuracy": 0.7577319587628866,
"eval_loss": 0.5972550511360168,
"eval_runtime": 4.7222,
"eval_samples_per_second": 41.082,
"eval_steps_per_second": 1.482,
"step": 62
},
{
"epoch": 10.88,
"eval_accuracy": 0.7731958762886598,
"eval_loss": 0.7381436824798584,
"eval_runtime": 4.4998,
"eval_samples_per_second": 43.113,
"eval_steps_per_second": 1.556,
"step": 68
},
{
"epoch": 11.2,
"learning_rate": 0.0002469135802469136,
"loss": 0.4797,
"step": 70
},
{
"epoch": 12.0,
"eval_accuracy": 0.7731958762886598,
"eval_loss": 0.6777181625366211,
"eval_runtime": 3.5325,
"eval_samples_per_second": 54.919,
"eval_steps_per_second": 1.982,
"step": 75
},
{
"epoch": 12.8,
"learning_rate": 0.0001234567901234568,
"loss": 0.4618,
"step": 80
},
{
"epoch": 12.96,
"eval_accuracy": 0.788659793814433,
"eval_loss": 0.6430295705795288,
"eval_runtime": 3.4979,
"eval_samples_per_second": 55.462,
"eval_steps_per_second": 2.001,
"step": 81
},
{
"epoch": 13.92,
"eval_accuracy": 0.7783505154639175,
"eval_loss": 0.6716616749763489,
"eval_runtime": 4.7354,
"eval_samples_per_second": 40.968,
"eval_steps_per_second": 1.478,
"step": 87
},
{
"epoch": 14.4,
"learning_rate": 0.0,
"loss": 0.3618,
"step": 90
},
{
"epoch": 14.4,
"eval_accuracy": 0.7938144329896907,
"eval_loss": 0.6744318008422852,
"eval_runtime": 3.5202,
"eval_samples_per_second": 55.111,
"eval_steps_per_second": 1.989,
"step": 90
},
{
"epoch": 14.4,
"step": 90,
"total_flos": 2.7800491620335616e+17,
"train_loss": 0.5843003829320271,
"train_runtime": 517.5663,
"train_samples_per_second": 22.49,
"train_steps_per_second": 0.174
}
],
"max_steps": 90,
"num_train_epochs": 15,
"total_flos": 2.7800491620335616e+17,
"trial_name": null,
"trial_params": null
}