SiddharthaM's picture
End of training
6047fac
{
"best_metric": 0.9178082191780822,
"best_model_checkpoint": "beit-base-patch16-224-pt22k-ft22k-rim_one-new/checkpoint-2",
"epoch": 29.727272727272727,
"global_step": 60,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.73,
"eval_accuracy": 0.9178082191780822,
"eval_loss": 0.24113720655441284,
"eval_runtime": 4.0491,
"eval_samples_per_second": 36.057,
"eval_steps_per_second": 1.235,
"step": 2
},
{
"epoch": 1.73,
"eval_accuracy": 0.8972602739726028,
"eval_loss": 0.21820734441280365,
"eval_runtime": 4.3715,
"eval_samples_per_second": 33.398,
"eval_steps_per_second": 1.144,
"step": 4
},
{
"epoch": 2.73,
"eval_accuracy": 0.8972602739726028,
"eval_loss": 0.3085276186466217,
"eval_runtime": 4.3762,
"eval_samples_per_second": 33.362,
"eval_steps_per_second": 1.143,
"step": 6
},
{
"epoch": 3.73,
"eval_accuracy": 0.8972602739726028,
"eval_loss": 0.27944016456604004,
"eval_runtime": 4.3106,
"eval_samples_per_second": 33.87,
"eval_steps_per_second": 1.16,
"step": 8
},
{
"epoch": 4.73,
"learning_rate": 4.62962962962963e-05,
"loss": 0.1392,
"step": 10
},
{
"epoch": 4.73,
"eval_accuracy": 0.910958904109589,
"eval_loss": 0.23977190256118774,
"eval_runtime": 4.3753,
"eval_samples_per_second": 33.369,
"eval_steps_per_second": 1.143,
"step": 10
},
{
"epoch": 5.73,
"eval_accuracy": 0.8972602739726028,
"eval_loss": 0.29249313473701477,
"eval_runtime": 4.3239,
"eval_samples_per_second": 33.766,
"eval_steps_per_second": 1.156,
"step": 12
},
{
"epoch": 6.73,
"eval_accuracy": 0.910958904109589,
"eval_loss": 0.2797797918319702,
"eval_runtime": 4.3315,
"eval_samples_per_second": 33.707,
"eval_steps_per_second": 1.154,
"step": 14
},
{
"epoch": 7.73,
"eval_accuracy": 0.9178082191780822,
"eval_loss": 0.21835216879844666,
"eval_runtime": 4.3475,
"eval_samples_per_second": 33.582,
"eval_steps_per_second": 1.15,
"step": 16
},
{
"epoch": 8.73,
"eval_accuracy": 0.910958904109589,
"eval_loss": 0.30065301060676575,
"eval_runtime": 4.3333,
"eval_samples_per_second": 33.693,
"eval_steps_per_second": 1.154,
"step": 18
},
{
"epoch": 9.73,
"learning_rate": 3.7037037037037037e-05,
"loss": 0.0416,
"step": 20
},
{
"epoch": 9.73,
"eval_accuracy": 0.9041095890410958,
"eval_loss": 0.3344126045703888,
"eval_runtime": 4.366,
"eval_samples_per_second": 33.44,
"eval_steps_per_second": 1.145,
"step": 20
},
{
"epoch": 10.73,
"eval_accuracy": 0.910958904109589,
"eval_loss": 0.36264100670814514,
"eval_runtime": 4.3578,
"eval_samples_per_second": 33.503,
"eval_steps_per_second": 1.147,
"step": 22
},
{
"epoch": 11.73,
"eval_accuracy": 0.8904109589041096,
"eval_loss": 0.48421263694763184,
"eval_runtime": 4.3873,
"eval_samples_per_second": 33.278,
"eval_steps_per_second": 1.14,
"step": 24
},
{
"epoch": 12.73,
"eval_accuracy": 0.8972602739726028,
"eval_loss": 0.36641207337379456,
"eval_runtime": 4.1126,
"eval_samples_per_second": 35.5,
"eval_steps_per_second": 1.216,
"step": 26
},
{
"epoch": 13.73,
"eval_accuracy": 0.910958904109589,
"eval_loss": 0.3457633852958679,
"eval_runtime": 4.131,
"eval_samples_per_second": 35.342,
"eval_steps_per_second": 1.21,
"step": 28
},
{
"epoch": 14.73,
"learning_rate": 2.777777777777778e-05,
"loss": 0.0263,
"step": 30
},
{
"epoch": 14.73,
"eval_accuracy": 0.910958904109589,
"eval_loss": 0.28100982308387756,
"eval_runtime": 4.0812,
"eval_samples_per_second": 35.773,
"eval_steps_per_second": 1.225,
"step": 30
},
{
"epoch": 15.73,
"eval_accuracy": 0.8698630136986302,
"eval_loss": 0.4695476293563843,
"eval_runtime": 4.0905,
"eval_samples_per_second": 35.692,
"eval_steps_per_second": 1.222,
"step": 32
},
{
"epoch": 16.73,
"eval_accuracy": 0.9041095890410958,
"eval_loss": 0.3723364770412445,
"eval_runtime": 4.1081,
"eval_samples_per_second": 35.539,
"eval_steps_per_second": 1.217,
"step": 34
},
{
"epoch": 17.73,
"eval_accuracy": 0.9041095890410958,
"eval_loss": 0.34467366337776184,
"eval_runtime": 4.1554,
"eval_samples_per_second": 35.135,
"eval_steps_per_second": 1.203,
"step": 36
},
{
"epoch": 18.73,
"eval_accuracy": 0.8904109589041096,
"eval_loss": 0.37077629566192627,
"eval_runtime": 4.0887,
"eval_samples_per_second": 35.708,
"eval_steps_per_second": 1.223,
"step": 38
},
{
"epoch": 19.73,
"learning_rate": 1.8518518518518518e-05,
"loss": 0.0264,
"step": 40
},
{
"epoch": 19.73,
"eval_accuracy": 0.910958904109589,
"eval_loss": 0.4051611125469208,
"eval_runtime": 4.1078,
"eval_samples_per_second": 35.542,
"eval_steps_per_second": 1.217,
"step": 40
},
{
"epoch": 20.73,
"eval_accuracy": 0.9041095890410958,
"eval_loss": 0.44917088747024536,
"eval_runtime": 4.0898,
"eval_samples_per_second": 35.699,
"eval_steps_per_second": 1.223,
"step": 42
},
{
"epoch": 21.73,
"eval_accuracy": 0.8904109589041096,
"eval_loss": 0.4648548662662506,
"eval_runtime": 4.151,
"eval_samples_per_second": 35.173,
"eval_steps_per_second": 1.205,
"step": 44
},
{
"epoch": 22.73,
"eval_accuracy": 0.9178082191780822,
"eval_loss": 0.4061222970485687,
"eval_runtime": 4.1096,
"eval_samples_per_second": 35.527,
"eval_steps_per_second": 1.217,
"step": 46
},
{
"epoch": 23.73,
"eval_accuracy": 0.910958904109589,
"eval_loss": 0.4136480391025543,
"eval_runtime": 4.0895,
"eval_samples_per_second": 35.701,
"eval_steps_per_second": 1.223,
"step": 48
},
{
"epoch": 24.73,
"learning_rate": 9.259259259259259e-06,
"loss": 0.0139,
"step": 50
},
{
"epoch": 24.73,
"eval_accuracy": 0.8972602739726028,
"eval_loss": 0.41833144426345825,
"eval_runtime": 4.0666,
"eval_samples_per_second": 35.903,
"eval_steps_per_second": 1.23,
"step": 50
},
{
"epoch": 25.73,
"eval_accuracy": 0.8904109589041096,
"eval_loss": 0.4503590762615204,
"eval_runtime": 4.105,
"eval_samples_per_second": 35.567,
"eval_steps_per_second": 1.218,
"step": 52
},
{
"epoch": 26.73,
"eval_accuracy": 0.8972602739726028,
"eval_loss": 0.43678611516952515,
"eval_runtime": 4.1124,
"eval_samples_per_second": 35.503,
"eval_steps_per_second": 1.216,
"step": 54
},
{
"epoch": 27.73,
"eval_accuracy": 0.910958904109589,
"eval_loss": 0.4710823893547058,
"eval_runtime": 4.126,
"eval_samples_per_second": 35.385,
"eval_steps_per_second": 1.212,
"step": 56
},
{
"epoch": 28.73,
"eval_accuracy": 0.910958904109589,
"eval_loss": 0.39282917976379395,
"eval_runtime": 4.1214,
"eval_samples_per_second": 35.425,
"eval_steps_per_second": 1.213,
"step": 58
},
{
"epoch": 29.73,
"learning_rate": 0.0,
"loss": 0.005,
"step": 60
},
{
"epoch": 29.73,
"eval_accuracy": 0.8767123287671232,
"eval_loss": 0.45500674843788147,
"eval_runtime": 4.1417,
"eval_samples_per_second": 35.251,
"eval_steps_per_second": 1.207,
"step": 60
},
{
"epoch": 29.73,
"step": 60,
"total_flos": 7.813276079484396e+17,
"train_loss": 0.042075487226247786,
"train_runtime": 801.9686,
"train_samples_per_second": 12.681,
"train_steps_per_second": 0.075
}
],
"max_steps": 60,
"num_train_epochs": 30,
"total_flos": 7.813276079484396e+17,
"trial_name": null,
"trial_params": null
}