ntnxx2's picture
End of training
275bf7a
{
"best_metric": 0.5625,
"best_model_checkpoint": "vit-base-patch16-224-finetuned-Visual-Emotional/checkpoint-132",
"epoch": 27.82608695652174,
"eval_steps": 500,
"global_step": 160,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.87,
"eval_accuracy": 0.15,
"eval_loss": 2.141930341720581,
"eval_runtime": 1.0932,
"eval_samples_per_second": 73.177,
"eval_steps_per_second": 2.744,
"step": 5
},
{
"epoch": 1.74,
"learning_rate": 3.125e-05,
"loss": 2.1722,
"step": 10
},
{
"epoch": 1.91,
"eval_accuracy": 0.1625,
"eval_loss": 2.038079023361206,
"eval_runtime": 1.0792,
"eval_samples_per_second": 74.126,
"eval_steps_per_second": 2.78,
"step": 11
},
{
"epoch": 2.96,
"eval_accuracy": 0.3,
"eval_loss": 1.8728723526000977,
"eval_runtime": 1.0061,
"eval_samples_per_second": 79.518,
"eval_steps_per_second": 2.982,
"step": 17
},
{
"epoch": 3.48,
"learning_rate": 4.8611111111111115e-05,
"loss": 1.8696,
"step": 20
},
{
"epoch": 4.0,
"eval_accuracy": 0.3625,
"eval_loss": 1.6683166027069092,
"eval_runtime": 1.0334,
"eval_samples_per_second": 77.411,
"eval_steps_per_second": 2.903,
"step": 23
},
{
"epoch": 4.87,
"eval_accuracy": 0.4,
"eval_loss": 1.5172284841537476,
"eval_runtime": 1.0518,
"eval_samples_per_second": 76.061,
"eval_steps_per_second": 2.852,
"step": 28
},
{
"epoch": 5.22,
"learning_rate": 4.5138888888888894e-05,
"loss": 1.4531,
"step": 30
},
{
"epoch": 5.91,
"eval_accuracy": 0.4625,
"eval_loss": 1.3959767818450928,
"eval_runtime": 1.1351,
"eval_samples_per_second": 70.478,
"eval_steps_per_second": 2.643,
"step": 34
},
{
"epoch": 6.96,
"learning_rate": 4.166666666666667e-05,
"loss": 1.1483,
"step": 40
},
{
"epoch": 6.96,
"eval_accuracy": 0.45,
"eval_loss": 1.378754734992981,
"eval_runtime": 1.1386,
"eval_samples_per_second": 70.26,
"eval_steps_per_second": 2.635,
"step": 40
},
{
"epoch": 8.0,
"eval_accuracy": 0.5125,
"eval_loss": 1.318593144416809,
"eval_runtime": 1.0875,
"eval_samples_per_second": 73.565,
"eval_steps_per_second": 2.759,
"step": 46
},
{
"epoch": 8.7,
"learning_rate": 3.8194444444444444e-05,
"loss": 0.955,
"step": 50
},
{
"epoch": 8.87,
"eval_accuracy": 0.475,
"eval_loss": 1.2741286754608154,
"eval_runtime": 1.0684,
"eval_samples_per_second": 74.879,
"eval_steps_per_second": 2.808,
"step": 51
},
{
"epoch": 9.91,
"eval_accuracy": 0.5,
"eval_loss": 1.2990485429763794,
"eval_runtime": 1.0705,
"eval_samples_per_second": 74.731,
"eval_steps_per_second": 2.802,
"step": 57
},
{
"epoch": 10.43,
"learning_rate": 3.472222222222222e-05,
"loss": 0.7894,
"step": 60
},
{
"epoch": 10.96,
"eval_accuracy": 0.475,
"eval_loss": 1.246220588684082,
"eval_runtime": 1.0689,
"eval_samples_per_second": 74.845,
"eval_steps_per_second": 2.807,
"step": 63
},
{
"epoch": 12.0,
"eval_accuracy": 0.5375,
"eval_loss": 1.308982491493225,
"eval_runtime": 1.1406,
"eval_samples_per_second": 70.141,
"eval_steps_per_second": 2.63,
"step": 69
},
{
"epoch": 12.17,
"learning_rate": 3.125e-05,
"loss": 0.6769,
"step": 70
},
{
"epoch": 12.87,
"eval_accuracy": 0.5125,
"eval_loss": 1.2809442281723022,
"eval_runtime": 1.0624,
"eval_samples_per_second": 75.301,
"eval_steps_per_second": 2.824,
"step": 74
},
{
"epoch": 13.91,
"learning_rate": 2.777777777777778e-05,
"loss": 0.5958,
"step": 80
},
{
"epoch": 13.91,
"eval_accuracy": 0.525,
"eval_loss": 1.30197274684906,
"eval_runtime": 1.0687,
"eval_samples_per_second": 74.857,
"eval_steps_per_second": 2.807,
"step": 80
},
{
"epoch": 14.96,
"eval_accuracy": 0.5,
"eval_loss": 1.3032042980194092,
"eval_runtime": 1.1451,
"eval_samples_per_second": 69.863,
"eval_steps_per_second": 2.62,
"step": 86
},
{
"epoch": 15.65,
"learning_rate": 2.4305555555555558e-05,
"loss": 0.5179,
"step": 90
},
{
"epoch": 16.0,
"eval_accuracy": 0.5375,
"eval_loss": 1.2624261379241943,
"eval_runtime": 1.0678,
"eval_samples_per_second": 74.923,
"eval_steps_per_second": 2.81,
"step": 92
},
{
"epoch": 16.87,
"eval_accuracy": 0.525,
"eval_loss": 1.2776085138320923,
"eval_runtime": 1.0697,
"eval_samples_per_second": 74.787,
"eval_steps_per_second": 2.805,
"step": 97
},
{
"epoch": 17.39,
"learning_rate": 2.0833333333333336e-05,
"loss": 0.4808,
"step": 100
},
{
"epoch": 17.91,
"eval_accuracy": 0.525,
"eval_loss": 1.2705215215682983,
"eval_runtime": 1.0793,
"eval_samples_per_second": 74.121,
"eval_steps_per_second": 2.78,
"step": 103
},
{
"epoch": 18.96,
"eval_accuracy": 0.5125,
"eval_loss": 1.2791962623596191,
"eval_runtime": 1.1606,
"eval_samples_per_second": 68.927,
"eval_steps_per_second": 2.585,
"step": 109
},
{
"epoch": 19.13,
"learning_rate": 1.736111111111111e-05,
"loss": 0.4025,
"step": 110
},
{
"epoch": 20.0,
"eval_accuracy": 0.5375,
"eval_loss": 1.2922601699829102,
"eval_runtime": 1.0786,
"eval_samples_per_second": 74.168,
"eval_steps_per_second": 2.781,
"step": 115
},
{
"epoch": 20.87,
"learning_rate": 1.388888888888889e-05,
"loss": 0.3908,
"step": 120
},
{
"epoch": 20.87,
"eval_accuracy": 0.525,
"eval_loss": 1.3156249523162842,
"eval_runtime": 1.0785,
"eval_samples_per_second": 74.178,
"eval_steps_per_second": 2.782,
"step": 120
},
{
"epoch": 21.91,
"eval_accuracy": 0.5375,
"eval_loss": 1.3289515972137451,
"eval_runtime": 1.067,
"eval_samples_per_second": 74.979,
"eval_steps_per_second": 2.812,
"step": 126
},
{
"epoch": 22.61,
"learning_rate": 1.0416666666666668e-05,
"loss": 0.3384,
"step": 130
},
{
"epoch": 22.96,
"eval_accuracy": 0.5625,
"eval_loss": 1.314065933227539,
"eval_runtime": 1.0756,
"eval_samples_per_second": 74.377,
"eval_steps_per_second": 2.789,
"step": 132
},
{
"epoch": 24.0,
"eval_accuracy": 0.55,
"eval_loss": 1.3252638578414917,
"eval_runtime": 1.0776,
"eval_samples_per_second": 74.236,
"eval_steps_per_second": 2.784,
"step": 138
},
{
"epoch": 24.35,
"learning_rate": 6.944444444444445e-06,
"loss": 0.3428,
"step": 140
},
{
"epoch": 24.87,
"eval_accuracy": 0.5375,
"eval_loss": 1.350243330001831,
"eval_runtime": 1.1571,
"eval_samples_per_second": 69.139,
"eval_steps_per_second": 2.593,
"step": 143
},
{
"epoch": 25.91,
"eval_accuracy": 0.525,
"eval_loss": 1.349756121635437,
"eval_runtime": 1.0754,
"eval_samples_per_second": 74.39,
"eval_steps_per_second": 2.79,
"step": 149
},
{
"epoch": 26.09,
"learning_rate": 3.4722222222222224e-06,
"loss": 0.3236,
"step": 150
},
{
"epoch": 26.96,
"eval_accuracy": 0.525,
"eval_loss": 1.3449714183807373,
"eval_runtime": 1.0921,
"eval_samples_per_second": 73.256,
"eval_steps_per_second": 2.747,
"step": 155
},
{
"epoch": 27.83,
"learning_rate": 0.0,
"loss": 0.2951,
"step": 160
},
{
"epoch": 27.83,
"eval_accuracy": 0.5375,
"eval_loss": 1.3424607515335083,
"eval_runtime": 1.0784,
"eval_samples_per_second": 74.181,
"eval_steps_per_second": 2.782,
"step": 160
},
{
"epoch": 27.83,
"step": 160,
"total_flos": 1.5536429521628037e+18,
"train_loss": 0.7970057874917984,
"train_runtime": 905.2766,
"train_samples_per_second": 25.451,
"train_steps_per_second": 0.177
}
],
"logging_steps": 10,
"max_steps": 160,
"num_train_epochs": 32,
"save_steps": 500,
"total_flos": 1.5536429521628037e+18,
"trial_name": null,
"trial_params": null
}