dima806's picture
Upload folder using huggingface_hub
4e8ea47
raw
history blame
7 kB
{
"best_metric": 0.8303472995758057,
"best_model_checkpoint": "face_emotions_image_detection/checkpoint-6800",
"epoch": 20.0,
"eval_steps": 500,
"global_step": 6800,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_accuracy": 0.5581299131154324,
"eval_loss": 1.5780813694000244,
"eval_runtime": 34.4094,
"eval_samples_per_second": 70.242,
"eval_steps_per_second": 2.209,
"step": 340
},
{
"epoch": 1.47,
"learning_rate": 9.333333333333333e-07,
"loss": 1.5754,
"step": 500
},
{
"epoch": 2.0,
"eval_accuracy": 0.6235002068680182,
"eval_loss": 1.4531924724578857,
"eval_runtime": 33.5063,
"eval_samples_per_second": 72.136,
"eval_steps_per_second": 2.268,
"step": 680
},
{
"epoch": 2.94,
"learning_rate": 8.592592592592592e-07,
"loss": 1.3718,
"step": 1000
},
{
"epoch": 3.0,
"eval_accuracy": 0.6607364501448076,
"eval_loss": 1.335525631904602,
"eval_runtime": 33.5199,
"eval_samples_per_second": 72.107,
"eval_steps_per_second": 2.267,
"step": 1020
},
{
"epoch": 4.0,
"eval_accuracy": 0.676458419528341,
"eval_loss": 1.2385190725326538,
"eval_runtime": 33.0393,
"eval_samples_per_second": 73.155,
"eval_steps_per_second": 2.3,
"step": 1360
},
{
"epoch": 4.41,
"learning_rate": 7.851851851851852e-07,
"loss": 1.2055,
"step": 1500
},
{
"epoch": 5.0,
"eval_accuracy": 0.6830781961108813,
"eval_loss": 1.1576205492019653,
"eval_runtime": 34.4609,
"eval_samples_per_second": 70.137,
"eval_steps_per_second": 2.205,
"step": 1700
},
{
"epoch": 5.88,
"learning_rate": 7.111111111111111e-07,
"loss": 1.0902,
"step": 2000
},
{
"epoch": 6.0,
"eval_accuracy": 0.6963177492759619,
"eval_loss": 1.0941061973571777,
"eval_runtime": 33.7137,
"eval_samples_per_second": 71.692,
"eval_steps_per_second": 2.254,
"step": 2040
},
{
"epoch": 7.0,
"eval_accuracy": 0.7136946628051303,
"eval_loss": 1.0437400341033936,
"eval_runtime": 34.1074,
"eval_samples_per_second": 70.864,
"eval_steps_per_second": 2.228,
"step": 2380
},
{
"epoch": 7.35,
"learning_rate": 6.37037037037037e-07,
"loss": 0.9981,
"step": 2500
},
{
"epoch": 8.0,
"eval_accuracy": 0.7194869673148532,
"eval_loss": 0.999989926815033,
"eval_runtime": 34.4809,
"eval_samples_per_second": 70.097,
"eval_steps_per_second": 2.204,
"step": 2720
},
{
"epoch": 8.82,
"learning_rate": 5.62962962962963e-07,
"loss": 0.9352,
"step": 3000
},
{
"epoch": 9.0,
"eval_accuracy": 0.7273479520066197,
"eval_loss": 0.9669674634933472,
"eval_runtime": 34.4622,
"eval_samples_per_second": 70.135,
"eval_steps_per_second": 2.205,
"step": 3060
},
{
"epoch": 10.0,
"eval_accuracy": 0.7290028961522549,
"eval_loss": 0.9405105113983154,
"eval_runtime": 33.8763,
"eval_samples_per_second": 71.348,
"eval_steps_per_second": 2.243,
"step": 3400
},
{
"epoch": 10.29,
"learning_rate": 4.888888888888889e-07,
"loss": 0.8851,
"step": 3500
},
{
"epoch": 11.0,
"eval_accuracy": 0.7343814646255689,
"eval_loss": 0.9163816571235657,
"eval_runtime": 34.0893,
"eval_samples_per_second": 70.902,
"eval_steps_per_second": 2.229,
"step": 3740
},
{
"epoch": 11.76,
"learning_rate": 4.1481481481481476e-07,
"loss": 0.8465,
"step": 4000
},
{
"epoch": 12.0,
"eval_accuracy": 0.7347952006619777,
"eval_loss": 0.8966172933578491,
"eval_runtime": 34.3056,
"eval_samples_per_second": 70.455,
"eval_steps_per_second": 2.215,
"step": 4080
},
{
"epoch": 13.0,
"eval_accuracy": 0.7422424493173355,
"eval_loss": 0.8790085911750793,
"eval_runtime": 34.0958,
"eval_samples_per_second": 70.888,
"eval_steps_per_second": 2.229,
"step": 4420
},
{
"epoch": 13.24,
"learning_rate": 3.407407407407407e-07,
"loss": 0.8165,
"step": 4500
},
{
"epoch": 14.0,
"eval_accuracy": 0.7480347538270583,
"eval_loss": 0.8644098043441772,
"eval_runtime": 34.0216,
"eval_samples_per_second": 71.043,
"eval_steps_per_second": 2.234,
"step": 4760
},
{
"epoch": 14.71,
"learning_rate": 2.6666666666666667e-07,
"loss": 0.7954,
"step": 5000
},
{
"epoch": 15.0,
"eval_accuracy": 0.750517170045511,
"eval_loss": 0.8529735803604126,
"eval_runtime": 34.2111,
"eval_samples_per_second": 70.649,
"eval_steps_per_second": 2.221,
"step": 5100
},
{
"epoch": 16.0,
"eval_accuracy": 0.7509309060819197,
"eval_loss": 0.8457837104797363,
"eval_runtime": 33.6533,
"eval_samples_per_second": 71.821,
"eval_steps_per_second": 2.258,
"step": 5440
},
{
"epoch": 16.18,
"learning_rate": 1.9259259259259257e-07,
"loss": 0.7811,
"step": 5500
},
{
"epoch": 17.0,
"eval_accuracy": 0.7534133223003724,
"eval_loss": 0.8384882211685181,
"eval_runtime": 33.6326,
"eval_samples_per_second": 71.865,
"eval_steps_per_second": 2.26,
"step": 5780
},
{
"epoch": 17.65,
"learning_rate": 1.1851851851851851e-07,
"loss": 0.7673,
"step": 6000
},
{
"epoch": 18.0,
"eval_accuracy": 0.7550682664460074,
"eval_loss": 0.8335217237472534,
"eval_runtime": 33.2974,
"eval_samples_per_second": 72.588,
"eval_steps_per_second": 2.282,
"step": 6120
},
{
"epoch": 19.0,
"eval_accuracy": 0.7529995862639636,
"eval_loss": 0.8314878940582275,
"eval_runtime": 33.8017,
"eval_samples_per_second": 71.505,
"eval_steps_per_second": 2.248,
"step": 6460
},
{
"epoch": 19.12,
"learning_rate": 4.444444444444444e-08,
"loss": 0.7594,
"step": 6500
},
{
"epoch": 20.0,
"eval_accuracy": 0.7538270583367811,
"eval_loss": 0.8303472995758057,
"eval_runtime": 34.3877,
"eval_samples_per_second": 70.287,
"eval_steps_per_second": 2.21,
"step": 6800
}
],
"logging_steps": 500,
"max_steps": 6800,
"num_input_tokens_seen": 0,
"num_train_epochs": 20,
"save_steps": 500,
"total_flos": 3.3702474498545664e+19,
"train_batch_size": 64,
"trial_name": null,
"trial_params": null
}