Beans / trainer_state.json
NDSrex's picture
Upload folder using huggingface_hub
fd6bc47
{
"best_metric": 0.12367749214172363,
"best_model_checkpoint": "./vit-base-beans/checkpoint-300",
"epoch": 1.8072289156626506,
"global_step": 300,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.06,
"learning_rate": 0.00019951807228915663,
"loss": 1.6515,
"step": 10
},
{
"epoch": 0.12,
"learning_rate": 0.00019903614457831325,
"loss": 1.0551,
"step": 20
},
{
"epoch": 0.18,
"learning_rate": 0.0001985542168674699,
"loss": 0.6568,
"step": 30
},
{
"epoch": 0.24,
"learning_rate": 0.00019807228915662652,
"loss": 0.4811,
"step": 40
},
{
"epoch": 0.3,
"learning_rate": 0.00019759036144578314,
"loss": 0.3576,
"step": 50
},
{
"epoch": 0.36,
"learning_rate": 0.00019710843373493977,
"loss": 0.2787,
"step": 60
},
{
"epoch": 0.42,
"learning_rate": 0.00019662650602409642,
"loss": 0.233,
"step": 70
},
{
"epoch": 0.48,
"learning_rate": 0.000196144578313253,
"loss": 0.1287,
"step": 80
},
{
"epoch": 0.54,
"learning_rate": 0.00019566265060240966,
"loss": 0.1755,
"step": 90
},
{
"epoch": 0.6,
"learning_rate": 0.00019518072289156628,
"loss": 0.109,
"step": 100
},
{
"epoch": 0.6,
"eval_accuracy": 0.959349593495935,
"eval_loss": 0.16569873690605164,
"eval_runtime": 4.541,
"eval_samples_per_second": 54.173,
"eval_steps_per_second": 6.827,
"step": 100
},
{
"epoch": 0.66,
"learning_rate": 0.0001946987951807229,
"loss": 0.1129,
"step": 110
},
{
"epoch": 0.72,
"learning_rate": 0.00019421686746987952,
"loss": 0.1769,
"step": 120
},
{
"epoch": 0.78,
"learning_rate": 0.00019373493975903617,
"loss": 0.1511,
"step": 130
},
{
"epoch": 0.84,
"learning_rate": 0.00019325301204819277,
"loss": 0.2121,
"step": 140
},
{
"epoch": 0.9,
"learning_rate": 0.00019277108433734942,
"loss": 0.135,
"step": 150
},
{
"epoch": 0.96,
"learning_rate": 0.00019228915662650604,
"loss": 0.1046,
"step": 160
},
{
"epoch": 1.02,
"learning_rate": 0.00019180722891566266,
"loss": 0.0742,
"step": 170
},
{
"epoch": 1.08,
"learning_rate": 0.00019132530120481928,
"loss": 0.0655,
"step": 180
},
{
"epoch": 1.14,
"learning_rate": 0.00019084337349397593,
"loss": 0.0735,
"step": 190
},
{
"epoch": 1.2,
"learning_rate": 0.00019036144578313252,
"loss": 0.0599,
"step": 200
},
{
"epoch": 1.2,
"eval_accuracy": 0.9471544715447154,
"eval_loss": 0.16865180432796478,
"eval_runtime": 4.123,
"eval_samples_per_second": 59.665,
"eval_steps_per_second": 7.519,
"step": 200
},
{
"epoch": 1.27,
"learning_rate": 0.00018987951807228917,
"loss": 0.1547,
"step": 210
},
{
"epoch": 1.33,
"learning_rate": 0.0001893975903614458,
"loss": 0.0723,
"step": 220
},
{
"epoch": 1.39,
"learning_rate": 0.00018891566265060242,
"loss": 0.045,
"step": 230
},
{
"epoch": 1.45,
"learning_rate": 0.00018843373493975904,
"loss": 0.0339,
"step": 240
},
{
"epoch": 1.51,
"learning_rate": 0.00018795180722891569,
"loss": 0.0424,
"step": 250
},
{
"epoch": 1.57,
"learning_rate": 0.00018746987951807228,
"loss": 0.1061,
"step": 260
},
{
"epoch": 1.63,
"learning_rate": 0.00018698795180722893,
"loss": 0.0557,
"step": 270
},
{
"epoch": 1.69,
"learning_rate": 0.00018650602409638555,
"loss": 0.0491,
"step": 280
},
{
"epoch": 1.75,
"learning_rate": 0.00018602409638554217,
"loss": 0.0489,
"step": 290
},
{
"epoch": 1.81,
"learning_rate": 0.0001855421686746988,
"loss": 0.0387,
"step": 300
},
{
"epoch": 1.81,
"eval_accuracy": 0.9715447154471545,
"eval_loss": 0.12367749214172363,
"eval_runtime": 4.2743,
"eval_samples_per_second": 57.553,
"eval_steps_per_second": 7.253,
"step": 300
}
],
"max_steps": 4150,
"num_train_epochs": 25,
"total_flos": 3.716682371694674e+17,
"trial_name": null,
"trial_params": null
}