klobasa-ni-klobasa / trainer_state.json
pcernuta's picture
End of training
4f9e986
raw
history blame
No virus
8.78 kB
{
"best_metric": 0.8958333333333334,
"best_model_checkpoint": "convnext-tiny-224-klobasaniklobasa/checkpoint-288",
"epoch": 10.0,
"global_step": 480,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.21,
"learning_rate": 8.333333333333334e-06,
"loss": 0.608,
"step": 10
},
{
"epoch": 0.42,
"learning_rate": 1.6666666666666667e-05,
"loss": 0.6676,
"step": 20
},
{
"epoch": 0.62,
"learning_rate": 2.5e-05,
"loss": 0.6403,
"step": 30
},
{
"epoch": 0.83,
"learning_rate": 3.3333333333333335e-05,
"loss": 0.7062,
"step": 40
},
{
"epoch": 1.0,
"eval_accuracy": 0.84375,
"eval_loss": 0.7115556597709656,
"eval_runtime": 3.3605,
"eval_samples_per_second": 28.567,
"eval_steps_per_second": 3.571,
"step": 48
},
{
"epoch": 1.04,
"learning_rate": 3.981481481481482e-05,
"loss": 0.5469,
"step": 50
},
{
"epoch": 1.25,
"learning_rate": 3.888888888888889e-05,
"loss": 0.5691,
"step": 60
},
{
"epoch": 1.46,
"learning_rate": 3.7962962962962964e-05,
"loss": 0.5161,
"step": 70
},
{
"epoch": 1.67,
"learning_rate": 3.703703703703704e-05,
"loss": 0.4157,
"step": 80
},
{
"epoch": 1.88,
"learning_rate": 3.6111111111111116e-05,
"loss": 0.4831,
"step": 90
},
{
"epoch": 2.0,
"eval_accuracy": 0.8333333333333334,
"eval_loss": 0.5967997312545776,
"eval_runtime": 3.6773,
"eval_samples_per_second": 26.106,
"eval_steps_per_second": 3.263,
"step": 96
},
{
"epoch": 2.08,
"learning_rate": 3.518518518518519e-05,
"loss": 0.3808,
"step": 100
},
{
"epoch": 2.29,
"learning_rate": 3.425925925925926e-05,
"loss": 0.3956,
"step": 110
},
{
"epoch": 2.5,
"learning_rate": 3.3333333333333335e-05,
"loss": 0.3992,
"step": 120
},
{
"epoch": 2.71,
"learning_rate": 3.2407407407407415e-05,
"loss": 0.3256,
"step": 130
},
{
"epoch": 2.92,
"learning_rate": 3.148148148148149e-05,
"loss": 0.2429,
"step": 140
},
{
"epoch": 3.0,
"eval_accuracy": 0.8541666666666666,
"eval_loss": 0.5383699536323547,
"eval_runtime": 3.5584,
"eval_samples_per_second": 26.979,
"eval_steps_per_second": 3.372,
"step": 144
},
{
"epoch": 3.12,
"learning_rate": 3.0555555555555554e-05,
"loss": 0.2586,
"step": 150
},
{
"epoch": 3.33,
"learning_rate": 2.962962962962963e-05,
"loss": 0.3041,
"step": 160
},
{
"epoch": 3.54,
"learning_rate": 2.8703703703703706e-05,
"loss": 0.2511,
"step": 170
},
{
"epoch": 3.75,
"learning_rate": 2.777777777777778e-05,
"loss": 0.2165,
"step": 180
},
{
"epoch": 3.96,
"learning_rate": 2.6851851851851852e-05,
"loss": 0.2292,
"step": 190
},
{
"epoch": 4.0,
"eval_accuracy": 0.84375,
"eval_loss": 0.4995401203632355,
"eval_runtime": 3.5701,
"eval_samples_per_second": 26.89,
"eval_steps_per_second": 3.361,
"step": 192
},
{
"epoch": 4.17,
"learning_rate": 2.5925925925925928e-05,
"loss": 0.2336,
"step": 200
},
{
"epoch": 4.38,
"learning_rate": 2.5e-05,
"loss": 0.1827,
"step": 210
},
{
"epoch": 4.58,
"learning_rate": 2.4074074074074077e-05,
"loss": 0.1918,
"step": 220
},
{
"epoch": 4.79,
"learning_rate": 2.314814814814815e-05,
"loss": 0.1316,
"step": 230
},
{
"epoch": 5.0,
"learning_rate": 2.2222222222222227e-05,
"loss": 0.1549,
"step": 240
},
{
"epoch": 5.0,
"eval_accuracy": 0.8854166666666666,
"eval_loss": 0.45076122879981995,
"eval_runtime": 3.3498,
"eval_samples_per_second": 28.658,
"eval_steps_per_second": 3.582,
"step": 240
},
{
"epoch": 5.21,
"learning_rate": 2.12962962962963e-05,
"loss": 0.0792,
"step": 250
},
{
"epoch": 5.42,
"learning_rate": 2.0370370370370372e-05,
"loss": 0.1449,
"step": 260
},
{
"epoch": 5.62,
"learning_rate": 1.9444444444444445e-05,
"loss": 0.0869,
"step": 270
},
{
"epoch": 5.83,
"learning_rate": 1.851851851851852e-05,
"loss": 0.1682,
"step": 280
},
{
"epoch": 6.0,
"eval_accuracy": 0.8958333333333334,
"eval_loss": 0.4400902986526489,
"eval_runtime": 3.566,
"eval_samples_per_second": 26.921,
"eval_steps_per_second": 3.365,
"step": 288
},
{
"epoch": 6.04,
"learning_rate": 1.7592592592592595e-05,
"loss": 0.1264,
"step": 290
},
{
"epoch": 6.25,
"learning_rate": 1.6666666666666667e-05,
"loss": 0.1211,
"step": 300
},
{
"epoch": 6.46,
"learning_rate": 1.5740740740740744e-05,
"loss": 0.0649,
"step": 310
},
{
"epoch": 6.67,
"learning_rate": 1.4814814814814815e-05,
"loss": 0.1159,
"step": 320
},
{
"epoch": 6.88,
"learning_rate": 1.388888888888889e-05,
"loss": 0.1736,
"step": 330
},
{
"epoch": 7.0,
"eval_accuracy": 0.8958333333333334,
"eval_loss": 0.4440065622329712,
"eval_runtime": 3.5045,
"eval_samples_per_second": 27.393,
"eval_steps_per_second": 3.424,
"step": 336
},
{
"epoch": 7.08,
"learning_rate": 1.2962962962962964e-05,
"loss": 0.0679,
"step": 340
},
{
"epoch": 7.29,
"learning_rate": 1.2037037037037039e-05,
"loss": 0.0915,
"step": 350
},
{
"epoch": 7.5,
"learning_rate": 1.1111111111111113e-05,
"loss": 0.1254,
"step": 360
},
{
"epoch": 7.71,
"learning_rate": 1.0185185185185186e-05,
"loss": 0.0588,
"step": 370
},
{
"epoch": 7.92,
"learning_rate": 9.25925925925926e-06,
"loss": 0.0633,
"step": 380
},
{
"epoch": 8.0,
"eval_accuracy": 0.8958333333333334,
"eval_loss": 0.44057992100715637,
"eval_runtime": 3.5708,
"eval_samples_per_second": 26.885,
"eval_steps_per_second": 3.361,
"step": 384
},
{
"epoch": 8.12,
"learning_rate": 8.333333333333334e-06,
"loss": 0.0512,
"step": 390
},
{
"epoch": 8.33,
"learning_rate": 7.4074074074074075e-06,
"loss": 0.129,
"step": 400
},
{
"epoch": 8.54,
"learning_rate": 6.481481481481482e-06,
"loss": 0.0776,
"step": 410
},
{
"epoch": 8.75,
"learning_rate": 5.555555555555557e-06,
"loss": 0.0628,
"step": 420
},
{
"epoch": 8.96,
"learning_rate": 4.62962962962963e-06,
"loss": 0.0689,
"step": 430
},
{
"epoch": 9.0,
"eval_accuracy": 0.8958333333333334,
"eval_loss": 0.4371330738067627,
"eval_runtime": 3.3898,
"eval_samples_per_second": 28.32,
"eval_steps_per_second": 3.54,
"step": 432
},
{
"epoch": 9.17,
"learning_rate": 3.7037037037037037e-06,
"loss": 0.0947,
"step": 440
},
{
"epoch": 9.38,
"learning_rate": 2.7777777777777783e-06,
"loss": 0.1003,
"step": 450
},
{
"epoch": 9.58,
"learning_rate": 1.8518518518518519e-06,
"loss": 0.0593,
"step": 460
},
{
"epoch": 9.79,
"learning_rate": 9.259259259259259e-07,
"loss": 0.0722,
"step": 470
},
{
"epoch": 10.0,
"learning_rate": 0.0,
"loss": 0.0558,
"step": 480
},
{
"epoch": 10.0,
"eval_accuracy": 0.8958333333333334,
"eval_loss": 0.43337997794151306,
"eval_runtime": 4.6987,
"eval_samples_per_second": 20.431,
"eval_steps_per_second": 2.554,
"step": 480
},
{
"epoch": 10.0,
"step": 480,
"total_flos": 9.499297468243968e+16,
"train_loss": 0.23564616565903027,
"train_runtime": 303.0343,
"train_samples_per_second": 12.474,
"train_steps_per_second": 1.584
}
],
"max_steps": 480,
"num_train_epochs": 10,
"total_flos": 9.499297468243968e+16,
"trial_name": null,
"trial_params": null
}