paul
End of training
56b615b
{
"best_metric": 0.8578052550231839,
"best_model_checkpoint": "swin-base-patch4-window7-224-in22k-finetuned-memes/checkpoint-340",
"epoch": 19.987654320987655,
"global_step": 400,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.49,
"learning_rate": 3e-05,
"loss": 1.5528,
"step": 10
},
{
"epoch": 0.99,
"learning_rate": 6e-05,
"loss": 1.1655,
"step": 20
},
{
"epoch": 0.99,
"eval_accuracy": 0.6955177743431221,
"eval_f1": 0.6682587615239292,
"eval_loss": 0.8572999835014343,
"eval_precision": 0.6952978724784165,
"eval_recall": 0.6955177743431221,
"eval_runtime": 14.2645,
"eval_samples_per_second": 90.715,
"eval_steps_per_second": 1.472,
"step": 20
},
{
"epoch": 1.49,
"learning_rate": 9e-05,
"loss": 0.7275,
"step": 30
},
{
"epoch": 1.99,
"learning_rate": 0.00012,
"loss": 0.5506,
"step": 40
},
{
"epoch": 1.99,
"eval_accuracy": 0.8083462132921174,
"eval_f1": 0.7962870636686081,
"eval_loss": 0.5326675176620483,
"eval_precision": 0.8049703591765521,
"eval_recall": 0.8083462132921174,
"eval_runtime": 12.6486,
"eval_samples_per_second": 102.304,
"eval_steps_per_second": 1.66,
"step": 40
},
{
"epoch": 2.49,
"learning_rate": 0.00011666666666666667,
"loss": 0.3788,
"step": 50
},
{
"epoch": 2.99,
"learning_rate": 0.00011333333333333333,
"loss": 0.3573,
"step": 60
},
{
"epoch": 2.99,
"eval_accuracy": 0.8338485316846986,
"eval_f1": 0.831666163408815,
"eval_loss": 0.4496992528438568,
"eval_precision": 0.8339121233593048,
"eval_recall": 0.8338485316846986,
"eval_runtime": 12.8713,
"eval_samples_per_second": 100.534,
"eval_steps_per_second": 1.632,
"step": 60
},
{
"epoch": 3.49,
"learning_rate": 0.00011,
"loss": 0.2378,
"step": 70
},
{
"epoch": 3.99,
"learning_rate": 0.00010666666666666667,
"loss": 0.2083,
"step": 80
},
{
"epoch": 3.99,
"eval_accuracy": 0.8353941267387944,
"eval_f1": 0.8368249403721092,
"eval_loss": 0.45606011152267456,
"eval_precision": 0.84498910302744,
"eval_recall": 0.8353941267387944,
"eval_runtime": 12.8489,
"eval_samples_per_second": 100.709,
"eval_steps_per_second": 1.634,
"step": 80
},
{
"epoch": 4.49,
"learning_rate": 0.00010333333333333334,
"loss": 0.1314,
"step": 90
},
{
"epoch": 4.99,
"learning_rate": 0.0001,
"loss": 0.1545,
"step": 100
},
{
"epoch": 4.99,
"eval_accuracy": 0.8423493044822257,
"eval_f1": 0.8429773996176875,
"eval_loss": 0.4605261981487274,
"eval_precision": 0.8457880236763888,
"eval_recall": 0.8423493044822257,
"eval_runtime": 13.8028,
"eval_samples_per_second": 93.749,
"eval_steps_per_second": 1.521,
"step": 100
},
{
"epoch": 5.49,
"learning_rate": 9.666666666666667e-05,
"loss": 0.124,
"step": 110
},
{
"epoch": 5.99,
"learning_rate": 9.333333333333334e-05,
"loss": 0.1014,
"step": 120
},
{
"epoch": 5.99,
"eval_accuracy": 0.8523956723338485,
"eval_f1": 0.8538473676550408,
"eval_loss": 0.4924044609069824,
"eval_precision": 0.8570555975028126,
"eval_recall": 0.8523956723338485,
"eval_runtime": 13.153,
"eval_samples_per_second": 98.381,
"eval_steps_per_second": 1.597,
"step": 120
},
{
"epoch": 6.49,
"learning_rate": 9e-05,
"loss": 0.0886,
"step": 130
},
{
"epoch": 6.99,
"learning_rate": 8.666666666666667e-05,
"loss": 0.0854,
"step": 140
},
{
"epoch": 6.99,
"eval_accuracy": 0.839258114374034,
"eval_f1": 0.8399595295849303,
"eval_loss": 0.575903594493866,
"eval_precision": 0.8452221761378239,
"eval_recall": 0.839258114374034,
"eval_runtime": 12.9566,
"eval_samples_per_second": 99.872,
"eval_steps_per_second": 1.621,
"step": 140
},
{
"epoch": 7.49,
"learning_rate": 8.333333333333333e-05,
"loss": 0.0804,
"step": 150
},
{
"epoch": 7.99,
"learning_rate": 7.999999999999999e-05,
"loss": 0.1012,
"step": 160
},
{
"epoch": 7.99,
"eval_accuracy": 0.8361669242658424,
"eval_f1": 0.8361306593636055,
"eval_loss": 0.5141878724098206,
"eval_precision": 0.8378496563621973,
"eval_recall": 0.8361669242658424,
"eval_runtime": 12.9916,
"eval_samples_per_second": 99.602,
"eval_steps_per_second": 1.616,
"step": 160
},
{
"epoch": 8.49,
"learning_rate": 7.666666666666667e-05,
"loss": 0.0745,
"step": 170
},
{
"epoch": 8.99,
"learning_rate": 7.333333333333334e-05,
"loss": 0.077,
"step": 180
},
{
"epoch": 8.99,
"eval_accuracy": 0.8330757341576507,
"eval_f1": 0.8406946514001388,
"eval_loss": 0.5646628141403198,
"eval_precision": 0.8537522286474765,
"eval_recall": 0.8330757341576507,
"eval_runtime": 13.9321,
"eval_samples_per_second": 92.879,
"eval_steps_per_second": 1.507,
"step": 180
},
{
"epoch": 9.49,
"learning_rate": 7.000000000000001e-05,
"loss": 0.0587,
"step": 190
},
{
"epoch": 9.99,
"learning_rate": 6.666666666666667e-05,
"loss": 0.0667,
"step": 200
},
{
"epoch": 9.99,
"eval_accuracy": 0.8462132921174652,
"eval_f1": 0.8482978184490837,
"eval_loss": 0.5293765068054199,
"eval_precision": 0.8508576163797781,
"eval_recall": 0.8462132921174652,
"eval_runtime": 13.4474,
"eval_samples_per_second": 96.227,
"eval_steps_per_second": 1.562,
"step": 200
},
{
"epoch": 10.49,
"learning_rate": 6.333333333333333e-05,
"loss": 0.0452,
"step": 210
},
{
"epoch": 10.99,
"learning_rate": 6e-05,
"loss": 0.0666,
"step": 220
},
{
"epoch": 10.99,
"eval_accuracy": 0.8384853168469861,
"eval_f1": 0.839606513626033,
"eval_loss": 0.6037518382072449,
"eval_precision": 0.84149883116413,
"eval_recall": 0.8384853168469861,
"eval_runtime": 12.7726,
"eval_samples_per_second": 101.311,
"eval_steps_per_second": 1.644,
"step": 220
},
{
"epoch": 11.49,
"learning_rate": 5.6666666666666664e-05,
"loss": 0.0577,
"step": 230
},
{
"epoch": 11.99,
"learning_rate": 5.333333333333333e-05,
"loss": 0.0574,
"step": 240
},
{
"epoch": 11.99,
"eval_accuracy": 0.8408037094281299,
"eval_f1": 0.8411127335807149,
"eval_loss": 0.6383613348007202,
"eval_precision": 0.8431342855971845,
"eval_recall": 0.8408037094281299,
"eval_runtime": 13.1432,
"eval_samples_per_second": 98.454,
"eval_steps_per_second": 1.598,
"step": 240
},
{
"epoch": 12.49,
"learning_rate": 5e-05,
"loss": 0.0509,
"step": 250
},
{
"epoch": 12.99,
"learning_rate": 4.666666666666667e-05,
"loss": 0.0488,
"step": 260
},
{
"epoch": 12.99,
"eval_accuracy": 0.8516228748068007,
"eval_f1": 0.8532381219142173,
"eval_loss": 0.6304579973220825,
"eval_precision": 0.8561226939263563,
"eval_recall": 0.8516228748068007,
"eval_runtime": 13.6608,
"eval_samples_per_second": 94.723,
"eval_steps_per_second": 1.537,
"step": 260
},
{
"epoch": 13.49,
"learning_rate": 4.3333333333333334e-05,
"loss": 0.0517,
"step": 270
},
{
"epoch": 13.99,
"learning_rate": 3.9999999999999996e-05,
"loss": 0.0524,
"step": 280
},
{
"epoch": 13.99,
"eval_accuracy": 0.8508500772797527,
"eval_f1": 0.8510093409043722,
"eval_loss": 0.6410980224609375,
"eval_precision": 0.8526221088238606,
"eval_recall": 0.8508500772797527,
"eval_runtime": 12.8216,
"eval_samples_per_second": 100.923,
"eval_steps_per_second": 1.638,
"step": 280
},
{
"epoch": 14.49,
"learning_rate": 3.666666666666667e-05,
"loss": 0.0377,
"step": 290
},
{
"epoch": 14.99,
"learning_rate": 3.3333333333333335e-05,
"loss": 0.0511,
"step": 300
},
{
"epoch": 14.99,
"eval_accuracy": 0.8547140649149922,
"eval_f1": 0.8543059086099318,
"eval_loss": 0.6461631655693054,
"eval_precision": 0.8541819570387084,
"eval_recall": 0.8547140649149922,
"eval_runtime": 14.3489,
"eval_samples_per_second": 90.181,
"eval_steps_per_second": 1.464,
"step": 300
},
{
"epoch": 15.49,
"learning_rate": 3e-05,
"loss": 0.0446,
"step": 310
},
{
"epoch": 15.99,
"learning_rate": 2.6666666666666667e-05,
"loss": 0.0495,
"step": 320
},
{
"epoch": 15.99,
"eval_accuracy": 0.8531684698608965,
"eval_f1": 0.8527356330319577,
"eval_loss": 0.6869231462478638,
"eval_precision": 0.8533821751799587,
"eval_recall": 0.8531684698608965,
"eval_runtime": 12.6457,
"eval_samples_per_second": 102.327,
"eval_steps_per_second": 1.661,
"step": 320
},
{
"epoch": 16.49,
"learning_rate": 2.3333333333333336e-05,
"loss": 0.0489,
"step": 330
},
{
"epoch": 16.99,
"learning_rate": 1.9999999999999998e-05,
"loss": 0.0412,
"step": 340
},
{
"epoch": 16.99,
"eval_accuracy": 0.8578052550231839,
"eval_f1": 0.8563934506342421,
"eval_loss": 0.6643078327178955,
"eval_precision": 0.8553636638149845,
"eval_recall": 0.8578052550231839,
"eval_runtime": 13.1315,
"eval_samples_per_second": 98.542,
"eval_steps_per_second": 1.599,
"step": 340
},
{
"epoch": 17.49,
"learning_rate": 1.6666666666666667e-05,
"loss": 0.0447,
"step": 350
},
{
"epoch": 17.99,
"learning_rate": 1.3333333333333333e-05,
"loss": 0.0411,
"step": 360
},
{
"epoch": 17.99,
"eval_accuracy": 0.857032457496136,
"eval_f1": 0.8552106741098364,
"eval_loss": 0.7213734984397888,
"eval_precision": 0.8538988900347119,
"eval_recall": 0.857032457496136,
"eval_runtime": 12.729,
"eval_samples_per_second": 101.658,
"eval_steps_per_second": 1.65,
"step": 360
},
{
"epoch": 18.49,
"learning_rate": 9.999999999999999e-06,
"loss": 0.0411,
"step": 370
},
{
"epoch": 18.99,
"learning_rate": 6.666666666666667e-06,
"loss": 0.0434,
"step": 380
},
{
"epoch": 18.99,
"eval_accuracy": 0.8523956723338485,
"eval_f1": 0.8514088692604659,
"eval_loss": 0.7037173509597778,
"eval_precision": 0.850651377920994,
"eval_recall": 0.8523956723338485,
"eval_runtime": 13.5738,
"eval_samples_per_second": 95.331,
"eval_steps_per_second": 1.547,
"step": 380
},
{
"epoch": 19.49,
"learning_rate": 3.3333333333333333e-06,
"loss": 0.0445,
"step": 390
},
{
"epoch": 19.99,
"learning_rate": 0.0,
"loss": 0.0394,
"step": 400
},
{
"epoch": 19.99,
"eval_accuracy": 0.8562596599690881,
"eval_f1": 0.8552274649509984,
"eval_loss": 0.7093907594680786,
"eval_precision": 0.8545652818321074,
"eval_recall": 0.8562596599690881,
"eval_runtime": 12.9239,
"eval_samples_per_second": 100.124,
"eval_steps_per_second": 1.625,
"step": 400
},
{
"epoch": 19.99,
"step": 400,
"total_flos": 8.103254675374559e+18,
"train_loss": 0.18201538026332856,
"train_runtime": 1691.2716,
"train_samples_per_second": 61.185,
"train_steps_per_second": 0.237
}
],
"max_steps": 400,
"num_train_epochs": 20,
"total_flos": 8.103254675374559e+18,
"trial_name": null,
"trial_params": null
}