|
{ |
|
"best_metric": 0.7796974441892816, |
|
"best_model_checkpoint": "/home/hoan/projects/nsfw/models/efficientvit_l1.r224_in1k/run-hgfebf69/checkpoint-595", |
|
"epoch": 28.0, |
|
"eval_steps": 500, |
|
"global_step": 595, |
|
"is_hyper_param_search": true, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.61, |
|
"learning_rate": 1.452508274337144e-07, |
|
"loss": 1.5355, |
|
"step": 13 |
|
}, |
|
{ |
|
"epoch": 0.99, |
|
"eval_accuracy": 0.3932926829268293, |
|
"eval_f1": 0.484929996783293, |
|
"eval_loss": 1.5276610851287842, |
|
"eval_precision": 0.6852684114434121, |
|
"eval_recall": 0.3932926829268293, |
|
"eval_runtime": 8.1255, |
|
"eval_samples_per_second": 444.032, |
|
"eval_steps_per_second": 3.569, |
|
"step": 21 |
|
}, |
|
{ |
|
"epoch": 1.22, |
|
"learning_rate": 2.905016548674288e-07, |
|
"loss": 1.5334, |
|
"step": 26 |
|
}, |
|
{ |
|
"epoch": 1.84, |
|
"learning_rate": 4.357524823011432e-07, |
|
"loss": 1.5242, |
|
"step": 39 |
|
}, |
|
{ |
|
"epoch": 1.98, |
|
"eval_accuracy": 0.4584257206208426, |
|
"eval_f1": 0.5440289476561175, |
|
"eval_loss": 1.5126081705093384, |
|
"eval_precision": 0.6975641567116644, |
|
"eval_recall": 0.4584257206208426, |
|
"eval_runtime": 8.3776, |
|
"eval_samples_per_second": 430.674, |
|
"eval_steps_per_second": 3.462, |
|
"step": 42 |
|
}, |
|
{ |
|
"epoch": 2.45, |
|
"learning_rate": 5.810033097348576e-07, |
|
"loss": 1.5104, |
|
"step": 52 |
|
}, |
|
{ |
|
"epoch": 2.96, |
|
"eval_accuracy": 0.5296563192904656, |
|
"eval_f1": 0.5944990700609136, |
|
"eval_loss": 1.4862231016159058, |
|
"eval_precision": 0.6890568361070714, |
|
"eval_recall": 0.5296563192904656, |
|
"eval_runtime": 8.1023, |
|
"eval_samples_per_second": 445.304, |
|
"eval_steps_per_second": 3.579, |
|
"step": 63 |
|
}, |
|
{ |
|
"epoch": 3.06, |
|
"learning_rate": 7.262541371685721e-07, |
|
"loss": 1.493, |
|
"step": 65 |
|
}, |
|
{ |
|
"epoch": 3.67, |
|
"learning_rate": 8.715049646022864e-07, |
|
"loss": 1.4698, |
|
"step": 78 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.6513303769401331, |
|
"eval_f1": 0.6736289843952361, |
|
"eval_loss": 1.4428884983062744, |
|
"eval_precision": 0.7042447934146061, |
|
"eval_recall": 0.6513303769401331, |
|
"eval_runtime": 8.2686, |
|
"eval_samples_per_second": 436.352, |
|
"eval_steps_per_second": 3.507, |
|
"step": 85 |
|
}, |
|
{ |
|
"epoch": 4.28, |
|
"learning_rate": 1.0167557920360007e-06, |
|
"loss": 1.4457, |
|
"step": 91 |
|
}, |
|
{ |
|
"epoch": 4.89, |
|
"learning_rate": 1.1620066194697152e-06, |
|
"loss": 1.4126, |
|
"step": 104 |
|
}, |
|
{ |
|
"epoch": 4.99, |
|
"eval_accuracy": 0.7513858093126385, |
|
"eval_f1": 0.7236423084979209, |
|
"eval_loss": 1.3878988027572632, |
|
"eval_precision": 0.704223393234371, |
|
"eval_recall": 0.7513858093126385, |
|
"eval_runtime": 8.0477, |
|
"eval_samples_per_second": 448.328, |
|
"eval_steps_per_second": 3.604, |
|
"step": 106 |
|
}, |
|
{ |
|
"epoch": 5.51, |
|
"learning_rate": 1.3072574469034296e-06, |
|
"loss": 1.3745, |
|
"step": 117 |
|
}, |
|
{ |
|
"epoch": 5.98, |
|
"eval_accuracy": 0.8009977827050998, |
|
"eval_f1": 0.7446621793568696, |
|
"eval_loss": 1.3229458332061768, |
|
"eval_precision": 0.7198332904237893, |
|
"eval_recall": 0.8009977827050998, |
|
"eval_runtime": 8.341, |
|
"eval_samples_per_second": 432.564, |
|
"eval_steps_per_second": 3.477, |
|
"step": 127 |
|
}, |
|
{ |
|
"epoch": 6.12, |
|
"learning_rate": 1.4075969248184277e-06, |
|
"loss": 1.3395, |
|
"step": 130 |
|
}, |
|
{ |
|
"epoch": 6.73, |
|
"learning_rate": 1.4038673596551303e-06, |
|
"loss": 1.2941, |
|
"step": 143 |
|
}, |
|
{ |
|
"epoch": 6.96, |
|
"eval_accuracy": 0.8245565410199557, |
|
"eval_f1": 0.7506711729341005, |
|
"eval_loss": 1.2522051334381104, |
|
"eval_precision": 0.7225360812946281, |
|
"eval_recall": 0.8245565410199557, |
|
"eval_runtime": 8.1304, |
|
"eval_samples_per_second": 443.768, |
|
"eval_steps_per_second": 3.567, |
|
"step": 148 |
|
}, |
|
{ |
|
"epoch": 7.34, |
|
"learning_rate": 1.3955441156005382e-06, |
|
"loss": 1.2525, |
|
"step": 156 |
|
}, |
|
{ |
|
"epoch": 7.95, |
|
"learning_rate": 1.3826818162583345e-06, |
|
"loss": 1.2116, |
|
"step": 169 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.8276053215077606, |
|
"eval_f1": 0.7512743652414022, |
|
"eval_loss": 1.1887985467910767, |
|
"eval_precision": 0.7288159081513773, |
|
"eval_recall": 0.8276053215077606, |
|
"eval_runtime": 8.187, |
|
"eval_samples_per_second": 440.697, |
|
"eval_steps_per_second": 3.542, |
|
"step": 170 |
|
}, |
|
{ |
|
"epoch": 8.56, |
|
"learning_rate": 1.3653648740447739e-06, |
|
"loss": 1.168, |
|
"step": 182 |
|
}, |
|
{ |
|
"epoch": 8.99, |
|
"eval_accuracy": 0.8284368070953437, |
|
"eval_f1": 0.7508179552480237, |
|
"eval_loss": 1.1201469898223877, |
|
"eval_precision": 0.6864978143631778, |
|
"eval_recall": 0.8284368070953437, |
|
"eval_runtime": 8.4146, |
|
"eval_samples_per_second": 428.78, |
|
"eval_steps_per_second": 3.446, |
|
"step": 191 |
|
}, |
|
{ |
|
"epoch": 9.18, |
|
"learning_rate": 1.343706936208727e-06, |
|
"loss": 1.1394, |
|
"step": 195 |
|
}, |
|
{ |
|
"epoch": 9.79, |
|
"learning_rate": 1.3178501389900054e-06, |
|
"loss": 1.1014, |
|
"step": 208 |
|
}, |
|
{ |
|
"epoch": 9.98, |
|
"eval_accuracy": 0.8287139689578714, |
|
"eval_f1": 0.7513704434640557, |
|
"eval_loss": 1.0765742063522339, |
|
"eval_precision": 0.7699235349840203, |
|
"eval_recall": 0.8287139689578714, |
|
"eval_runtime": 8.0122, |
|
"eval_samples_per_second": 450.311, |
|
"eval_steps_per_second": 3.619, |
|
"step": 212 |
|
}, |
|
{ |
|
"epoch": 10.4, |
|
"learning_rate": 1.2879641748107618e-06, |
|
"loss": 1.0706, |
|
"step": 221 |
|
}, |
|
{ |
|
"epoch": 10.96, |
|
"eval_accuracy": 0.8284368070953437, |
|
"eval_f1": 0.7507041432190336, |
|
"eval_loss": 1.0376129150390625, |
|
"eval_precision": 0.6863075433503277, |
|
"eval_recall": 0.8284368070953437, |
|
"eval_runtime": 8.5615, |
|
"eval_samples_per_second": 421.42, |
|
"eval_steps_per_second": 3.387, |
|
"step": 233 |
|
}, |
|
{ |
|
"epoch": 11.01, |
|
"learning_rate": 1.254245178621782e-06, |
|
"loss": 1.0439, |
|
"step": 234 |
|
}, |
|
{ |
|
"epoch": 11.62, |
|
"learning_rate": 1.2169144407123264e-06, |
|
"loss": 1.0194, |
|
"step": 247 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_accuracy": 0.8284368070953437, |
|
"eval_f1": 0.7508179552480237, |
|
"eval_loss": 1.0062154531478882, |
|
"eval_precision": 0.6864978143631778, |
|
"eval_recall": 0.8284368070953437, |
|
"eval_runtime": 8.4048, |
|
"eval_samples_per_second": 429.28, |
|
"eval_steps_per_second": 3.45, |
|
"step": 255 |
|
}, |
|
{ |
|
"epoch": 12.24, |
|
"learning_rate": 1.1762169544310694e-06, |
|
"loss": 1.0048, |
|
"step": 260 |
|
}, |
|
{ |
|
"epoch": 12.85, |
|
"learning_rate": 1.132419808349121e-06, |
|
"loss": 0.9997, |
|
"step": 273 |
|
}, |
|
{ |
|
"epoch": 12.99, |
|
"eval_accuracy": 0.8284368070953437, |
|
"eval_f1": 0.7508179552480237, |
|
"eval_loss": 0.9836404919624329, |
|
"eval_precision": 0.6864978143631778, |
|
"eval_recall": 0.8284368070953437, |
|
"eval_runtime": 8.5535, |
|
"eval_samples_per_second": 421.814, |
|
"eval_steps_per_second": 3.39, |
|
"step": 276 |
|
}, |
|
{ |
|
"epoch": 13.46, |
|
"learning_rate": 1.0858104334170029e-06, |
|
"loss": 0.9776, |
|
"step": 286 |
|
}, |
|
{ |
|
"epoch": 13.98, |
|
"eval_accuracy": 0.8284368070953437, |
|
"eval_f1": 0.7507041432190336, |
|
"eval_loss": 0.9691689610481262, |
|
"eval_precision": 0.6863075433503277, |
|
"eval_recall": 0.8284368070953437, |
|
"eval_runtime": 7.9567, |
|
"eval_samples_per_second": 453.453, |
|
"eval_steps_per_second": 3.645, |
|
"step": 297 |
|
}, |
|
{ |
|
"epoch": 14.07, |
|
"learning_rate": 1.0366947166191075e-06, |
|
"loss": 0.9671, |
|
"step": 299 |
|
}, |
|
{ |
|
"epoch": 14.68, |
|
"learning_rate": 9.853949935052988e-07, |
|
"loss": 0.9587, |
|
"step": 312 |
|
}, |
|
{ |
|
"epoch": 14.96, |
|
"eval_accuracy": 0.8292682926829268, |
|
"eval_f1": 0.7526922431410414, |
|
"eval_loss": 0.9562509059906006, |
|
"eval_precision": 0.7703043936882441, |
|
"eval_recall": 0.8292682926829268, |
|
"eval_runtime": 8.4186, |
|
"eval_samples_per_second": 428.574, |
|
"eval_steps_per_second": 3.445, |
|
"step": 318 |
|
}, |
|
{ |
|
"epoch": 15.29, |
|
"learning_rate": 9.32247932774231e-07, |
|
"loss": 0.9463, |
|
"step": 325 |
|
}, |
|
{ |
|
"epoch": 15.91, |
|
"learning_rate": 8.776023267913875e-07, |
|
"loss": 0.9492, |
|
"step": 338 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_accuracy": 0.83009977827051, |
|
"eval_f1": 0.7547519055308186, |
|
"eval_loss": 0.9446051120758057, |
|
"eval_precision": 0.7591494201844647, |
|
"eval_recall": 0.83009977827051, |
|
"eval_runtime": 8.2197, |
|
"eval_samples_per_second": 438.947, |
|
"eval_steps_per_second": 3.528, |
|
"step": 340 |
|
}, |
|
{ |
|
"epoch": 16.52, |
|
"learning_rate": 8.218168025421926e-07, |
|
"loss": 0.9437, |
|
"step": 351 |
|
}, |
|
{ |
|
"epoch": 16.99, |
|
"eval_accuracy": 0.83009977827051, |
|
"eval_f1": 0.7553598948352633, |
|
"eval_loss": 0.9370310306549072, |
|
"eval_precision": 0.7528714352407055, |
|
"eval_recall": 0.83009977827051, |
|
"eval_runtime": 8.2035, |
|
"eval_samples_per_second": 439.813, |
|
"eval_steps_per_second": 3.535, |
|
"step": 361 |
|
}, |
|
{ |
|
"epoch": 17.13, |
|
"learning_rate": 7.652574680426876e-07, |
|
"loss": 0.9358, |
|
"step": 364 |
|
}, |
|
{ |
|
"epoch": 17.74, |
|
"learning_rate": 7.082955096538664e-07, |
|
"loss": 0.9363, |
|
"step": 377 |
|
}, |
|
{ |
|
"epoch": 17.98, |
|
"eval_accuracy": 0.8317627494456763, |
|
"eval_f1": 0.758845429136837, |
|
"eval_loss": 0.9373316168785095, |
|
"eval_precision": 0.7519338830068296, |
|
"eval_recall": 0.8317627494456763, |
|
"eval_runtime": 8.2615, |
|
"eval_samples_per_second": 436.724, |
|
"eval_steps_per_second": 3.51, |
|
"step": 382 |
|
}, |
|
{ |
|
"epoch": 18.35, |
|
"learning_rate": 6.513047560679618e-07, |
|
"loss": 0.9316, |
|
"step": 390 |
|
}, |
|
{ |
|
"epoch": 18.96, |
|
"learning_rate": 5.94659224953694e-07, |
|
"loss": 0.9264, |
|
"step": 403 |
|
}, |
|
{ |
|
"epoch": 18.96, |
|
"eval_accuracy": 0.8323170731707317, |
|
"eval_f1": 0.7606463034975902, |
|
"eval_loss": 0.9292559027671814, |
|
"eval_precision": 0.7526638484809335, |
|
"eval_recall": 0.8323170731707317, |
|
"eval_runtime": 8.115, |
|
"eval_samples_per_second": 444.609, |
|
"eval_steps_per_second": 3.574, |
|
"step": 403 |
|
}, |
|
{ |
|
"epoch": 19.58, |
|
"learning_rate": 5.387306683613124e-07, |
|
"loss": 0.9316, |
|
"step": 416 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_accuracy": 0.8328713968957872, |
|
"eval_f1": 0.762008565582684, |
|
"eval_loss": 0.9269818067550659, |
|
"eval_precision": 0.7475944578147732, |
|
"eval_recall": 0.8328713968957872, |
|
"eval_runtime": 8.3826, |
|
"eval_samples_per_second": 430.415, |
|
"eval_steps_per_second": 3.46, |
|
"step": 425 |
|
}, |
|
{ |
|
"epoch": 20.19, |
|
"learning_rate": 4.838861329963851e-07, |
|
"loss": 0.92, |
|
"step": 429 |
|
}, |
|
{ |
|
"epoch": 20.8, |
|
"learning_rate": 4.304855513737253e-07, |
|
"loss": 0.9174, |
|
"step": 442 |
|
}, |
|
{ |
|
"epoch": 20.99, |
|
"eval_accuracy": 0.8350886917960089, |
|
"eval_f1": 0.766268232245012, |
|
"eval_loss": 0.9251817464828491, |
|
"eval_precision": 0.7611039143133754, |
|
"eval_recall": 0.8350886917960089, |
|
"eval_runtime": 7.7339, |
|
"eval_samples_per_second": 466.52, |
|
"eval_steps_per_second": 3.75, |
|
"step": 446 |
|
}, |
|
{ |
|
"epoch": 21.41, |
|
"learning_rate": 3.7887937966016937e-07, |
|
"loss": 0.9212, |
|
"step": 455 |
|
}, |
|
{ |
|
"epoch": 21.98, |
|
"eval_accuracy": 0.8364745011086474, |
|
"eval_f1": 0.7701721753563872, |
|
"eval_loss": 0.9216660261154175, |
|
"eval_precision": 0.7861397608879442, |
|
"eval_recall": 0.8364745011086474, |
|
"eval_runtime": 8.2364, |
|
"eval_samples_per_second": 438.057, |
|
"eval_steps_per_second": 3.521, |
|
"step": 467 |
|
}, |
|
{ |
|
"epoch": 22.02, |
|
"learning_rate": 3.29406297708525e-07, |
|
"loss": 0.9222, |
|
"step": 468 |
|
}, |
|
{ |
|
"epoch": 22.64, |
|
"learning_rate": 2.8239098637685624e-07, |
|
"loss": 0.9142, |
|
"step": 481 |
|
}, |
|
{ |
|
"epoch": 22.96, |
|
"eval_accuracy": 0.8389689578713969, |
|
"eval_f1": 0.7751934812972323, |
|
"eval_loss": 0.9198487997055054, |
|
"eval_precision": 0.7580660317760047, |
|
"eval_recall": 0.8389689578713969, |
|
"eval_runtime": 8.1907, |
|
"eval_samples_per_second": 440.497, |
|
"eval_steps_per_second": 3.541, |
|
"step": 488 |
|
}, |
|
{ |
|
"epoch": 23.25, |
|
"learning_rate": 2.3814199672006268e-07, |
|
"loss": 0.9239, |
|
"step": 494 |
|
}, |
|
{ |
|
"epoch": 23.86, |
|
"learning_rate": 1.9694972503777733e-07, |
|
"loss": 0.9178, |
|
"step": 507 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_accuracy": 0.8356430155210643, |
|
"eval_f1": 0.7695758947830811, |
|
"eval_loss": 0.9179719686508179, |
|
"eval_precision": 0.7756305393423396, |
|
"eval_recall": 0.8356430155210643, |
|
"eval_runtime": 8.0754, |
|
"eval_samples_per_second": 446.788, |
|
"eval_steps_per_second": 3.591, |
|
"step": 510 |
|
}, |
|
{ |
|
"epoch": 24.47, |
|
"learning_rate": 1.5908450706789677e-07, |
|
"loss": 0.9152, |
|
"step": 520 |
|
}, |
|
{ |
|
"epoch": 24.99, |
|
"eval_accuracy": 0.8395232815964523, |
|
"eval_f1": 0.7765057889032959, |
|
"eval_loss": 0.9176101088523865, |
|
"eval_precision": 0.7933438992755063, |
|
"eval_recall": 0.8395232815964523, |
|
"eval_runtime": 8.0393, |
|
"eval_samples_per_second": 448.793, |
|
"eval_steps_per_second": 3.607, |
|
"step": 531 |
|
}, |
|
{ |
|
"epoch": 25.08, |
|
"learning_rate": 1.2479484383312357e-07, |
|
"loss": 0.9204, |
|
"step": 533 |
|
}, |
|
{ |
|
"epoch": 25.69, |
|
"learning_rate": 9.430577078390059e-08, |
|
"loss": 0.9096, |
|
"step": 546 |
|
}, |
|
{ |
|
"epoch": 25.98, |
|
"eval_accuracy": 0.8398004434589801, |
|
"eval_f1": 0.7763506725004051, |
|
"eval_loss": 0.9181774258613586, |
|
"eval_precision": 0.7954486998022142, |
|
"eval_recall": 0.8398004434589801, |
|
"eval_runtime": 8.1901, |
|
"eval_samples_per_second": 440.533, |
|
"eval_steps_per_second": 3.541, |
|
"step": 552 |
|
}, |
|
{ |
|
"epoch": 26.31, |
|
"learning_rate": 6.781738094068847e-08, |
|
"loss": 0.9157, |
|
"step": 559 |
|
}, |
|
{ |
|
"epoch": 26.92, |
|
"learning_rate": 4.550351172787507e-08, |
|
"loss": 0.9211, |
|
"step": 572 |
|
}, |
|
{ |
|
"epoch": 26.96, |
|
"eval_accuracy": 0.8364745011086474, |
|
"eval_f1": 0.7710155859925437, |
|
"eval_loss": 0.9194357991218567, |
|
"eval_precision": 0.7851756179427326, |
|
"eval_recall": 0.8364745011086474, |
|
"eval_runtime": 8.2806, |
|
"eval_samples_per_second": 435.717, |
|
"eval_steps_per_second": 3.502, |
|
"step": 573 |
|
}, |
|
{ |
|
"epoch": 27.53, |
|
"learning_rate": 2.751060411733735e-08, |
|
"loss": 0.912, |
|
"step": 585 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"eval_accuracy": 0.8409090909090909, |
|
"eval_f1": 0.7796974441892816, |
|
"eval_loss": 0.9164049625396729, |
|
"eval_precision": 0.796046494839443, |
|
"eval_recall": 0.8409090909090909, |
|
"eval_runtime": 8.3541, |
|
"eval_samples_per_second": 431.882, |
|
"eval_steps_per_second": 3.471, |
|
"step": 595 |
|
} |
|
], |
|
"logging_steps": 13, |
|
"max_steps": 630, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 30, |
|
"save_steps": 500, |
|
"total_flos": 0.0, |
|
"train_batch_size": 128, |
|
"trial_name": null, |
|
"trial_params": { |
|
"_wandb": {}, |
|
"assignments": {}, |
|
"label_smoothing_factor": 0.019838947875582387, |
|
"learning_rate": 1.4078157120498472e-06, |
|
"metric": "eval/loss", |
|
"weight_decay": 0.024972382732841077 |
|
} |
|
} |
|
|