|
{ |
|
"best_metric": 0.8950359984842744, |
|
"best_model_checkpoint": "wavlm-large/checkpoint-15000", |
|
"epoch": 31.998484082870135, |
|
"global_step": 15808, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.01, |
|
"learning_rate": 9.487666034155598e-06, |
|
"loss": 4.7405, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 1.01, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.0, |
|
"eval_loss": 5.152532577514648, |
|
"eval_precision": 0.0, |
|
"eval_runtime": 231.7392, |
|
"eval_samples_per_second": 11.388, |
|
"eval_steps_per_second": 0.949, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 2.02, |
|
"learning_rate": 1.8975332068311197e-05, |
|
"loss": 4.4299, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 2.02, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.0, |
|
"eval_loss": 5.896852016448975, |
|
"eval_precision": 0.0, |
|
"eval_runtime": 229.527, |
|
"eval_samples_per_second": 11.498, |
|
"eval_steps_per_second": 0.958, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 3.04, |
|
"learning_rate": 2.846299810246679e-05, |
|
"loss": 4.2868, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 3.04, |
|
"eval_accuracy": 0.0018946570670708603, |
|
"eval_f1": 0.002260186233515175, |
|
"eval_loss": 4.930444717407227, |
|
"eval_precision": 0.0030713084224438304, |
|
"eval_runtime": 224.9204, |
|
"eval_samples_per_second": 11.733, |
|
"eval_steps_per_second": 0.978, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 4.05, |
|
"learning_rate": 2.9116468686300697e-05, |
|
"loss": 3.6242, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 4.05, |
|
"eval_accuracy": 0.04092459264873058, |
|
"eval_f1": 0.023734423060596616, |
|
"eval_loss": 4.339611053466797, |
|
"eval_precision": 0.02235030209371723, |
|
"eval_runtime": 231.3364, |
|
"eval_samples_per_second": 11.408, |
|
"eval_steps_per_second": 0.951, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 5.06, |
|
"learning_rate": 2.8062135376396992e-05, |
|
"loss": 2.686, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 5.06, |
|
"eval_accuracy": 0.054945054945054944, |
|
"eval_f1": 0.030815499275931264, |
|
"eval_loss": 3.9399423599243164, |
|
"eval_precision": 0.03198760556742773, |
|
"eval_runtime": 229.8015, |
|
"eval_samples_per_second": 11.484, |
|
"eval_steps_per_second": 0.957, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 6.07, |
|
"learning_rate": 2.700780206649329e-05, |
|
"loss": 1.9284, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 6.07, |
|
"eval_accuracy": 0.05001894657067071, |
|
"eval_f1": 0.044225493965773466, |
|
"eval_loss": 3.7735581398010254, |
|
"eval_precision": 0.07786075378351333, |
|
"eval_runtime": 229.6709, |
|
"eval_samples_per_second": 11.49, |
|
"eval_steps_per_second": 0.958, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 7.08, |
|
"learning_rate": 2.5953468756589585e-05, |
|
"loss": 1.3936, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 7.08, |
|
"eval_accuracy": 0.094732853353543, |
|
"eval_f1": 0.09155559566994678, |
|
"eval_loss": 3.537994146347046, |
|
"eval_precision": 0.13805010974816684, |
|
"eval_runtime": 222.7345, |
|
"eval_samples_per_second": 11.848, |
|
"eval_steps_per_second": 0.988, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 8.1, |
|
"learning_rate": 2.489913544668588e-05, |
|
"loss": 1.0764, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 8.1, |
|
"eval_accuracy": 0.15839333080712392, |
|
"eval_f1": 0.1838779712805326, |
|
"eval_loss": 3.328141689300537, |
|
"eval_precision": 0.35144388335355753, |
|
"eval_runtime": 231.5928, |
|
"eval_samples_per_second": 11.395, |
|
"eval_steps_per_second": 0.95, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 9.11, |
|
"learning_rate": 2.3844802136782175e-05, |
|
"loss": 0.872, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 9.11, |
|
"eval_accuracy": 0.2754831375521031, |
|
"eval_f1": 0.33153761364278084, |
|
"eval_loss": 2.959165096282959, |
|
"eval_precision": 0.6026709651704474, |
|
"eval_runtime": 229.3101, |
|
"eval_samples_per_second": 11.508, |
|
"eval_steps_per_second": 0.959, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 10.12, |
|
"learning_rate": 2.279046882687847e-05, |
|
"loss": 0.7026, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 10.12, |
|
"eval_accuracy": 0.3971201212580523, |
|
"eval_f1": 0.4587007542105457, |
|
"eval_loss": 2.504917860031128, |
|
"eval_precision": 0.6970861611172207, |
|
"eval_runtime": 229.0193, |
|
"eval_samples_per_second": 11.523, |
|
"eval_steps_per_second": 0.961, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 11.13, |
|
"learning_rate": 2.1736135516974768e-05, |
|
"loss": 0.603, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 11.13, |
|
"eval_accuracy": 0.5479348237968927, |
|
"eval_f1": 0.6128796045577696, |
|
"eval_loss": 2.1484670639038086, |
|
"eval_precision": 0.8073946450067734, |
|
"eval_runtime": 226.9343, |
|
"eval_samples_per_second": 11.629, |
|
"eval_steps_per_second": 0.969, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 12.15, |
|
"learning_rate": 2.0681802207071063e-05, |
|
"loss": 0.5042, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 12.15, |
|
"eval_accuracy": 0.7014020462296324, |
|
"eval_f1": 0.7543542303794953, |
|
"eval_loss": 1.6532080173492432, |
|
"eval_precision": 0.8604295269195706, |
|
"eval_runtime": 229.9455, |
|
"eval_samples_per_second": 11.477, |
|
"eval_steps_per_second": 0.957, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 13.16, |
|
"learning_rate": 1.9627468897167357e-05, |
|
"loss": 0.4542, |
|
"step": 6500 |
|
}, |
|
{ |
|
"epoch": 13.16, |
|
"eval_accuracy": 0.7434634331186055, |
|
"eval_f1": 0.7989946253783239, |
|
"eval_loss": 1.4056562185287476, |
|
"eval_precision": 0.8941430548214513, |
|
"eval_runtime": 223.4311, |
|
"eval_samples_per_second": 11.811, |
|
"eval_steps_per_second": 0.985, |
|
"step": 6500 |
|
}, |
|
{ |
|
"epoch": 14.17, |
|
"learning_rate": 1.8573135587263652e-05, |
|
"loss": 0.388, |
|
"step": 7000 |
|
}, |
|
{ |
|
"epoch": 14.17, |
|
"eval_accuracy": 0.7802197802197802, |
|
"eval_f1": 0.8331608145111185, |
|
"eval_loss": 1.233764410018921, |
|
"eval_precision": 0.92185981522448, |
|
"eval_runtime": 231.0616, |
|
"eval_samples_per_second": 11.421, |
|
"eval_steps_per_second": 0.952, |
|
"step": 7000 |
|
}, |
|
{ |
|
"epoch": 15.18, |
|
"learning_rate": 1.751880227735995e-05, |
|
"loss": 0.3515, |
|
"step": 7500 |
|
}, |
|
{ |
|
"epoch": 15.18, |
|
"eval_accuracy": 0.8169761273209549, |
|
"eval_f1": 0.8681431492951, |
|
"eval_loss": 0.9898241758346558, |
|
"eval_precision": 0.9432737435443141, |
|
"eval_runtime": 229.2806, |
|
"eval_samples_per_second": 11.51, |
|
"eval_steps_per_second": 0.96, |
|
"step": 7500 |
|
}, |
|
{ |
|
"epoch": 16.19, |
|
"learning_rate": 1.6464468967456245e-05, |
|
"loss": 0.3195, |
|
"step": 8000 |
|
}, |
|
{ |
|
"epoch": 16.19, |
|
"eval_accuracy": 0.8067449791587723, |
|
"eval_f1": 0.8635483223798979, |
|
"eval_loss": 1.1404353380203247, |
|
"eval_precision": 0.9523356531691418, |
|
"eval_runtime": 224.231, |
|
"eval_samples_per_second": 11.769, |
|
"eval_steps_per_second": 0.981, |
|
"step": 8000 |
|
}, |
|
{ |
|
"epoch": 17.21, |
|
"learning_rate": 1.541013565755254e-05, |
|
"loss": 0.2882, |
|
"step": 8500 |
|
}, |
|
{ |
|
"epoch": 17.21, |
|
"eval_accuracy": 0.8177339901477833, |
|
"eval_f1": 0.8745687675592978, |
|
"eval_loss": 0.9810923933982849, |
|
"eval_precision": 0.9540040162889087, |
|
"eval_runtime": 230.2032, |
|
"eval_samples_per_second": 11.464, |
|
"eval_steps_per_second": 0.956, |
|
"step": 8500 |
|
}, |
|
{ |
|
"epoch": 18.22, |
|
"learning_rate": 1.4355802347648837e-05, |
|
"loss": 0.2695, |
|
"step": 9000 |
|
}, |
|
{ |
|
"epoch": 18.22, |
|
"eval_accuracy": 0.8317544524441076, |
|
"eval_f1": 0.8877909926292662, |
|
"eval_loss": 0.9483387470245361, |
|
"eval_precision": 0.9615575975196211, |
|
"eval_runtime": 227.4444, |
|
"eval_samples_per_second": 11.603, |
|
"eval_steps_per_second": 0.967, |
|
"step": 9000 |
|
}, |
|
{ |
|
"epoch": 19.23, |
|
"learning_rate": 1.3301469037745133e-05, |
|
"loss": 0.2535, |
|
"step": 9500 |
|
}, |
|
{ |
|
"epoch": 19.23, |
|
"eval_accuracy": 0.8844259189086775, |
|
"eval_f1": 0.9198466869617786, |
|
"eval_loss": 0.6694388389587402, |
|
"eval_precision": 0.9692367120798446, |
|
"eval_runtime": 229.887, |
|
"eval_samples_per_second": 11.48, |
|
"eval_steps_per_second": 0.957, |
|
"step": 9500 |
|
}, |
|
{ |
|
"epoch": 20.24, |
|
"learning_rate": 1.2247135727841428e-05, |
|
"loss": 0.2437, |
|
"step": 10000 |
|
}, |
|
{ |
|
"epoch": 20.24, |
|
"eval_accuracy": 0.870026525198939, |
|
"eval_f1": 0.9124563736238709, |
|
"eval_loss": 0.7545726299285889, |
|
"eval_precision": 0.9655808349316077, |
|
"eval_runtime": 228.7826, |
|
"eval_samples_per_second": 11.535, |
|
"eval_steps_per_second": 0.962, |
|
"step": 10000 |
|
}, |
|
{ |
|
"epoch": 21.25, |
|
"learning_rate": 1.1192802417937724e-05, |
|
"loss": 0.2376, |
|
"step": 10500 |
|
}, |
|
{ |
|
"epoch": 21.25, |
|
"eval_accuracy": 0.88101553618795, |
|
"eval_f1": 0.9202319275311999, |
|
"eval_loss": 0.669846773147583, |
|
"eval_precision": 0.9694585382786844, |
|
"eval_runtime": 225.8023, |
|
"eval_samples_per_second": 11.687, |
|
"eval_steps_per_second": 0.974, |
|
"step": 10500 |
|
}, |
|
{ |
|
"epoch": 22.27, |
|
"learning_rate": 1.013846910803402e-05, |
|
"loss": 0.2214, |
|
"step": 11000 |
|
}, |
|
{ |
|
"epoch": 22.27, |
|
"eval_accuracy": 0.8726790450928382, |
|
"eval_f1": 0.9174460541012326, |
|
"eval_loss": 0.7156072854995728, |
|
"eval_precision": 0.972619503520754, |
|
"eval_runtime": 230.4418, |
|
"eval_samples_per_second": 11.452, |
|
"eval_steps_per_second": 0.955, |
|
"step": 11000 |
|
}, |
|
{ |
|
"epoch": 23.28, |
|
"learning_rate": 9.084135798130316e-06, |
|
"loss": 0.2148, |
|
"step": 11500 |
|
}, |
|
{ |
|
"epoch": 23.28, |
|
"eval_accuracy": 0.8931413414172035, |
|
"eval_f1": 0.9285879507962082, |
|
"eval_loss": 0.5982441902160645, |
|
"eval_precision": 0.9711102757838663, |
|
"eval_runtime": 229.8221, |
|
"eval_samples_per_second": 11.483, |
|
"eval_steps_per_second": 0.957, |
|
"step": 11500 |
|
}, |
|
{ |
|
"epoch": 24.29, |
|
"learning_rate": 8.029802488226612e-06, |
|
"loss": 0.2087, |
|
"step": 12000 |
|
}, |
|
{ |
|
"epoch": 24.29, |
|
"eval_accuracy": 0.8813944676013642, |
|
"eval_f1": 0.9242728727643769, |
|
"eval_loss": 0.7108510732650757, |
|
"eval_precision": 0.975723189780374, |
|
"eval_runtime": 223.4291, |
|
"eval_samples_per_second": 11.811, |
|
"eval_steps_per_second": 0.985, |
|
"step": 12000 |
|
}, |
|
{ |
|
"epoch": 25.3, |
|
"learning_rate": 6.975469178322908e-06, |
|
"loss": 0.2039, |
|
"step": 12500 |
|
}, |
|
{ |
|
"epoch": 25.3, |
|
"eval_accuracy": 0.8897309586964759, |
|
"eval_f1": 0.93059059028571, |
|
"eval_loss": 0.6577169895172119, |
|
"eval_precision": 0.9799317453490524, |
|
"eval_runtime": 229.7405, |
|
"eval_samples_per_second": 11.487, |
|
"eval_steps_per_second": 0.958, |
|
"step": 12500 |
|
}, |
|
{ |
|
"epoch": 26.32, |
|
"learning_rate": 5.9211358684192026e-06, |
|
"loss": 0.1997, |
|
"step": 13000 |
|
}, |
|
{ |
|
"epoch": 26.32, |
|
"eval_accuracy": 0.874573702159909, |
|
"eval_f1": 0.9203192830080359, |
|
"eval_loss": 0.7307356595993042, |
|
"eval_precision": 0.9774472205704657, |
|
"eval_runtime": 226.7422, |
|
"eval_samples_per_second": 11.639, |
|
"eval_steps_per_second": 0.97, |
|
"step": 13000 |
|
}, |
|
{ |
|
"epoch": 27.33, |
|
"learning_rate": 4.866802558515498e-06, |
|
"loss": 0.1896, |
|
"step": 13500 |
|
}, |
|
{ |
|
"epoch": 27.33, |
|
"eval_accuracy": 0.8904888215233043, |
|
"eval_f1": 0.9289821714067877, |
|
"eval_loss": 0.614262044429779, |
|
"eval_precision": 0.9747583516326127, |
|
"eval_runtime": 226.7104, |
|
"eval_samples_per_second": 11.64, |
|
"eval_steps_per_second": 0.97, |
|
"step": 13500 |
|
}, |
|
{ |
|
"epoch": 28.34, |
|
"learning_rate": 3.8124692486117947e-06, |
|
"loss": 0.1869, |
|
"step": 14000 |
|
}, |
|
{ |
|
"epoch": 28.34, |
|
"eval_accuracy": 0.8908677529367185, |
|
"eval_f1": 0.9286976343726923, |
|
"eval_loss": 0.637986958026886, |
|
"eval_precision": 0.9738854766344701, |
|
"eval_runtime": 229.6341, |
|
"eval_samples_per_second": 11.492, |
|
"eval_steps_per_second": 0.958, |
|
"step": 14000 |
|
}, |
|
{ |
|
"epoch": 29.35, |
|
"learning_rate": 2.7581359387080904e-06, |
|
"loss": 0.185, |
|
"step": 14500 |
|
}, |
|
{ |
|
"epoch": 29.35, |
|
"eval_accuracy": 0.8870784388025768, |
|
"eval_f1": 0.9288845844124958, |
|
"eval_loss": 0.6932182908058167, |
|
"eval_precision": 0.979135119670676, |
|
"eval_runtime": 223.3771, |
|
"eval_samples_per_second": 11.814, |
|
"eval_steps_per_second": 0.985, |
|
"step": 14500 |
|
}, |
|
{ |
|
"epoch": 30.36, |
|
"learning_rate": 1.7038026288043862e-06, |
|
"loss": 0.1813, |
|
"step": 15000 |
|
}, |
|
{ |
|
"epoch": 30.36, |
|
"eval_accuracy": 0.8950359984842744, |
|
"eval_f1": 0.9333589015381497, |
|
"eval_loss": 0.5935563445091248, |
|
"eval_precision": 0.9789140060741345, |
|
"eval_runtime": 231.0332, |
|
"eval_samples_per_second": 11.423, |
|
"eval_steps_per_second": 0.952, |
|
"step": 15000 |
|
}, |
|
{ |
|
"epoch": 31.38, |
|
"learning_rate": 6.494693189006819e-07, |
|
"loss": 0.1801, |
|
"step": 15500 |
|
}, |
|
{ |
|
"epoch": 31.38, |
|
"eval_accuracy": 0.8946570670708601, |
|
"eval_f1": 0.9334021717198819, |
|
"eval_loss": 0.6150190234184265, |
|
"eval_precision": 0.9800558320669844, |
|
"eval_runtime": 224.8697, |
|
"eval_samples_per_second": 11.736, |
|
"eval_steps_per_second": 0.978, |
|
"step": 15500 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"step": 15808, |
|
"total_flos": 1.2697230517064026e+20, |
|
"train_loss": 1.0038429288729, |
|
"train_runtime": 86553.4289, |
|
"train_samples_per_second": 8.78, |
|
"train_steps_per_second": 0.183 |
|
} |
|
], |
|
"max_steps": 15808, |
|
"num_train_epochs": 32, |
|
"total_flos": 1.2697230517064026e+20, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|