{ "best_metric": 0.8213908076286316, "best_model_checkpoint": "./wav2vec2-base-960h-paper/checkpoint-3352", "epoch": 49.64200477326969, "global_step": 5200, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.99, "eval_loss": 5.683954238891602, "eval_runtime": 61.9414, "eval_samples_per_second": 13.594, "eval_steps_per_second": 0.856, "eval_wer": 1.0, "step": 104 }, { "epoch": 2.0, "eval_loss": 3.9771974086761475, "eval_runtime": 58.5656, "eval_samples_per_second": 14.377, "eval_steps_per_second": 0.905, "eval_wer": 1.0, "step": 209 }, { "epoch": 3.0, "eval_loss": 3.4203968048095703, "eval_runtime": 58.5182, "eval_samples_per_second": 14.389, "eval_steps_per_second": 0.906, "eval_wer": 1.0, "step": 314 }, { "epoch": 4.0, "eval_loss": 3.3691885471343994, "eval_runtime": 58.4394, "eval_samples_per_second": 14.408, "eval_steps_per_second": 0.907, "eval_wer": 1.0, "step": 419 }, { "epoch": 4.77, "learning_rate": 4.916317991631799e-05, "loss": 5.5612, "step": 500 }, { "epoch": 4.99, "eval_loss": 3.3944718837738037, "eval_runtime": 58.5781, "eval_samples_per_second": 14.374, "eval_steps_per_second": 0.905, "eval_wer": 1.0, "step": 523 }, { "epoch": 6.0, "eval_loss": 3.342637777328491, "eval_runtime": 58.3305, "eval_samples_per_second": 14.435, "eval_steps_per_second": 0.909, "eval_wer": 1.0, "step": 628 }, { "epoch": 7.0, "eval_loss": 3.3333232402801514, "eval_runtime": 58.4524, "eval_samples_per_second": 14.405, "eval_steps_per_second": 0.907, "eval_wer": 1.0, "step": 733 }, { "epoch": 8.0, "eval_loss": 3.329634428024292, "eval_runtime": 58.6528, "eval_samples_per_second": 14.356, "eval_steps_per_second": 0.904, "eval_wer": 1.0000659917906212, "step": 838 }, { "epoch": 8.99, "eval_loss": 3.1853039264678955, "eval_runtime": 58.7103, "eval_samples_per_second": 14.342, "eval_steps_per_second": 0.903, "eval_wer": 0.9999340082093787, "step": 942 }, { "epoch": 9.55, "learning_rate": 4.393305439330544e-05, "loss": 3.2743, "step": 1000 }, { "epoch": 10.0, "eval_loss": 2.1381497383117676, "eval_runtime": 58.7525, "eval_samples_per_second": 14.331, "eval_steps_per_second": 0.902, "eval_wer": 1.0245489461111037, "step": 1047 }, { "epoch": 11.0, "eval_loss": 1.6965396404266357, "eval_runtime": 58.7454, "eval_samples_per_second": 14.333, "eval_steps_per_second": 0.902, "eval_wer": 1.0141750366254438, "step": 1152 }, { "epoch": 12.0, "eval_loss": 1.4229621887207031, "eval_runtime": 58.8247, "eval_samples_per_second": 14.314, "eval_steps_per_second": 0.901, "eval_wer": 1.0011350587986854, "step": 1257 }, { "epoch": 12.99, "eval_loss": 1.2678765058517456, "eval_runtime": 58.7761, "eval_samples_per_second": 14.326, "eval_steps_per_second": 0.902, "eval_wer": 0.9873295762007206, "step": 1361 }, { "epoch": 14.0, "eval_loss": 1.1569700241088867, "eval_runtime": 58.6837, "eval_samples_per_second": 14.348, "eval_steps_per_second": 0.903, "eval_wer": 0.9835944408515581, "step": 1466 }, { "epoch": 14.32, "learning_rate": 3.870292887029289e-05, "loss": 1.5432, "step": 1500 }, { "epoch": 15.0, "eval_loss": 1.0858139991760254, "eval_runtime": 58.71, "eval_samples_per_second": 14.342, "eval_steps_per_second": 0.903, "eval_wer": 0.9784206844668524, "step": 1571 }, { "epoch": 16.0, "eval_loss": 1.0303007364273071, "eval_runtime": 58.7899, "eval_samples_per_second": 14.322, "eval_steps_per_second": 0.902, "eval_wer": 0.9768632782081909, "step": 1676 }, { "epoch": 16.99, "eval_loss": 0.985497236251831, "eval_runtime": 58.9329, "eval_samples_per_second": 14.287, "eval_steps_per_second": 0.899, "eval_wer": 0.97459316061082, "step": 1780 }, { "epoch": 18.0, "eval_loss": 0.9558756947517395, "eval_runtime": 58.7163, "eval_samples_per_second": 14.34, "eval_steps_per_second": 0.903, "eval_wer": 0.9709240170522787, "step": 1885 }, { "epoch": 19.0, "eval_loss": 0.93276047706604, "eval_runtime": 58.6741, "eval_samples_per_second": 14.35, "eval_steps_per_second": 0.903, "eval_wer": 0.9727981839059221, "step": 1990 }, { "epoch": 19.09, "learning_rate": 3.3472803347280334e-05, "loss": 0.902, "step": 2000 }, { "epoch": 20.0, "eval_loss": 0.916550874710083, "eval_runtime": 58.8598, "eval_samples_per_second": 14.305, "eval_steps_per_second": 0.9, "eval_wer": 0.9738144574814893, "step": 2095 }, { "epoch": 20.99, "eval_loss": 0.8990672826766968, "eval_runtime": 58.8033, "eval_samples_per_second": 14.319, "eval_steps_per_second": 0.901, "eval_wer": 0.9697625615373447, "step": 2199 }, { "epoch": 22.0, "eval_loss": 0.8716745376586914, "eval_runtime": 58.795, "eval_samples_per_second": 14.321, "eval_steps_per_second": 0.901, "eval_wer": 0.9680731716974409, "step": 2304 }, { "epoch": 23.0, "eval_loss": 0.8665304780006409, "eval_runtime": 58.9314, "eval_samples_per_second": 14.288, "eval_steps_per_second": 0.899, "eval_wer": 0.9669249145406311, "step": 2409 }, { "epoch": 23.87, "learning_rate": 2.824267782426778e-05, "loss": 0.7003, "step": 2500 }, { "epoch": 24.0, "eval_loss": 0.8588829636573792, "eval_runtime": 58.6586, "eval_samples_per_second": 14.354, "eval_steps_per_second": 0.904, "eval_wer": 0.9670173030475009, "step": 2514 }, { "epoch": 24.99, "eval_loss": 0.8419524431228638, "eval_runtime": 58.7876, "eval_samples_per_second": 14.323, "eval_steps_per_second": 0.902, "eval_wer": 0.9659086409650639, "step": 2618 }, { "epoch": 26.0, "eval_loss": 0.8473154306411743, "eval_runtime": 59.0243, "eval_samples_per_second": 14.265, "eval_steps_per_second": 0.898, "eval_wer": 0.9660538229044306, "step": 2723 }, { "epoch": 27.0, "eval_loss": 0.8542926907539368, "eval_runtime": 58.7124, "eval_samples_per_second": 14.341, "eval_steps_per_second": 0.903, "eval_wer": 0.9666345506618976, "step": 2828 }, { "epoch": 28.0, "eval_loss": 0.8315206170082092, "eval_runtime": 58.7261, "eval_samples_per_second": 14.338, "eval_steps_per_second": 0.902, "eval_wer": 0.9622922908390196, "step": 2933 }, { "epoch": 28.64, "learning_rate": 2.301255230125523e-05, "loss": 0.5914, "step": 3000 }, { "epoch": 28.99, "eval_loss": 0.8280870914459229, "eval_runtime": 58.9202, "eval_samples_per_second": 14.291, "eval_steps_per_second": 0.9, "eval_wer": 0.9625694563596289, "step": 3037 }, { "epoch": 30.0, "eval_loss": 0.8315181732177734, "eval_runtime": 58.6719, "eval_samples_per_second": 14.351, "eval_steps_per_second": 0.903, "eval_wer": 0.9625430596433804, "step": 3142 }, { "epoch": 31.0, "eval_loss": 0.826146125793457, "eval_runtime": 58.8509, "eval_samples_per_second": 14.307, "eval_steps_per_second": 0.901, "eval_wer": 0.9619623318859134, "step": 3247 }, { "epoch": 32.0, "eval_loss": 0.8213908076286316, "eval_runtime": 58.6666, "eval_samples_per_second": 14.352, "eval_steps_per_second": 0.903, "eval_wer": 0.9639684823207993, "step": 3352 }, { "epoch": 32.99, "eval_loss": 0.8309536576271057, "eval_runtime": 58.499, "eval_samples_per_second": 14.393, "eval_steps_per_second": 0.906, "eval_wer": 0.9633745562052081, "step": 3456 }, { "epoch": 33.41, "learning_rate": 1.7782426778242676e-05, "loss": 0.5157, "step": 3500 }, { "epoch": 34.0, "eval_loss": 0.8252176642417908, "eval_runtime": 58.5446, "eval_samples_per_second": 14.382, "eval_steps_per_second": 0.905, "eval_wer": 0.9634669447120778, "step": 3561 }, { "epoch": 35.0, "eval_loss": 0.8372853398323059, "eval_runtime": 58.5403, "eval_samples_per_second": 14.383, "eval_steps_per_second": 0.905, "eval_wer": 0.9638101020233083, "step": 3666 }, { "epoch": 36.0, "eval_loss": 0.8421617746353149, "eval_runtime": 58.6533, "eval_samples_per_second": 14.356, "eval_steps_per_second": 0.904, "eval_wer": 0.9629258120289836, "step": 3771 }, { "epoch": 36.99, "eval_loss": 0.8294224143028259, "eval_runtime": 58.6527, "eval_samples_per_second": 14.356, "eval_steps_per_second": 0.904, "eval_wer": 0.9631897791914685, "step": 3875 }, { "epoch": 38.0, "eval_loss": 0.8332000374794006, "eval_runtime": 58.5856, "eval_samples_per_second": 14.372, "eval_steps_per_second": 0.905, "eval_wer": 0.9576332704211596, "step": 3980 }, { "epoch": 38.19, "learning_rate": 1.2552301255230125e-05, "loss": 0.4655, "step": 4000 }, { "epoch": 39.0, "eval_loss": 0.8329895734786987, "eval_runtime": 58.7603, "eval_samples_per_second": 14.329, "eval_steps_per_second": 0.902, "eval_wer": 0.959507437274803, "step": 4085 }, { "epoch": 40.0, "eval_loss": 0.8296785950660706, "eval_runtime": 58.6153, "eval_samples_per_second": 14.365, "eval_steps_per_second": 0.904, "eval_wer": 0.9625034645690076, "step": 4190 }, { "epoch": 40.99, "eval_loss": 0.8365075588226318, "eval_runtime": 58.6008, "eval_samples_per_second": 14.368, "eval_steps_per_second": 0.904, "eval_wer": 0.9620547203927832, "step": 4294 }, { "epoch": 42.0, "eval_loss": 0.8360996842384338, "eval_runtime": 58.6605, "eval_samples_per_second": 14.354, "eval_steps_per_second": 0.904, "eval_wer": 0.9621339105415286, "step": 4399 }, { "epoch": 42.96, "learning_rate": 7.3221757322175736e-06, "loss": 0.4266, "step": 4500 }, { "epoch": 43.0, "eval_loss": 0.8416324853897095, "eval_runtime": 58.5672, "eval_samples_per_second": 14.377, "eval_steps_per_second": 0.905, "eval_wer": 0.9625034645690076, "step": 4504 }, { "epoch": 44.0, "eval_loss": 0.8381497859954834, "eval_runtime": 58.6851, "eval_samples_per_second": 14.348, "eval_steps_per_second": 0.903, "eval_wer": 0.9633745562052081, "step": 4609 }, { "epoch": 44.99, "eval_loss": 0.8447730541229248, "eval_runtime": 58.6902, "eval_samples_per_second": 14.347, "eval_steps_per_second": 0.903, "eval_wer": 0.9644964166457692, "step": 4713 }, { "epoch": 46.0, "eval_loss": 0.8447101712226868, "eval_runtime": 58.8118, "eval_samples_per_second": 14.317, "eval_steps_per_second": 0.901, "eval_wer": 0.9624902662108834, "step": 4818 }, { "epoch": 47.0, "eval_loss": 0.8463994264602661, "eval_runtime": 58.6459, "eval_samples_per_second": 14.357, "eval_steps_per_second": 0.904, "eval_wer": 0.9641268626182903, "step": 4923 }, { "epoch": 47.73, "learning_rate": 2.092050209205021e-06, "loss": 0.4019, "step": 5000 }, { "epoch": 48.0, "eval_loss": 0.8449317216873169, "eval_runtime": 58.893, "eval_samples_per_second": 14.297, "eval_steps_per_second": 0.9, "eval_wer": 0.9627542333733684, "step": 5028 }, { "epoch": 48.99, "eval_loss": 0.8487057089805603, "eval_runtime": 58.7287, "eval_samples_per_second": 14.337, "eval_steps_per_second": 0.902, "eval_wer": 0.9625562580015046, "step": 5132 }, { "epoch": 49.64, "eval_loss": 0.846527636051178, "eval_runtime": 58.7826, "eval_samples_per_second": 14.324, "eval_steps_per_second": 0.902, "eval_wer": 0.9629126136708593, "step": 5200 }, { "epoch": 49.64, "step": 5200, "total_flos": 4.180377449644987e+19, "train_loss": 1.3979950288625864, "train_runtime": 89308.2068, "train_samples_per_second": 1.876, "train_steps_per_second": 0.058 } ], "max_steps": 5200, "num_train_epochs": 50, "total_flos": 4.180377449644987e+19, "trial_name": null, "trial_params": null }