diff --git "a/trainer_state.json" "b/trainer_state.json" new file mode 100644--- /dev/null +++ "b/trainer_state.json" @@ -0,0 +1,7100 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 14.059452701764133, + "global_step": 50600, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.03, + "learning_rate": 0.0001, + "loss": 7.817, + "step": 100 + }, + { + "epoch": 0.03, + "eval_loss": 3.791971206665039, + "eval_runtime": 17.0609, + "eval_samples_per_second": 5.803, + "eval_wer": 1.0, + "step": 100 + }, + { + "epoch": 0.06, + "learning_rate": 9.999444259197512e-05, + "loss": 3.0102, + "step": 200 + }, + { + "epoch": 0.06, + "eval_loss": 3.3802108764648438, + "eval_runtime": 17.1385, + "eval_samples_per_second": 5.776, + "eval_wer": 1.0, + "step": 200 + }, + { + "epoch": 0.08, + "learning_rate": 9.99888851839502e-05, + "loss": 2.929, + "step": 300 + }, + { + "epoch": 0.08, + "eval_loss": 3.4951775074005127, + "eval_runtime": 17.7008, + "eval_samples_per_second": 5.593, + "eval_wer": 1.0, + "step": 300 + }, + { + "epoch": 0.11, + "learning_rate": 9.998332777592532e-05, + "loss": 2.918, + "step": 400 + }, + { + "epoch": 0.11, + "eval_loss": 3.2080225944519043, + "eval_runtime": 17.3326, + "eval_samples_per_second": 5.712, + "eval_wer": 1.0, + "step": 400 + }, + { + "epoch": 0.14, + "learning_rate": 9.997777036790042e-05, + "loss": 2.8855, + "step": 500 + }, + { + "epoch": 0.14, + "eval_loss": 3.1997480392456055, + "eval_runtime": 17.2803, + "eval_samples_per_second": 5.729, + "eval_wer": 1.0, + "step": 500 + }, + { + "epoch": 0.17, + "learning_rate": 9.997221295987552e-05, + "loss": 2.8791, + "step": 600 + }, + { + "epoch": 0.17, + "eval_loss": 3.0948541164398193, + "eval_runtime": 17.1794, + "eval_samples_per_second": 5.763, + "eval_wer": 1.0, + "step": 600 + }, + { + "epoch": 0.19, + "learning_rate": 9.996665555185062e-05, + "loss": 2.8751, + "step": 700 + }, + { + "epoch": 0.19, + "eval_loss": 3.1061549186706543, + "eval_runtime": 17.4783, + "eval_samples_per_second": 5.664, + "eval_wer": 1.0, + "step": 700 + }, + { + "epoch": 0.22, + "learning_rate": 9.996109814382572e-05, + "loss": 2.8643, + "step": 800 + }, + { + "epoch": 0.22, + "eval_loss": 3.0063648223876953, + "eval_runtime": 17.252, + "eval_samples_per_second": 5.738, + "eval_wer": 1.0, + "step": 800 + }, + { + "epoch": 0.25, + "learning_rate": 9.995554073580082e-05, + "loss": 2.8587, + "step": 900 + }, + { + "epoch": 0.25, + "eval_loss": 2.9906227588653564, + "eval_runtime": 17.2628, + "eval_samples_per_second": 5.735, + "eval_wer": 1.0, + "step": 900 + }, + { + "epoch": 0.28, + "learning_rate": 9.994998332777594e-05, + "loss": 2.7566, + "step": 1000 + }, + { + "epoch": 0.28, + "eval_loss": 2.6209235191345215, + "eval_runtime": 17.3238, + "eval_samples_per_second": 5.715, + "eval_wer": 1.0, + "step": 1000 + }, + { + "epoch": 0.31, + "learning_rate": 9.994442591975102e-05, + "loss": 2.1468, + "step": 1100 + }, + { + "epoch": 0.31, + "eval_loss": 1.8421308994293213, + "eval_runtime": 17.1871, + "eval_samples_per_second": 5.76, + "eval_wer": 0.9896907216494846, + "step": 1100 + }, + { + "epoch": 0.33, + "learning_rate": 9.993886851172614e-05, + "loss": 1.4695, + "step": 1200 + }, + { + "epoch": 0.33, + "eval_loss": 1.4311132431030273, + "eval_runtime": 17.4523, + "eval_samples_per_second": 5.673, + "eval_wer": 0.875, + "step": 1200 + }, + { + "epoch": 0.36, + "learning_rate": 9.993331110370124e-05, + "loss": 1.1334, + "step": 1300 + }, + { + "epoch": 0.36, + "eval_loss": 1.2780916690826416, + "eval_runtime": 17.1785, + "eval_samples_per_second": 5.763, + "eval_wer": 0.854381443298969, + "step": 1300 + }, + { + "epoch": 0.39, + "learning_rate": 9.992775369567634e-05, + "loss": 0.9951, + "step": 1400 + }, + { + "epoch": 0.39, + "eval_loss": 1.0466135740280151, + "eval_runtime": 16.9445, + "eval_samples_per_second": 5.843, + "eval_wer": 0.7306701030927835, + "step": 1400 + }, + { + "epoch": 0.42, + "learning_rate": 9.992219628765145e-05, + "loss": 0.9161, + "step": 1500 + }, + { + "epoch": 0.42, + "eval_loss": 1.0910567045211792, + "eval_runtime": 17.1529, + "eval_samples_per_second": 5.772, + "eval_wer": 0.7345360824742269, + "step": 1500 + }, + { + "epoch": 0.44, + "learning_rate": 9.991663887962654e-05, + "loss": 0.8162, + "step": 1600 + }, + { + "epoch": 0.44, + "eval_loss": 0.9578825831413269, + "eval_runtime": 17.0661, + "eval_samples_per_second": 5.801, + "eval_wer": 0.6842783505154639, + "step": 1600 + }, + { + "epoch": 0.47, + "learning_rate": 9.991108147160165e-05, + "loss": 0.7552, + "step": 1700 + }, + { + "epoch": 0.47, + "eval_loss": 0.9620718955993652, + "eval_runtime": 17.1705, + "eval_samples_per_second": 5.766, + "eval_wer": 0.6288659793814433, + "step": 1700 + }, + { + "epoch": 0.5, + "learning_rate": 9.990552406357675e-05, + "loss": 0.752, + "step": 1800 + }, + { + "epoch": 0.5, + "eval_loss": 0.9395142197608948, + "eval_runtime": 17.1773, + "eval_samples_per_second": 5.763, + "eval_wer": 0.6172680412371134, + "step": 1800 + }, + { + "epoch": 0.53, + "learning_rate": 9.989996665555186e-05, + "loss": 0.6846, + "step": 1900 + }, + { + "epoch": 0.53, + "eval_loss": 1.0008608102798462, + "eval_runtime": 17.3332, + "eval_samples_per_second": 5.712, + "eval_wer": 0.5786082474226805, + "step": 1900 + }, + { + "epoch": 0.56, + "learning_rate": 9.989440924752696e-05, + "loss": 0.6402, + "step": 2000 + }, + { + "epoch": 0.56, + "eval_loss": 0.8784067034721375, + "eval_runtime": 17.1604, + "eval_samples_per_second": 5.769, + "eval_wer": 0.5489690721649485, + "step": 2000 + }, + { + "epoch": 0.58, + "learning_rate": 9.988885183950206e-05, + "loss": 0.6582, + "step": 2100 + }, + { + "epoch": 0.58, + "eval_loss": 0.9032992720603943, + "eval_runtime": 17.1447, + "eval_samples_per_second": 5.774, + "eval_wer": 0.5631443298969072, + "step": 2100 + }, + { + "epoch": 0.61, + "learning_rate": 9.988329443147716e-05, + "loss": 0.5984, + "step": 2200 + }, + { + "epoch": 0.61, + "eval_loss": 0.8451138138771057, + "eval_runtime": 17.25, + "eval_samples_per_second": 5.739, + "eval_wer": 0.5283505154639175, + "step": 2200 + }, + { + "epoch": 0.64, + "learning_rate": 9.987773702345227e-05, + "loss": 0.6265, + "step": 2300 + }, + { + "epoch": 0.64, + "eval_loss": 0.7656041383743286, + "eval_runtime": 17.2036, + "eval_samples_per_second": 5.755, + "eval_wer": 0.5373711340206185, + "step": 2300 + }, + { + "epoch": 0.67, + "learning_rate": 9.987217961542737e-05, + "loss": 0.5903, + "step": 2400 + }, + { + "epoch": 0.67, + "eval_loss": 0.8390687108039856, + "eval_runtime": 17.1101, + "eval_samples_per_second": 5.786, + "eval_wer": 0.5167525773195877, + "step": 2400 + }, + { + "epoch": 0.69, + "learning_rate": 9.986662220740247e-05, + "loss": 0.5788, + "step": 2500 + }, + { + "epoch": 0.69, + "eval_loss": 0.8256884217262268, + "eval_runtime": 17.1636, + "eval_samples_per_second": 5.768, + "eval_wer": 0.5064432989690721, + "step": 2500 + }, + { + "epoch": 0.72, + "learning_rate": 9.986106479937759e-05, + "loss": 0.583, + "step": 2600 + }, + { + "epoch": 0.72, + "eval_loss": 0.7550874352455139, + "eval_runtime": 17.1812, + "eval_samples_per_second": 5.762, + "eval_wer": 0.5335051546391752, + "step": 2600 + }, + { + "epoch": 0.75, + "learning_rate": 9.985550739135267e-05, + "loss": 0.5805, + "step": 2700 + }, + { + "epoch": 0.75, + "eval_loss": 0.8099715709686279, + "eval_runtime": 17.1988, + "eval_samples_per_second": 5.756, + "eval_wer": 0.5193298969072165, + "step": 2700 + }, + { + "epoch": 0.78, + "learning_rate": 9.984994998332779e-05, + "loss": 0.5465, + "step": 2800 + }, + { + "epoch": 0.78, + "eval_loss": 0.7341137528419495, + "eval_runtime": 17.1767, + "eval_samples_per_second": 5.764, + "eval_wer": 0.4884020618556701, + "step": 2800 + }, + { + "epoch": 0.81, + "learning_rate": 9.984439257530287e-05, + "loss": 0.556, + "step": 2900 + }, + { + "epoch": 0.81, + "eval_loss": 0.845912516117096, + "eval_runtime": 17.2763, + "eval_samples_per_second": 5.73, + "eval_wer": 0.5025773195876289, + "step": 2900 + }, + { + "epoch": 0.83, + "learning_rate": 9.983883516727799e-05, + "loss": 0.5141, + "step": 3000 + }, + { + "epoch": 0.83, + "eval_loss": 0.822607696056366, + "eval_runtime": 17.5294, + "eval_samples_per_second": 5.648, + "eval_wer": 0.5038659793814433, + "step": 3000 + }, + { + "epoch": 0.86, + "learning_rate": 9.983327775925309e-05, + "loss": 0.5257, + "step": 3100 + }, + { + "epoch": 0.86, + "eval_loss": 0.8175485134124756, + "eval_runtime": 17.1702, + "eval_samples_per_second": 5.766, + "eval_wer": 0.4948453608247423, + "step": 3100 + }, + { + "epoch": 0.89, + "learning_rate": 9.982772035122819e-05, + "loss": 0.501, + "step": 3200 + }, + { + "epoch": 0.89, + "eval_loss": 0.7639488577842712, + "eval_runtime": 17.3806, + "eval_samples_per_second": 5.696, + "eval_wer": 0.4806701030927835, + "step": 3200 + }, + { + "epoch": 0.92, + "learning_rate": 9.982216294320329e-05, + "loss": 0.5081, + "step": 3300 + }, + { + "epoch": 0.92, + "eval_loss": 0.7297512888908386, + "eval_runtime": 17.1321, + "eval_samples_per_second": 5.779, + "eval_wer": 0.48711340206185566, + "step": 3300 + }, + { + "epoch": 0.94, + "learning_rate": 9.98166055351784e-05, + "loss": 0.4741, + "step": 3400 + }, + { + "epoch": 0.94, + "eval_loss": 0.9208475947380066, + "eval_runtime": 17.2201, + "eval_samples_per_second": 5.749, + "eval_wer": 0.49355670103092786, + "step": 3400 + }, + { + "epoch": 0.97, + "learning_rate": 9.98110481271535e-05, + "loss": 0.4848, + "step": 3500 + }, + { + "epoch": 0.97, + "eval_loss": 0.8245986104011536, + "eval_runtime": 17.1126, + "eval_samples_per_second": 5.785, + "eval_wer": 0.48582474226804123, + "step": 3500 + }, + { + "epoch": 1.0, + "learning_rate": 9.98054907191286e-05, + "loss": 0.4794, + "step": 3600 + }, + { + "epoch": 1.0, + "eval_loss": 0.7197224497795105, + "eval_runtime": 17.3562, + "eval_samples_per_second": 5.704, + "eval_wer": 0.4677835051546392, + "step": 3600 + }, + { + "epoch": 1.03, + "learning_rate": 9.97999333111037e-05, + "loss": 0.4189, + "step": 3700 + }, + { + "epoch": 1.03, + "eval_loss": 0.7290377616882324, + "eval_runtime": 17.1757, + "eval_samples_per_second": 5.764, + "eval_wer": 0.48195876288659795, + "step": 3700 + }, + { + "epoch": 1.06, + "learning_rate": 9.97943759030788e-05, + "loss": 0.4133, + "step": 3800 + }, + { + "epoch": 1.06, + "eval_loss": 0.8328794240951538, + "eval_runtime": 17.375, + "eval_samples_per_second": 5.698, + "eval_wer": 0.47164948453608246, + "step": 3800 + }, + { + "epoch": 1.08, + "learning_rate": 9.978881849505392e-05, + "loss": 0.43, + "step": 3900 + }, + { + "epoch": 1.08, + "eval_loss": 0.7619199156761169, + "eval_runtime": 17.4527, + "eval_samples_per_second": 5.672, + "eval_wer": 0.46649484536082475, + "step": 3900 + }, + { + "epoch": 1.11, + "learning_rate": 9.978326108702901e-05, + "loss": 0.4274, + "step": 4000 + }, + { + "epoch": 1.11, + "eval_loss": 0.8476623892784119, + "eval_runtime": 17.2396, + "eval_samples_per_second": 5.743, + "eval_wer": 0.5103092783505154, + "step": 4000 + }, + { + "epoch": 1.14, + "learning_rate": 9.977770367900412e-05, + "loss": 0.4586, + "step": 4100 + }, + { + "epoch": 1.14, + "eval_loss": 0.8450866937637329, + "eval_runtime": 17.5121, + "eval_samples_per_second": 5.653, + "eval_wer": 0.48711340206185566, + "step": 4100 + }, + { + "epoch": 1.17, + "learning_rate": 9.977214627097922e-05, + "loss": 0.3902, + "step": 4200 + }, + { + "epoch": 1.17, + "eval_loss": 1.0022594928741455, + "eval_runtime": 17.3099, + "eval_samples_per_second": 5.719, + "eval_wer": 0.520618556701031, + "step": 4200 + }, + { + "epoch": 1.19, + "learning_rate": 9.976658886295432e-05, + "loss": 0.3995, + "step": 4300 + }, + { + "epoch": 1.19, + "eval_loss": 0.825476884841919, + "eval_runtime": 17.3054, + "eval_samples_per_second": 5.721, + "eval_wer": 0.5038659793814433, + "step": 4300 + }, + { + "epoch": 1.22, + "learning_rate": 9.976103145492942e-05, + "loss": 0.3952, + "step": 4400 + }, + { + "epoch": 1.22, + "eval_loss": 0.7960893511772156, + "eval_runtime": 17.2244, + "eval_samples_per_second": 5.748, + "eval_wer": 0.48711340206185566, + "step": 4400 + }, + { + "epoch": 1.25, + "learning_rate": 9.975547404690452e-05, + "loss": 0.4177, + "step": 4500 + }, + { + "epoch": 1.25, + "eval_loss": 0.7501189112663269, + "eval_runtime": 17.0905, + "eval_samples_per_second": 5.793, + "eval_wer": 0.47164948453608246, + "step": 4500 + }, + { + "epoch": 1.28, + "learning_rate": 9.974991663887962e-05, + "loss": 0.4054, + "step": 4600 + }, + { + "epoch": 1.28, + "eval_loss": 0.7024160027503967, + "eval_runtime": 17.2738, + "eval_samples_per_second": 5.731, + "eval_wer": 0.4884020618556701, + "step": 4600 + }, + { + "epoch": 1.31, + "learning_rate": 9.974435923085474e-05, + "loss": 0.4029, + "step": 4700 + }, + { + "epoch": 1.31, + "eval_loss": 0.7287462949752808, + "eval_runtime": 17.6417, + "eval_samples_per_second": 5.612, + "eval_wer": 0.45103092783505155, + "step": 4700 + }, + { + "epoch": 1.33, + "learning_rate": 9.973880182282984e-05, + "loss": 0.3967, + "step": 4800 + }, + { + "epoch": 1.33, + "eval_loss": 0.7488074898719788, + "eval_runtime": 17.3755, + "eval_samples_per_second": 5.698, + "eval_wer": 0.49097938144329895, + "step": 4800 + }, + { + "epoch": 1.36, + "learning_rate": 9.973324441480494e-05, + "loss": 0.4053, + "step": 4900 + }, + { + "epoch": 1.36, + "eval_loss": 0.7065747976303101, + "eval_runtime": 17.3999, + "eval_samples_per_second": 5.69, + "eval_wer": 0.4652061855670103, + "step": 4900 + }, + { + "epoch": 1.39, + "learning_rate": 9.972768700678004e-05, + "loss": 0.4165, + "step": 5000 + }, + { + "epoch": 1.39, + "eval_loss": 0.7919918894767761, + "eval_runtime": 17.0704, + "eval_samples_per_second": 5.799, + "eval_wer": 0.46649484536082475, + "step": 5000 + }, + { + "epoch": 1.42, + "learning_rate": 9.972212959875514e-05, + "loss": 0.4001, + "step": 5100 + }, + { + "epoch": 1.42, + "eval_loss": 0.758572518825531, + "eval_runtime": 17.1616, + "eval_samples_per_second": 5.769, + "eval_wer": 0.47036082474226804, + "step": 5100 + }, + { + "epoch": 1.44, + "learning_rate": 9.971657219073025e-05, + "loss": 0.3736, + "step": 5200 + }, + { + "epoch": 1.44, + "eval_loss": 0.8151732683181763, + "eval_runtime": 17.3692, + "eval_samples_per_second": 5.7, + "eval_wer": 0.5025773195876289, + "step": 5200 + }, + { + "epoch": 1.47, + "learning_rate": 9.971101478270534e-05, + "loss": 0.3694, + "step": 5300 + }, + { + "epoch": 1.47, + "eval_loss": 0.823724627494812, + "eval_runtime": 17.36, + "eval_samples_per_second": 5.703, + "eval_wer": 0.5025773195876289, + "step": 5300 + }, + { + "epoch": 1.5, + "learning_rate": 9.970545737468046e-05, + "loss": 0.3748, + "step": 5400 + }, + { + "epoch": 1.5, + "eval_loss": 0.7445100545883179, + "eval_runtime": 17.4369, + "eval_samples_per_second": 5.678, + "eval_wer": 0.44458762886597936, + "step": 5400 + }, + { + "epoch": 1.53, + "learning_rate": 9.969989996665556e-05, + "loss": 0.3645, + "step": 5500 + }, + { + "epoch": 1.53, + "eval_loss": 0.7235777378082275, + "eval_runtime": 17.1581, + "eval_samples_per_second": 5.77, + "eval_wer": 0.47680412371134023, + "step": 5500 + }, + { + "epoch": 1.56, + "learning_rate": 9.969434255863066e-05, + "loss": 0.3905, + "step": 5600 + }, + { + "epoch": 1.56, + "eval_loss": 0.739282488822937, + "eval_runtime": 17.2125, + "eval_samples_per_second": 5.752, + "eval_wer": 0.4793814432989691, + "step": 5600 + }, + { + "epoch": 1.58, + "learning_rate": 9.968878515060576e-05, + "loss": 0.3723, + "step": 5700 + }, + { + "epoch": 1.58, + "eval_loss": 0.762248158454895, + "eval_runtime": 17.4572, + "eval_samples_per_second": 5.671, + "eval_wer": 0.4652061855670103, + "step": 5700 + }, + { + "epoch": 1.61, + "learning_rate": 9.968322774258087e-05, + "loss": 0.3611, + "step": 5800 + }, + { + "epoch": 1.61, + "eval_loss": 0.7599887251853943, + "eval_runtime": 17.487, + "eval_samples_per_second": 5.661, + "eval_wer": 0.46649484536082475, + "step": 5800 + }, + { + "epoch": 1.64, + "learning_rate": 9.967767033455597e-05, + "loss": 0.3747, + "step": 5900 + }, + { + "epoch": 1.64, + "eval_loss": 0.7197273373603821, + "eval_runtime": 17.4419, + "eval_samples_per_second": 5.676, + "eval_wer": 0.47680412371134023, + "step": 5900 + }, + { + "epoch": 1.67, + "learning_rate": 9.967211292653107e-05, + "loss": 0.3736, + "step": 6000 + }, + { + "epoch": 1.67, + "eval_loss": 0.7508798241615295, + "eval_runtime": 17.1575, + "eval_samples_per_second": 5.77, + "eval_wer": 0.47036082474226804, + "step": 6000 + }, + { + "epoch": 1.69, + "learning_rate": 9.966655551850617e-05, + "loss": 0.3828, + "step": 6100 + }, + { + "epoch": 1.69, + "eval_loss": 0.7594204545021057, + "eval_runtime": 17.2159, + "eval_samples_per_second": 5.75, + "eval_wer": 0.4652061855670103, + "step": 6100 + }, + { + "epoch": 1.72, + "learning_rate": 9.966099811048127e-05, + "loss": 0.3717, + "step": 6200 + }, + { + "epoch": 1.72, + "eval_loss": 0.6831815838813782, + "eval_runtime": 17.2288, + "eval_samples_per_second": 5.746, + "eval_wer": 0.4639175257731959, + "step": 6200 + }, + { + "epoch": 1.75, + "learning_rate": 9.965544070245639e-05, + "loss": 0.3605, + "step": 6300 + }, + { + "epoch": 1.75, + "eval_loss": 0.8021068572998047, + "eval_runtime": 17.2637, + "eval_samples_per_second": 5.735, + "eval_wer": 0.46262886597938147, + "step": 6300 + }, + { + "epoch": 1.78, + "learning_rate": 9.964988329443147e-05, + "loss": 0.3868, + "step": 6400 + }, + { + "epoch": 1.78, + "eval_loss": 0.7559285759925842, + "eval_runtime": 17.2295, + "eval_samples_per_second": 5.746, + "eval_wer": 0.46262886597938147, + "step": 6400 + }, + { + "epoch": 1.81, + "learning_rate": 9.964432588640659e-05, + "loss": 0.3762, + "step": 6500 + }, + { + "epoch": 1.81, + "eval_loss": 0.6938344240188599, + "eval_runtime": 17.2273, + "eval_samples_per_second": 5.747, + "eval_wer": 0.44587628865979384, + "step": 6500 + }, + { + "epoch": 1.83, + "learning_rate": 9.963876847838169e-05, + "loss": 0.3335, + "step": 6600 + }, + { + "epoch": 1.83, + "eval_loss": 0.7515353560447693, + "eval_runtime": 17.2748, + "eval_samples_per_second": 5.731, + "eval_wer": 0.4652061855670103, + "step": 6600 + }, + { + "epoch": 1.86, + "learning_rate": 9.963321107035679e-05, + "loss": 0.3761, + "step": 6700 + }, + { + "epoch": 1.86, + "eval_loss": 0.6331177353858948, + "eval_runtime": 17.2836, + "eval_samples_per_second": 5.728, + "eval_wer": 0.43556701030927836, + "step": 6700 + }, + { + "epoch": 1.89, + "learning_rate": 9.962765366233189e-05, + "loss": 0.3597, + "step": 6800 + }, + { + "epoch": 1.89, + "eval_loss": 0.7062612771987915, + "eval_runtime": 17.0606, + "eval_samples_per_second": 5.803, + "eval_wer": 0.46262886597938147, + "step": 6800 + }, + { + "epoch": 1.92, + "learning_rate": 9.962209625430699e-05, + "loss": 0.3489, + "step": 6900 + }, + { + "epoch": 1.92, + "eval_loss": 0.7171001434326172, + "eval_runtime": 17.3915, + "eval_samples_per_second": 5.692, + "eval_wer": 0.4587628865979381, + "step": 6900 + }, + { + "epoch": 1.94, + "learning_rate": 9.96165388462821e-05, + "loss": 0.3492, + "step": 7000 + }, + { + "epoch": 1.94, + "eval_loss": 0.8369248509407043, + "eval_runtime": 17.2963, + "eval_samples_per_second": 5.724, + "eval_wer": 0.4845360824742268, + "step": 7000 + }, + { + "epoch": 1.97, + "learning_rate": 9.96109814382572e-05, + "loss": 0.3581, + "step": 7100 + }, + { + "epoch": 1.97, + "eval_loss": 0.7614104747772217, + "eval_runtime": 17.1514, + "eval_samples_per_second": 5.772, + "eval_wer": 0.4484536082474227, + "step": 7100 + }, + { + "epoch": 2.0, + "learning_rate": 9.96054240302323e-05, + "loss": 0.3617, + "step": 7200 + }, + { + "epoch": 2.0, + "eval_loss": 0.7410733699798584, + "eval_runtime": 16.8873, + "eval_samples_per_second": 5.862, + "eval_wer": 0.45103092783505155, + "step": 7200 + }, + { + "epoch": 2.03, + "learning_rate": 9.95998666222074e-05, + "loss": 0.3044, + "step": 7300 + }, + { + "epoch": 2.03, + "eval_loss": 0.8537248373031616, + "eval_runtime": 16.8753, + "eval_samples_per_second": 5.867, + "eval_wer": 0.4793814432989691, + "step": 7300 + }, + { + "epoch": 2.06, + "learning_rate": 9.959430921418251e-05, + "loss": 0.2982, + "step": 7400 + }, + { + "epoch": 2.06, + "eval_loss": 0.7687365412712097, + "eval_runtime": 17.2864, + "eval_samples_per_second": 5.727, + "eval_wer": 0.48582474226804123, + "step": 7400 + }, + { + "epoch": 2.08, + "learning_rate": 9.958875180615761e-05, + "loss": 0.3035, + "step": 7500 + }, + { + "epoch": 2.08, + "eval_loss": 0.8554800152778625, + "eval_runtime": 17.1923, + "eval_samples_per_second": 5.758, + "eval_wer": 0.4536082474226804, + "step": 7500 + }, + { + "epoch": 2.11, + "learning_rate": 9.958319439813272e-05, + "loss": 0.3032, + "step": 7600 + }, + { + "epoch": 2.11, + "eval_loss": 0.8073357343673706, + "eval_runtime": 17.2402, + "eval_samples_per_second": 5.742, + "eval_wer": 0.47551546391752575, + "step": 7600 + }, + { + "epoch": 2.14, + "learning_rate": 9.957763699010781e-05, + "loss": 0.3336, + "step": 7700 + }, + { + "epoch": 2.14, + "eval_loss": 0.8232630491256714, + "eval_runtime": 17.1702, + "eval_samples_per_second": 5.766, + "eval_wer": 0.4574742268041237, + "step": 7700 + }, + { + "epoch": 2.17, + "learning_rate": 9.957207958208292e-05, + "loss": 0.3062, + "step": 7800 + }, + { + "epoch": 2.17, + "eval_loss": 0.73056960105896, + "eval_runtime": 17.1533, + "eval_samples_per_second": 5.771, + "eval_wer": 0.45489690721649484, + "step": 7800 + }, + { + "epoch": 2.2, + "learning_rate": 9.956652217405802e-05, + "loss": 0.3278, + "step": 7900 + }, + { + "epoch": 2.2, + "eval_loss": 0.7208071351051331, + "eval_runtime": 17.2805, + "eval_samples_per_second": 5.729, + "eval_wer": 0.4742268041237113, + "step": 7900 + }, + { + "epoch": 2.22, + "learning_rate": 9.956096476603312e-05, + "loss": 0.3116, + "step": 8000 + }, + { + "epoch": 2.22, + "eval_loss": 0.7529891133308411, + "eval_runtime": 17.1791, + "eval_samples_per_second": 5.763, + "eval_wer": 0.4574742268041237, + "step": 8000 + }, + { + "epoch": 2.25, + "learning_rate": 9.955540735800824e-05, + "loss": 0.2909, + "step": 8100 + }, + { + "epoch": 2.25, + "eval_loss": 0.7208893299102783, + "eval_runtime": 17.1849, + "eval_samples_per_second": 5.761, + "eval_wer": 0.4536082474226804, + "step": 8100 + }, + { + "epoch": 2.28, + "learning_rate": 9.954984994998332e-05, + "loss": 0.2998, + "step": 8200 + }, + { + "epoch": 2.28, + "eval_loss": 0.7474488615989685, + "eval_runtime": 17.1962, + "eval_samples_per_second": 5.757, + "eval_wer": 0.44072164948453607, + "step": 8200 + }, + { + "epoch": 2.31, + "learning_rate": 9.954429254195844e-05, + "loss": 0.3007, + "step": 8300 + }, + { + "epoch": 2.31, + "eval_loss": 0.8237383365631104, + "eval_runtime": 17.1897, + "eval_samples_per_second": 5.759, + "eval_wer": 0.47164948453608246, + "step": 8300 + }, + { + "epoch": 2.33, + "learning_rate": 9.953873513393354e-05, + "loss": 0.3047, + "step": 8400 + }, + { + "epoch": 2.33, + "eval_loss": 0.7258074879646301, + "eval_runtime": 17.2814, + "eval_samples_per_second": 5.729, + "eval_wer": 0.46005154639175255, + "step": 8400 + }, + { + "epoch": 2.36, + "learning_rate": 9.953317772590864e-05, + "loss": 0.3224, + "step": 8500 + }, + { + "epoch": 2.36, + "eval_loss": 0.9189648032188416, + "eval_runtime": 17.2837, + "eval_samples_per_second": 5.728, + "eval_wer": 0.4652061855670103, + "step": 8500 + }, + { + "epoch": 2.39, + "learning_rate": 9.952762031788374e-05, + "loss": 0.3126, + "step": 8600 + }, + { + "epoch": 2.39, + "eval_loss": 0.7851585745811462, + "eval_runtime": 17.2252, + "eval_samples_per_second": 5.747, + "eval_wer": 0.4574742268041237, + "step": 8600 + }, + { + "epoch": 2.42, + "learning_rate": 9.952206290985885e-05, + "loss": 0.2806, + "step": 8700 + }, + { + "epoch": 2.42, + "eval_loss": 0.9620941877365112, + "eval_runtime": 17.2564, + "eval_samples_per_second": 5.737, + "eval_wer": 0.46649484536082475, + "step": 8700 + }, + { + "epoch": 2.45, + "learning_rate": 9.951650550183394e-05, + "loss": 0.3057, + "step": 8800 + }, + { + "epoch": 2.45, + "eval_loss": 0.6678251624107361, + "eval_runtime": 17.2795, + "eval_samples_per_second": 5.729, + "eval_wer": 0.422680412371134, + "step": 8800 + }, + { + "epoch": 2.47, + "learning_rate": 9.951094809380906e-05, + "loss": 0.3066, + "step": 8900 + }, + { + "epoch": 2.47, + "eval_loss": 0.7364962100982666, + "eval_runtime": 17.3954, + "eval_samples_per_second": 5.691, + "eval_wer": 0.43427835051546393, + "step": 8900 + }, + { + "epoch": 2.5, + "learning_rate": 9.950539068578416e-05, + "loss": 0.2891, + "step": 9000 + }, + { + "epoch": 2.5, + "eval_loss": 0.7602680921554565, + "eval_runtime": 17.2544, + "eval_samples_per_second": 5.738, + "eval_wer": 0.4574742268041237, + "step": 9000 + }, + { + "epoch": 2.53, + "learning_rate": 9.949983327775926e-05, + "loss": 0.2857, + "step": 9100 + }, + { + "epoch": 2.53, + "eval_loss": 0.7446552515029907, + "eval_runtime": 17.5308, + "eval_samples_per_second": 5.647, + "eval_wer": 0.4497422680412371, + "step": 9100 + }, + { + "epoch": 2.56, + "learning_rate": 9.949427586973437e-05, + "loss": 0.333, + "step": 9200 + }, + { + "epoch": 2.56, + "eval_loss": 0.7369379997253418, + "eval_runtime": 17.5237, + "eval_samples_per_second": 5.649, + "eval_wer": 0.4484536082474227, + "step": 9200 + }, + { + "epoch": 2.58, + "learning_rate": 9.948871846170946e-05, + "loss": 0.3125, + "step": 9300 + }, + { + "epoch": 2.58, + "eval_loss": 0.7238438725471497, + "eval_runtime": 17.2568, + "eval_samples_per_second": 5.737, + "eval_wer": 0.452319587628866, + "step": 9300 + }, + { + "epoch": 2.61, + "learning_rate": 9.948316105368457e-05, + "loss": 0.3182, + "step": 9400 + }, + { + "epoch": 2.61, + "eval_loss": 0.7532787919044495, + "eval_runtime": 17.267, + "eval_samples_per_second": 5.733, + "eval_wer": 0.4536082474226804, + "step": 9400 + }, + { + "epoch": 2.64, + "learning_rate": 9.947760364565967e-05, + "loss": 0.2925, + "step": 9500 + }, + { + "epoch": 2.64, + "eval_loss": 0.7420103549957275, + "eval_runtime": 17.2284, + "eval_samples_per_second": 5.746, + "eval_wer": 0.45489690721649484, + "step": 9500 + }, + { + "epoch": 2.67, + "learning_rate": 9.947204623763477e-05, + "loss": 0.3078, + "step": 9600 + }, + { + "epoch": 2.67, + "eval_loss": 0.7169169187545776, + "eval_runtime": 17.501, + "eval_samples_per_second": 5.657, + "eval_wer": 0.4536082474226804, + "step": 9600 + }, + { + "epoch": 2.7, + "learning_rate": 9.946648882960987e-05, + "loss": 0.2922, + "step": 9700 + }, + { + "epoch": 2.7, + "eval_loss": 0.8229072093963623, + "eval_runtime": 17.3292, + "eval_samples_per_second": 5.713, + "eval_wer": 0.4832474226804124, + "step": 9700 + }, + { + "epoch": 2.72, + "learning_rate": 9.946093142158497e-05, + "loss": 0.2934, + "step": 9800 + }, + { + "epoch": 2.72, + "eval_loss": 0.6904311776161194, + "eval_runtime": 17.3862, + "eval_samples_per_second": 5.694, + "eval_wer": 0.4536082474226804, + "step": 9800 + }, + { + "epoch": 2.75, + "learning_rate": 9.945537401356007e-05, + "loss": 0.2655, + "step": 9900 + }, + { + "epoch": 2.75, + "eval_loss": 0.7936742901802063, + "eval_runtime": 17.2939, + "eval_samples_per_second": 5.725, + "eval_wer": 0.46134020618556704, + "step": 9900 + }, + { + "epoch": 2.78, + "learning_rate": 9.944981660553519e-05, + "loss": 0.2764, + "step": 10000 + }, + { + "epoch": 2.78, + "eval_loss": 0.7943949103355408, + "eval_runtime": 17.0681, + "eval_samples_per_second": 5.8, + "eval_wer": 0.45103092783505155, + "step": 10000 + }, + { + "epoch": 2.81, + "learning_rate": 9.944425919751028e-05, + "loss": 0.2991, + "step": 10100 + }, + { + "epoch": 2.81, + "eval_loss": 0.7811460494995117, + "eval_runtime": 17.292, + "eval_samples_per_second": 5.725, + "eval_wer": 0.46005154639175255, + "step": 10100 + }, + { + "epoch": 2.83, + "learning_rate": 9.943870178948539e-05, + "loss": 0.2866, + "step": 10200 + }, + { + "epoch": 2.83, + "eval_loss": 0.7307493686676025, + "eval_runtime": 17.5153, + "eval_samples_per_second": 5.652, + "eval_wer": 0.47164948453608246, + "step": 10200 + }, + { + "epoch": 2.86, + "learning_rate": 9.943314438146049e-05, + "loss": 0.2973, + "step": 10300 + }, + { + "epoch": 2.86, + "eval_loss": 0.7479050755500793, + "eval_runtime": 17.4352, + "eval_samples_per_second": 5.678, + "eval_wer": 0.4420103092783505, + "step": 10300 + }, + { + "epoch": 2.89, + "learning_rate": 9.942758697343559e-05, + "loss": 0.3063, + "step": 10400 + }, + { + "epoch": 2.89, + "eval_loss": 0.6997365951538086, + "eval_runtime": 17.2367, + "eval_samples_per_second": 5.744, + "eval_wer": 0.44072164948453607, + "step": 10400 + }, + { + "epoch": 2.92, + "learning_rate": 9.94220295654107e-05, + "loss": 0.2738, + "step": 10500 + }, + { + "epoch": 2.92, + "eval_loss": 0.6006211042404175, + "eval_runtime": 17.0511, + "eval_samples_per_second": 5.806, + "eval_wer": 0.43170103092783507, + "step": 10500 + }, + { + "epoch": 2.95, + "learning_rate": 9.941647215738579e-05, + "loss": 0.282, + "step": 10600 + }, + { + "epoch": 2.95, + "eval_loss": 0.7482351660728455, + "eval_runtime": 17.5673, + "eval_samples_per_second": 5.635, + "eval_wer": 0.47164948453608246, + "step": 10600 + }, + { + "epoch": 2.97, + "learning_rate": 9.94109147493609e-05, + "loss": 0.2666, + "step": 10700 + }, + { + "epoch": 2.97, + "eval_loss": 0.7779076099395752, + "eval_runtime": 17.5922, + "eval_samples_per_second": 5.628, + "eval_wer": 0.45489690721649484, + "step": 10700 + }, + { + "epoch": 3.0, + "learning_rate": 9.9405357341336e-05, + "loss": 0.28, + "step": 10800 + }, + { + "epoch": 3.0, + "eval_loss": 0.7526705265045166, + "eval_runtime": 17.6203, + "eval_samples_per_second": 5.619, + "eval_wer": 0.44587628865979384, + "step": 10800 + }, + { + "epoch": 3.03, + "learning_rate": 9.939979993331111e-05, + "loss": 0.2516, + "step": 10900 + }, + { + "epoch": 3.03, + "eval_loss": 0.7915493249893188, + "eval_runtime": 17.3797, + "eval_samples_per_second": 5.696, + "eval_wer": 0.45489690721649484, + "step": 10900 + }, + { + "epoch": 3.06, + "learning_rate": 9.939424252528621e-05, + "loss": 0.2777, + "step": 11000 + }, + { + "epoch": 3.06, + "eval_loss": 0.7125186920166016, + "eval_runtime": 17.4703, + "eval_samples_per_second": 5.667, + "eval_wer": 0.44458762886597936, + "step": 11000 + }, + { + "epoch": 3.08, + "learning_rate": 9.938868511726132e-05, + "loss": 0.2502, + "step": 11100 + }, + { + "epoch": 3.08, + "eval_loss": 0.7668015360832214, + "eval_runtime": 17.4017, + "eval_samples_per_second": 5.689, + "eval_wer": 0.4265463917525773, + "step": 11100 + }, + { + "epoch": 3.11, + "learning_rate": 9.938312770923641e-05, + "loss": 0.2432, + "step": 11200 + }, + { + "epoch": 3.11, + "eval_loss": 0.8193698525428772, + "eval_runtime": 17.3292, + "eval_samples_per_second": 5.713, + "eval_wer": 0.47164948453608246, + "step": 11200 + }, + { + "epoch": 3.14, + "learning_rate": 9.937757030121152e-05, + "loss": 0.2593, + "step": 11300 + }, + { + "epoch": 3.14, + "eval_loss": 0.831807017326355, + "eval_runtime": 17.591, + "eval_samples_per_second": 5.628, + "eval_wer": 0.44329896907216493, + "step": 11300 + }, + { + "epoch": 3.17, + "learning_rate": 9.937201289318662e-05, + "loss": 0.2706, + "step": 11400 + }, + { + "epoch": 3.17, + "eval_loss": 0.7298266291618347, + "eval_runtime": 17.4027, + "eval_samples_per_second": 5.689, + "eval_wer": 0.4420103092783505, + "step": 11400 + }, + { + "epoch": 3.2, + "learning_rate": 9.936645548516172e-05, + "loss": 0.2561, + "step": 11500 + }, + { + "epoch": 3.2, + "eval_loss": 0.695881724357605, + "eval_runtime": 17.3517, + "eval_samples_per_second": 5.705, + "eval_wer": 0.45618556701030927, + "step": 11500 + }, + { + "epoch": 3.22, + "learning_rate": 9.936089807713684e-05, + "loss": 0.2648, + "step": 11600 + }, + { + "epoch": 3.22, + "eval_loss": 0.7764458656311035, + "eval_runtime": 17.4577, + "eval_samples_per_second": 5.671, + "eval_wer": 0.46134020618556704, + "step": 11600 + }, + { + "epoch": 3.25, + "learning_rate": 9.935534066911193e-05, + "loss": 0.2547, + "step": 11700 + }, + { + "epoch": 3.25, + "eval_loss": 0.6394737958908081, + "eval_runtime": 17.2603, + "eval_samples_per_second": 5.736, + "eval_wer": 0.45489690721649484, + "step": 11700 + }, + { + "epoch": 3.28, + "learning_rate": 9.934978326108704e-05, + "loss": 0.2746, + "step": 11800 + }, + { + "epoch": 3.28, + "eval_loss": 0.7559604048728943, + "eval_runtime": 17.4736, + "eval_samples_per_second": 5.666, + "eval_wer": 0.4484536082474227, + "step": 11800 + }, + { + "epoch": 3.31, + "learning_rate": 9.934422585306214e-05, + "loss": 0.2406, + "step": 11900 + }, + { + "epoch": 3.31, + "eval_loss": 0.7239082455635071, + "eval_runtime": 17.7291, + "eval_samples_per_second": 5.584, + "eval_wer": 0.43170103092783507, + "step": 11900 + }, + { + "epoch": 3.33, + "learning_rate": 9.933866844503724e-05, + "loss": 0.2394, + "step": 12000 + }, + { + "epoch": 3.33, + "eval_loss": 0.7092143297195435, + "eval_runtime": 17.5081, + "eval_samples_per_second": 5.655, + "eval_wer": 0.4420103092783505, + "step": 12000 + }, + { + "epoch": 3.36, + "learning_rate": 9.933311103701234e-05, + "loss": 0.2696, + "step": 12100 + }, + { + "epoch": 3.36, + "eval_loss": 0.7482930421829224, + "eval_runtime": 17.1766, + "eval_samples_per_second": 5.764, + "eval_wer": 0.4381443298969072, + "step": 12100 + }, + { + "epoch": 3.39, + "learning_rate": 9.932755362898744e-05, + "loss": 0.2737, + "step": 12200 + }, + { + "epoch": 3.39, + "eval_loss": 0.7534049153327942, + "eval_runtime": 17.5047, + "eval_samples_per_second": 5.656, + "eval_wer": 0.45103092783505155, + "step": 12200 + }, + { + "epoch": 3.42, + "learning_rate": 9.932199622096254e-05, + "loss": 0.2796, + "step": 12300 + }, + { + "epoch": 3.42, + "eval_loss": 0.7405951619148254, + "eval_runtime": 17.3851, + "eval_samples_per_second": 5.695, + "eval_wer": 0.4536082474226804, + "step": 12300 + }, + { + "epoch": 3.45, + "learning_rate": 9.931643881293766e-05, + "loss": 0.2442, + "step": 12400 + }, + { + "epoch": 3.45, + "eval_loss": 0.7737710475921631, + "eval_runtime": 17.4053, + "eval_samples_per_second": 5.688, + "eval_wer": 0.45618556701030927, + "step": 12400 + }, + { + "epoch": 3.47, + "learning_rate": 9.931088140491276e-05, + "loss": 0.2286, + "step": 12500 + }, + { + "epoch": 3.47, + "eval_loss": 0.7984783053398132, + "eval_runtime": 17.2754, + "eval_samples_per_second": 5.731, + "eval_wer": 0.46005154639175255, + "step": 12500 + }, + { + "epoch": 3.5, + "learning_rate": 9.930532399688786e-05, + "loss": 0.2778, + "step": 12600 + }, + { + "epoch": 3.5, + "eval_loss": 0.73711758852005, + "eval_runtime": 17.2963, + "eval_samples_per_second": 5.724, + "eval_wer": 0.44072164948453607, + "step": 12600 + }, + { + "epoch": 3.53, + "learning_rate": 9.929976658886296e-05, + "loss": 0.2456, + "step": 12700 + }, + { + "epoch": 3.53, + "eval_loss": 0.7433577179908752, + "eval_runtime": 17.1925, + "eval_samples_per_second": 5.758, + "eval_wer": 0.4368556701030928, + "step": 12700 + }, + { + "epoch": 3.56, + "learning_rate": 9.929420918083806e-05, + "loss": 0.252, + "step": 12800 + }, + { + "epoch": 3.56, + "eval_loss": 0.6638050079345703, + "eval_runtime": 17.2159, + "eval_samples_per_second": 5.75, + "eval_wer": 0.4329896907216495, + "step": 12800 + }, + { + "epoch": 3.58, + "learning_rate": 9.928865177281317e-05, + "loss": 0.2733, + "step": 12900 + }, + { + "epoch": 3.58, + "eval_loss": 0.6307669878005981, + "eval_runtime": 17.3572, + "eval_samples_per_second": 5.704, + "eval_wer": 0.44587628865979384, + "step": 12900 + }, + { + "epoch": 3.61, + "learning_rate": 9.928309436478826e-05, + "loss": 0.255, + "step": 13000 + }, + { + "epoch": 3.61, + "eval_loss": 0.6689628958702087, + "eval_runtime": 17.5354, + "eval_samples_per_second": 5.646, + "eval_wer": 0.4420103092783505, + "step": 13000 + }, + { + "epoch": 3.64, + "learning_rate": 9.927753695676337e-05, + "loss": 0.2663, + "step": 13100 + }, + { + "epoch": 3.64, + "eval_loss": 0.6840199828147888, + "eval_runtime": 17.5476, + "eval_samples_per_second": 5.642, + "eval_wer": 0.4536082474226804, + "step": 13100 + }, + { + "epoch": 3.67, + "learning_rate": 9.927197954873847e-05, + "loss": 0.2666, + "step": 13200 + }, + { + "epoch": 3.67, + "eval_loss": 0.6798214912414551, + "eval_runtime": 17.5852, + "eval_samples_per_second": 5.63, + "eval_wer": 0.4368556701030928, + "step": 13200 + }, + { + "epoch": 3.7, + "learning_rate": 9.926642214071357e-05, + "loss": 0.2515, + "step": 13300 + }, + { + "epoch": 3.7, + "eval_loss": 0.7858713269233704, + "eval_runtime": 17.2073, + "eval_samples_per_second": 5.753, + "eval_wer": 0.4536082474226804, + "step": 13300 + }, + { + "epoch": 3.72, + "learning_rate": 9.926086473268867e-05, + "loss": 0.2474, + "step": 13400 + }, + { + "epoch": 3.72, + "eval_loss": 0.6592583060264587, + "eval_runtime": 17.613, + "eval_samples_per_second": 5.621, + "eval_wer": 0.45489690721649484, + "step": 13400 + }, + { + "epoch": 3.75, + "learning_rate": 9.925530732466378e-05, + "loss": 0.2619, + "step": 13500 + }, + { + "epoch": 3.75, + "eval_loss": 0.7771138548851013, + "eval_runtime": 17.4838, + "eval_samples_per_second": 5.662, + "eval_wer": 0.4484536082474227, + "step": 13500 + }, + { + "epoch": 3.78, + "learning_rate": 9.924974991663888e-05, + "loss": 0.2541, + "step": 13600 + }, + { + "epoch": 3.78, + "eval_loss": 0.6582715511322021, + "eval_runtime": 17.4038, + "eval_samples_per_second": 5.688, + "eval_wer": 0.42783505154639173, + "step": 13600 + }, + { + "epoch": 3.81, + "learning_rate": 9.924419250861399e-05, + "loss": 0.2335, + "step": 13700 + }, + { + "epoch": 3.81, + "eval_loss": 0.7495954036712646, + "eval_runtime": 17.2322, + "eval_samples_per_second": 5.745, + "eval_wer": 0.4381443298969072, + "step": 13700 + }, + { + "epoch": 3.83, + "learning_rate": 9.923863510058909e-05, + "loss": 0.2546, + "step": 13800 + }, + { + "epoch": 3.83, + "eval_loss": 0.7367487549781799, + "eval_runtime": 17.4399, + "eval_samples_per_second": 5.677, + "eval_wer": 0.45103092783505155, + "step": 13800 + }, + { + "epoch": 3.86, + "learning_rate": 9.923307769256419e-05, + "loss": 0.2369, + "step": 13900 + }, + { + "epoch": 3.86, + "eval_loss": 0.7236208915710449, + "eval_runtime": 17.2973, + "eval_samples_per_second": 5.723, + "eval_wer": 0.43943298969072164, + "step": 13900 + }, + { + "epoch": 3.89, + "learning_rate": 9.92275202845393e-05, + "loss": 0.2518, + "step": 14000 + }, + { + "epoch": 3.89, + "eval_loss": 0.6668509840965271, + "eval_runtime": 17.3127, + "eval_samples_per_second": 5.718, + "eval_wer": 0.44072164948453607, + "step": 14000 + }, + { + "epoch": 3.92, + "learning_rate": 9.922196287651439e-05, + "loss": 0.2336, + "step": 14100 + }, + { + "epoch": 3.92, + "eval_loss": 0.6360946297645569, + "eval_runtime": 17.457, + "eval_samples_per_second": 5.671, + "eval_wer": 0.43170103092783507, + "step": 14100 + }, + { + "epoch": 3.95, + "learning_rate": 9.92164054684895e-05, + "loss": 0.2519, + "step": 14200 + }, + { + "epoch": 3.95, + "eval_loss": 0.7355924844741821, + "eval_runtime": 17.2736, + "eval_samples_per_second": 5.731, + "eval_wer": 0.4381443298969072, + "step": 14200 + }, + { + "epoch": 3.97, + "learning_rate": 9.921084806046461e-05, + "loss": 0.2505, + "step": 14300 + }, + { + "epoch": 3.97, + "eval_loss": 0.6415805816650391, + "eval_runtime": 17.406, + "eval_samples_per_second": 5.688, + "eval_wer": 0.44458762886597936, + "step": 14300 + }, + { + "epoch": 4.0, + "learning_rate": 9.920529065243971e-05, + "loss": 0.2671, + "step": 14400 + }, + { + "epoch": 4.0, + "eval_loss": 0.764227032661438, + "eval_runtime": 17.2386, + "eval_samples_per_second": 5.743, + "eval_wer": 0.43556701030927836, + "step": 14400 + }, + { + "epoch": 4.03, + "learning_rate": 9.919973324441481e-05, + "loss": 0.202, + "step": 14500 + }, + { + "epoch": 4.03, + "eval_loss": 0.7409430742263794, + "eval_runtime": 17.3261, + "eval_samples_per_second": 5.714, + "eval_wer": 0.4484536082474227, + "step": 14500 + }, + { + "epoch": 4.06, + "learning_rate": 9.919417583638991e-05, + "loss": 0.2304, + "step": 14600 + }, + { + "epoch": 4.06, + "eval_loss": 0.7179251909255981, + "eval_runtime": 17.3235, + "eval_samples_per_second": 5.715, + "eval_wer": 0.43943298969072164, + "step": 14600 + }, + { + "epoch": 4.08, + "learning_rate": 9.918861842836501e-05, + "loss": 0.2391, + "step": 14700 + }, + { + "epoch": 4.08, + "eval_loss": 0.6860632300376892, + "eval_runtime": 17.2579, + "eval_samples_per_second": 5.737, + "eval_wer": 0.43556701030927836, + "step": 14700 + }, + { + "epoch": 4.11, + "learning_rate": 9.918306102034012e-05, + "loss": 0.2302, + "step": 14800 + }, + { + "epoch": 4.11, + "eval_loss": 0.7088943719863892, + "eval_runtime": 17.4142, + "eval_samples_per_second": 5.685, + "eval_wer": 0.44072164948453607, + "step": 14800 + }, + { + "epoch": 4.14, + "learning_rate": 9.917750361231522e-05, + "loss": 0.2395, + "step": 14900 + }, + { + "epoch": 4.14, + "eval_loss": 0.8547905683517456, + "eval_runtime": 17.2308, + "eval_samples_per_second": 5.746, + "eval_wer": 0.44587628865979384, + "step": 14900 + }, + { + "epoch": 4.17, + "learning_rate": 9.917194620429032e-05, + "loss": 0.2108, + "step": 15000 + }, + { + "epoch": 4.17, + "eval_loss": 0.7243941426277161, + "eval_runtime": 17.2836, + "eval_samples_per_second": 5.728, + "eval_wer": 0.42783505154639173, + "step": 15000 + }, + { + "epoch": 4.2, + "learning_rate": 9.916638879626542e-05, + "loss": 0.2479, + "step": 15100 + }, + { + "epoch": 4.2, + "eval_loss": 0.721064567565918, + "eval_runtime": 17.3846, + "eval_samples_per_second": 5.695, + "eval_wer": 0.43170103092783507, + "step": 15100 + }, + { + "epoch": 4.22, + "learning_rate": 9.916083138824053e-05, + "loss": 0.228, + "step": 15200 + }, + { + "epoch": 4.22, + "eval_loss": 0.6933774352073669, + "eval_runtime": 17.4588, + "eval_samples_per_second": 5.671, + "eval_wer": 0.44587628865979384, + "step": 15200 + }, + { + "epoch": 4.25, + "learning_rate": 9.915527398021564e-05, + "loss": 0.2089, + "step": 15300 + }, + { + "epoch": 4.25, + "eval_loss": 0.6892577409744263, + "eval_runtime": 17.334, + "eval_samples_per_second": 5.711, + "eval_wer": 0.43427835051546393, + "step": 15300 + }, + { + "epoch": 4.28, + "learning_rate": 9.914971657219073e-05, + "loss": 0.2647, + "step": 15400 + }, + { + "epoch": 4.28, + "eval_loss": 0.7205445170402527, + "eval_runtime": 17.3769, + "eval_samples_per_second": 5.697, + "eval_wer": 0.43943298969072164, + "step": 15400 + }, + { + "epoch": 4.31, + "learning_rate": 9.914415916416584e-05, + "loss": 0.2111, + "step": 15500 + }, + { + "epoch": 4.31, + "eval_loss": 0.7887137532234192, + "eval_runtime": 17.5118, + "eval_samples_per_second": 5.653, + "eval_wer": 0.4484536082474227, + "step": 15500 + }, + { + "epoch": 4.33, + "learning_rate": 9.913860175614094e-05, + "loss": 0.2395, + "step": 15600 + }, + { + "epoch": 4.33, + "eval_loss": 0.7880820631980896, + "eval_runtime": 17.4336, + "eval_samples_per_second": 5.679, + "eval_wer": 0.4574742268041237, + "step": 15600 + }, + { + "epoch": 4.36, + "learning_rate": 9.913304434811604e-05, + "loss": 0.2283, + "step": 15700 + }, + { + "epoch": 4.36, + "eval_loss": 0.7957388162612915, + "eval_runtime": 17.4422, + "eval_samples_per_second": 5.676, + "eval_wer": 0.45618556701030927, + "step": 15700 + }, + { + "epoch": 4.39, + "learning_rate": 9.912748694009114e-05, + "loss": 0.2315, + "step": 15800 + }, + { + "epoch": 4.39, + "eval_loss": 0.7855367064476013, + "eval_runtime": 17.8336, + "eval_samples_per_second": 5.551, + "eval_wer": 0.44716494845360827, + "step": 15800 + }, + { + "epoch": 4.42, + "learning_rate": 9.912192953206624e-05, + "loss": 0.2161, + "step": 15900 + }, + { + "epoch": 4.42, + "eval_loss": 0.8106959462165833, + "eval_runtime": 17.4952, + "eval_samples_per_second": 5.659, + "eval_wer": 0.4420103092783505, + "step": 15900 + }, + { + "epoch": 4.45, + "learning_rate": 9.911637212404136e-05, + "loss": 0.21, + "step": 16000 + }, + { + "epoch": 4.45, + "eval_loss": 0.7481738924980164, + "eval_runtime": 17.3874, + "eval_samples_per_second": 5.694, + "eval_wer": 0.42396907216494845, + "step": 16000 + }, + { + "epoch": 4.47, + "learning_rate": 9.911081471601646e-05, + "loss": 0.2208, + "step": 16100 + }, + { + "epoch": 4.47, + "eval_loss": 0.8416795134544373, + "eval_runtime": 17.3637, + "eval_samples_per_second": 5.702, + "eval_wer": 0.44458762886597936, + "step": 16100 + }, + { + "epoch": 4.5, + "learning_rate": 9.910525730799156e-05, + "loss": 0.2339, + "step": 16200 + }, + { + "epoch": 4.5, + "eval_loss": 0.7456889152526855, + "eval_runtime": 17.6094, + "eval_samples_per_second": 5.622, + "eval_wer": 0.4574742268041237, + "step": 16200 + }, + { + "epoch": 4.53, + "learning_rate": 9.909969989996666e-05, + "loss": 0.2184, + "step": 16300 + }, + { + "epoch": 4.53, + "eval_loss": 0.7151892185211182, + "eval_runtime": 17.6465, + "eval_samples_per_second": 5.61, + "eval_wer": 0.42783505154639173, + "step": 16300 + }, + { + "epoch": 4.56, + "learning_rate": 9.909414249194177e-05, + "loss": 0.2538, + "step": 16400 + }, + { + "epoch": 4.56, + "eval_loss": 0.6038363575935364, + "eval_runtime": 17.6191, + "eval_samples_per_second": 5.619, + "eval_wer": 0.43556701030927836, + "step": 16400 + }, + { + "epoch": 4.58, + "learning_rate": 9.908858508391686e-05, + "loss": 0.2241, + "step": 16500 + }, + { + "epoch": 4.58, + "eval_loss": 0.7377514243125916, + "eval_runtime": 17.3266, + "eval_samples_per_second": 5.714, + "eval_wer": 0.43943298969072164, + "step": 16500 + }, + { + "epoch": 4.61, + "learning_rate": 9.908302767589197e-05, + "loss": 0.2301, + "step": 16600 + }, + { + "epoch": 4.61, + "eval_loss": 0.72115558385849, + "eval_runtime": 17.2905, + "eval_samples_per_second": 5.726, + "eval_wer": 0.44587628865979384, + "step": 16600 + }, + { + "epoch": 4.64, + "learning_rate": 9.907747026786707e-05, + "loss": 0.2154, + "step": 16700 + }, + { + "epoch": 4.64, + "eval_loss": 0.6517682075500488, + "eval_runtime": 17.2953, + "eval_samples_per_second": 5.724, + "eval_wer": 0.44716494845360827, + "step": 16700 + }, + { + "epoch": 4.67, + "learning_rate": 9.907191285984217e-05, + "loss": 0.2293, + "step": 16800 + }, + { + "epoch": 4.67, + "eval_loss": 0.7426177263259888, + "eval_runtime": 17.4692, + "eval_samples_per_second": 5.667, + "eval_wer": 0.44458762886597936, + "step": 16800 + }, + { + "epoch": 4.7, + "learning_rate": 9.906635545181728e-05, + "loss": 0.2189, + "step": 16900 + }, + { + "epoch": 4.7, + "eval_loss": 0.7251791954040527, + "eval_runtime": 17.5699, + "eval_samples_per_second": 5.635, + "eval_wer": 0.44072164948453607, + "step": 16900 + }, + { + "epoch": 4.72, + "learning_rate": 9.906079804379238e-05, + "loss": 0.2137, + "step": 17000 + }, + { + "epoch": 4.72, + "eval_loss": 0.810121476650238, + "eval_runtime": 17.5304, + "eval_samples_per_second": 5.647, + "eval_wer": 0.45103092783505155, + "step": 17000 + }, + { + "epoch": 4.75, + "learning_rate": 9.905524063576749e-05, + "loss": 0.2294, + "step": 17100 + }, + { + "epoch": 4.75, + "eval_loss": 0.7991353273391724, + "eval_runtime": 17.5411, + "eval_samples_per_second": 5.644, + "eval_wer": 0.422680412371134, + "step": 17100 + }, + { + "epoch": 4.78, + "learning_rate": 9.904968322774259e-05, + "loss": 0.1986, + "step": 17200 + }, + { + "epoch": 4.78, + "eval_loss": 0.7718966603279114, + "eval_runtime": 17.3818, + "eval_samples_per_second": 5.696, + "eval_wer": 0.4381443298969072, + "step": 17200 + }, + { + "epoch": 4.81, + "learning_rate": 9.904412581971769e-05, + "loss": 0.2058, + "step": 17300 + }, + { + "epoch": 4.81, + "eval_loss": 0.7458451986312866, + "eval_runtime": 17.525, + "eval_samples_per_second": 5.649, + "eval_wer": 0.43427835051546393, + "step": 17300 + }, + { + "epoch": 4.83, + "learning_rate": 9.903856841169279e-05, + "loss": 0.2611, + "step": 17400 + }, + { + "epoch": 4.83, + "eval_loss": 0.694915235042572, + "eval_runtime": 17.7415, + "eval_samples_per_second": 5.58, + "eval_wer": 0.422680412371134, + "step": 17400 + }, + { + "epoch": 4.86, + "learning_rate": 9.903301100366789e-05, + "loss": 0.2072, + "step": 17500 + }, + { + "epoch": 4.86, + "eval_loss": 0.7110035419464111, + "eval_runtime": 17.4436, + "eval_samples_per_second": 5.675, + "eval_wer": 0.43170103092783507, + "step": 17500 + }, + { + "epoch": 4.89, + "learning_rate": 9.902745359564299e-05, + "loss": 0.2245, + "step": 17600 + }, + { + "epoch": 4.89, + "eval_loss": 0.7854979038238525, + "eval_runtime": 17.6469, + "eval_samples_per_second": 5.61, + "eval_wer": 0.4536082474226804, + "step": 17600 + }, + { + "epoch": 4.92, + "learning_rate": 9.90218961876181e-05, + "loss": 0.2456, + "step": 17700 + }, + { + "epoch": 4.92, + "eval_loss": 0.860173761844635, + "eval_runtime": 17.567, + "eval_samples_per_second": 5.636, + "eval_wer": 0.4652061855670103, + "step": 17700 + }, + { + "epoch": 4.95, + "learning_rate": 9.90163387795932e-05, + "loss": 0.2196, + "step": 17800 + }, + { + "epoch": 4.95, + "eval_loss": 0.7404292225837708, + "eval_runtime": 17.3988, + "eval_samples_per_second": 5.69, + "eval_wer": 0.44329896907216493, + "step": 17800 + }, + { + "epoch": 4.97, + "learning_rate": 9.901078137156831e-05, + "loss": 0.2153, + "step": 17900 + }, + { + "epoch": 4.97, + "eval_loss": 0.8624671101570129, + "eval_runtime": 17.5005, + "eval_samples_per_second": 5.657, + "eval_wer": 0.4652061855670103, + "step": 17900 + }, + { + "epoch": 5.0, + "learning_rate": 9.900522396354341e-05, + "loss": 0.2307, + "step": 18000 + }, + { + "epoch": 5.0, + "eval_loss": 0.702769935131073, + "eval_runtime": 17.8612, + "eval_samples_per_second": 5.543, + "eval_wer": 0.44329896907216493, + "step": 18000 + }, + { + "epoch": 5.03, + "learning_rate": 9.899966655551851e-05, + "loss": 0.2018, + "step": 18100 + }, + { + "epoch": 5.03, + "eval_loss": 0.7851367592811584, + "eval_runtime": 17.3766, + "eval_samples_per_second": 5.697, + "eval_wer": 0.44458762886597936, + "step": 18100 + }, + { + "epoch": 5.06, + "learning_rate": 9.899410914749362e-05, + "loss": 0.2057, + "step": 18200 + }, + { + "epoch": 5.06, + "eval_loss": 0.7941185832023621, + "eval_runtime": 17.5072, + "eval_samples_per_second": 5.655, + "eval_wer": 0.4536082474226804, + "step": 18200 + }, + { + "epoch": 5.08, + "learning_rate": 9.898855173946871e-05, + "loss": 0.2075, + "step": 18300 + }, + { + "epoch": 5.08, + "eval_loss": 0.6440731287002563, + "eval_runtime": 17.3683, + "eval_samples_per_second": 5.7, + "eval_wer": 0.4368556701030928, + "step": 18300 + }, + { + "epoch": 5.11, + "learning_rate": 9.898299433144382e-05, + "loss": 0.2042, + "step": 18400 + }, + { + "epoch": 5.11, + "eval_loss": 0.7736424803733826, + "eval_runtime": 17.3679, + "eval_samples_per_second": 5.7, + "eval_wer": 0.4329896907216495, + "step": 18400 + }, + { + "epoch": 5.14, + "learning_rate": 9.897743692341892e-05, + "loss": 0.208, + "step": 18500 + }, + { + "epoch": 5.14, + "eval_loss": 0.7068067789077759, + "eval_runtime": 17.8158, + "eval_samples_per_second": 5.557, + "eval_wer": 0.43943298969072164, + "step": 18500 + }, + { + "epoch": 5.17, + "learning_rate": 9.897187951539403e-05, + "loss": 0.2056, + "step": 18600 + }, + { + "epoch": 5.17, + "eval_loss": 0.8301738500595093, + "eval_runtime": 17.4918, + "eval_samples_per_second": 5.66, + "eval_wer": 0.45103092783505155, + "step": 18600 + }, + { + "epoch": 5.2, + "learning_rate": 9.896632210736913e-05, + "loss": 0.2037, + "step": 18700 + }, + { + "epoch": 5.2, + "eval_loss": 0.7583587169647217, + "eval_runtime": 17.3452, + "eval_samples_per_second": 5.708, + "eval_wer": 0.4381443298969072, + "step": 18700 + }, + { + "epoch": 5.22, + "learning_rate": 9.896076469934423e-05, + "loss": 0.204, + "step": 18800 + }, + { + "epoch": 5.22, + "eval_loss": 0.7550833821296692, + "eval_runtime": 17.4638, + "eval_samples_per_second": 5.669, + "eval_wer": 0.4742268041237113, + "step": 18800 + }, + { + "epoch": 5.25, + "learning_rate": 9.895520729131933e-05, + "loss": 0.2118, + "step": 18900 + }, + { + "epoch": 5.25, + "eval_loss": 0.7639862895011902, + "eval_runtime": 17.3009, + "eval_samples_per_second": 5.722, + "eval_wer": 0.4420103092783505, + "step": 18900 + }, + { + "epoch": 5.28, + "learning_rate": 9.894964988329444e-05, + "loss": 0.2005, + "step": 19000 + }, + { + "epoch": 5.28, + "eval_loss": 0.7661750912666321, + "eval_runtime": 17.8661, + "eval_samples_per_second": 5.541, + "eval_wer": 0.45103092783505155, + "step": 19000 + }, + { + "epoch": 5.31, + "learning_rate": 9.894409247526953e-05, + "loss": 0.2234, + "step": 19100 + }, + { + "epoch": 5.31, + "eval_loss": 0.7485219836235046, + "eval_runtime": 17.886, + "eval_samples_per_second": 5.535, + "eval_wer": 0.44716494845360827, + "step": 19100 + }, + { + "epoch": 5.33, + "learning_rate": 9.893853506724464e-05, + "loss": 0.2204, + "step": 19200 + }, + { + "epoch": 5.33, + "eval_loss": 0.827965497970581, + "eval_runtime": 17.4582, + "eval_samples_per_second": 5.671, + "eval_wer": 0.4420103092783505, + "step": 19200 + }, + { + "epoch": 5.36, + "learning_rate": 9.893297765921976e-05, + "loss": 0.233, + "step": 19300 + }, + { + "epoch": 5.36, + "eval_loss": 0.750889778137207, + "eval_runtime": 17.5168, + "eval_samples_per_second": 5.652, + "eval_wer": 0.452319587628866, + "step": 19300 + }, + { + "epoch": 5.39, + "learning_rate": 9.892742025119484e-05, + "loss": 0.217, + "step": 19400 + }, + { + "epoch": 5.39, + "eval_loss": 0.8290805220603943, + "eval_runtime": 17.3789, + "eval_samples_per_second": 5.697, + "eval_wer": 0.452319587628866, + "step": 19400 + }, + { + "epoch": 5.42, + "learning_rate": 9.892186284316996e-05, + "loss": 0.2061, + "step": 19500 + }, + { + "epoch": 5.42, + "eval_loss": 0.7057229280471802, + "eval_runtime": 17.3775, + "eval_samples_per_second": 5.697, + "eval_wer": 0.45103092783505155, + "step": 19500 + }, + { + "epoch": 5.45, + "learning_rate": 9.891630543514506e-05, + "loss": 0.2044, + "step": 19600 + }, + { + "epoch": 5.45, + "eval_loss": 0.7502852082252502, + "eval_runtime": 17.4524, + "eval_samples_per_second": 5.673, + "eval_wer": 0.4484536082474227, + "step": 19600 + }, + { + "epoch": 5.47, + "learning_rate": 9.891074802712016e-05, + "loss": 0.2063, + "step": 19700 + }, + { + "epoch": 5.47, + "eval_loss": 0.7316065430641174, + "eval_runtime": 17.2186, + "eval_samples_per_second": 5.75, + "eval_wer": 0.4368556701030928, + "step": 19700 + }, + { + "epoch": 5.5, + "learning_rate": 9.890519061909526e-05, + "loss": 0.1778, + "step": 19800 + }, + { + "epoch": 5.5, + "eval_loss": 0.7007728219032288, + "eval_runtime": 17.1646, + "eval_samples_per_second": 5.768, + "eval_wer": 0.44587628865979384, + "step": 19800 + }, + { + "epoch": 5.53, + "learning_rate": 9.889963321107036e-05, + "loss": 0.2153, + "step": 19900 + }, + { + "epoch": 5.53, + "eval_loss": 0.6902391314506531, + "eval_runtime": 17.7569, + "eval_samples_per_second": 5.575, + "eval_wer": 0.43170103092783507, + "step": 19900 + }, + { + "epoch": 5.56, + "learning_rate": 9.889407580304546e-05, + "loss": 0.1939, + "step": 20000 + }, + { + "epoch": 5.56, + "eval_loss": 0.7636317014694214, + "eval_runtime": 17.4399, + "eval_samples_per_second": 5.677, + "eval_wer": 0.4484536082474227, + "step": 20000 + }, + { + "epoch": 5.58, + "learning_rate": 9.888851839502057e-05, + "loss": 0.204, + "step": 20100 + }, + { + "epoch": 5.58, + "eval_loss": 0.7957937121391296, + "eval_runtime": 17.6575, + "eval_samples_per_second": 5.607, + "eval_wer": 0.44072164948453607, + "step": 20100 + }, + { + "epoch": 5.61, + "learning_rate": 9.888296098699566e-05, + "loss": 0.1844, + "step": 20200 + }, + { + "epoch": 5.61, + "eval_loss": 0.7200835347175598, + "eval_runtime": 17.5413, + "eval_samples_per_second": 5.644, + "eval_wer": 0.4420103092783505, + "step": 20200 + }, + { + "epoch": 5.64, + "learning_rate": 9.887740357897077e-05, + "loss": 0.2165, + "step": 20300 + }, + { + "epoch": 5.64, + "eval_loss": 0.8324032425880432, + "eval_runtime": 17.4764, + "eval_samples_per_second": 5.665, + "eval_wer": 0.45489690721649484, + "step": 20300 + }, + { + "epoch": 5.67, + "learning_rate": 9.887184617094588e-05, + "loss": 0.2087, + "step": 20400 + }, + { + "epoch": 5.67, + "eval_loss": 0.7996511459350586, + "eval_runtime": 17.4391, + "eval_samples_per_second": 5.677, + "eval_wer": 0.45618556701030927, + "step": 20400 + }, + { + "epoch": 5.7, + "learning_rate": 9.886628876292098e-05, + "loss": 0.2297, + "step": 20500 + }, + { + "epoch": 5.7, + "eval_loss": 0.8123847842216492, + "eval_runtime": 17.4148, + "eval_samples_per_second": 5.685, + "eval_wer": 0.4574742268041237, + "step": 20500 + }, + { + "epoch": 5.72, + "learning_rate": 9.886073135489609e-05, + "loss": 0.2202, + "step": 20600 + }, + { + "epoch": 5.72, + "eval_loss": 0.8624526262283325, + "eval_runtime": 17.5176, + "eval_samples_per_second": 5.651, + "eval_wer": 0.452319587628866, + "step": 20600 + }, + { + "epoch": 5.75, + "learning_rate": 9.885517394687118e-05, + "loss": 0.2093, + "step": 20700 + }, + { + "epoch": 5.75, + "eval_loss": 0.8562197685241699, + "eval_runtime": 17.5151, + "eval_samples_per_second": 5.652, + "eval_wer": 0.46262886597938147, + "step": 20700 + }, + { + "epoch": 5.78, + "learning_rate": 9.884961653884629e-05, + "loss": 0.2093, + "step": 20800 + }, + { + "epoch": 5.78, + "eval_loss": 0.8221404552459717, + "eval_runtime": 17.6305, + "eval_samples_per_second": 5.615, + "eval_wer": 0.47164948453608246, + "step": 20800 + }, + { + "epoch": 5.81, + "learning_rate": 9.884405913082139e-05, + "loss": 0.2303, + "step": 20900 + }, + { + "epoch": 5.81, + "eval_loss": 0.7461365461349487, + "eval_runtime": 17.3023, + "eval_samples_per_second": 5.722, + "eval_wer": 0.43943298969072164, + "step": 20900 + }, + { + "epoch": 5.83, + "learning_rate": 9.883850172279649e-05, + "loss": 0.2137, + "step": 21000 + }, + { + "epoch": 5.83, + "eval_loss": 0.8054025769233704, + "eval_runtime": 17.4479, + "eval_samples_per_second": 5.674, + "eval_wer": 0.4536082474226804, + "step": 21000 + }, + { + "epoch": 5.86, + "learning_rate": 9.883294431477159e-05, + "loss": 0.2042, + "step": 21100 + }, + { + "epoch": 5.86, + "eval_loss": 0.7558605074882507, + "eval_runtime": 17.4077, + "eval_samples_per_second": 5.687, + "eval_wer": 0.44716494845360827, + "step": 21100 + }, + { + "epoch": 5.89, + "learning_rate": 9.88273869067467e-05, + "loss": 0.1955, + "step": 21200 + }, + { + "epoch": 5.89, + "eval_loss": 0.8814973831176758, + "eval_runtime": 17.5114, + "eval_samples_per_second": 5.653, + "eval_wer": 0.44329896907216493, + "step": 21200 + }, + { + "epoch": 5.92, + "learning_rate": 9.88218294987218e-05, + "loss": 0.2004, + "step": 21300 + }, + { + "epoch": 5.92, + "eval_loss": 0.8037664294242859, + "eval_runtime": 17.5704, + "eval_samples_per_second": 5.634, + "eval_wer": 0.46649484536082475, + "step": 21300 + }, + { + "epoch": 5.95, + "learning_rate": 9.881627209069691e-05, + "loss": 0.2085, + "step": 21400 + }, + { + "epoch": 5.95, + "eval_loss": 0.7956470251083374, + "eval_runtime": 17.3299, + "eval_samples_per_second": 5.713, + "eval_wer": 0.452319587628866, + "step": 21400 + }, + { + "epoch": 5.97, + "learning_rate": 9.881071468267201e-05, + "loss": 0.2049, + "step": 21500 + }, + { + "epoch": 5.97, + "eval_loss": 0.7397593259811401, + "eval_runtime": 17.4776, + "eval_samples_per_second": 5.664, + "eval_wer": 0.4368556701030928, + "step": 21500 + }, + { + "epoch": 6.0, + "learning_rate": 9.880515727464711e-05, + "loss": 0.1847, + "step": 21600 + }, + { + "epoch": 6.0, + "eval_loss": 0.7041661143302917, + "eval_runtime": 17.5194, + "eval_samples_per_second": 5.651, + "eval_wer": 0.42396907216494845, + "step": 21600 + }, + { + "epoch": 6.03, + "learning_rate": 9.879959986662222e-05, + "loss": 0.1834, + "step": 21700 + }, + { + "epoch": 6.03, + "eval_loss": 0.7885836362838745, + "eval_runtime": 17.3117, + "eval_samples_per_second": 5.719, + "eval_wer": 0.4729381443298969, + "step": 21700 + }, + { + "epoch": 6.06, + "learning_rate": 9.879404245859731e-05, + "loss": 0.1682, + "step": 21800 + }, + { + "epoch": 6.06, + "eval_loss": 0.7541030049324036, + "eval_runtime": 17.3759, + "eval_samples_per_second": 5.698, + "eval_wer": 0.43041237113402064, + "step": 21800 + }, + { + "epoch": 6.09, + "learning_rate": 9.878848505057242e-05, + "loss": 0.1658, + "step": 21900 + }, + { + "epoch": 6.09, + "eval_loss": 0.7061160206794739, + "eval_runtime": 17.5618, + "eval_samples_per_second": 5.637, + "eval_wer": 0.44458762886597936, + "step": 21900 + }, + { + "epoch": 6.11, + "learning_rate": 9.878292764254752e-05, + "loss": 0.1986, + "step": 22000 + }, + { + "epoch": 6.11, + "eval_loss": 0.7886027097702026, + "eval_runtime": 17.6462, + "eval_samples_per_second": 5.61, + "eval_wer": 0.4329896907216495, + "step": 22000 + }, + { + "epoch": 6.14, + "learning_rate": 9.877737023452263e-05, + "loss": 0.1833, + "step": 22100 + }, + { + "epoch": 6.14, + "eval_loss": 0.6864758729934692, + "eval_runtime": 17.5319, + "eval_samples_per_second": 5.647, + "eval_wer": 0.43041237113402064, + "step": 22100 + }, + { + "epoch": 6.17, + "learning_rate": 9.877181282649773e-05, + "loss": 0.2008, + "step": 22200 + }, + { + "epoch": 6.17, + "eval_loss": 0.7436667680740356, + "eval_runtime": 17.6401, + "eval_samples_per_second": 5.612, + "eval_wer": 0.42010309278350516, + "step": 22200 + }, + { + "epoch": 6.2, + "learning_rate": 9.876625541847283e-05, + "loss": 0.2114, + "step": 22300 + }, + { + "epoch": 6.2, + "eval_loss": 0.7265353798866272, + "eval_runtime": 17.6855, + "eval_samples_per_second": 5.598, + "eval_wer": 0.44329896907216493, + "step": 22300 + }, + { + "epoch": 6.22, + "learning_rate": 9.876069801044793e-05, + "loss": 0.1848, + "step": 22400 + }, + { + "epoch": 6.22, + "eval_loss": 0.663320779800415, + "eval_runtime": 17.7987, + "eval_samples_per_second": 5.562, + "eval_wer": 0.43170103092783507, + "step": 22400 + }, + { + "epoch": 6.25, + "learning_rate": 9.875514060242304e-05, + "loss": 0.1877, + "step": 22500 + }, + { + "epoch": 6.25, + "eval_loss": 0.6840032935142517, + "eval_runtime": 18.0706, + "eval_samples_per_second": 5.479, + "eval_wer": 0.45489690721649484, + "step": 22500 + }, + { + "epoch": 6.28, + "learning_rate": 9.874958319439813e-05, + "loss": 0.1667, + "step": 22600 + }, + { + "epoch": 6.28, + "eval_loss": 0.6797974109649658, + "eval_runtime": 17.8615, + "eval_samples_per_second": 5.543, + "eval_wer": 0.44329896907216493, + "step": 22600 + }, + { + "epoch": 6.31, + "learning_rate": 9.874402578637324e-05, + "loss": 0.1786, + "step": 22700 + }, + { + "epoch": 6.31, + "eval_loss": 0.7095053195953369, + "eval_runtime": 18.0172, + "eval_samples_per_second": 5.495, + "eval_wer": 0.4536082474226804, + "step": 22700 + }, + { + "epoch": 6.34, + "learning_rate": 9.873846837834834e-05, + "loss": 0.1952, + "step": 22800 + }, + { + "epoch": 6.34, + "eval_loss": 0.6215536594390869, + "eval_runtime": 17.9111, + "eval_samples_per_second": 5.527, + "eval_wer": 0.43170103092783507, + "step": 22800 + }, + { + "epoch": 6.36, + "learning_rate": 9.873291097032344e-05, + "loss": 0.2022, + "step": 22900 + }, + { + "epoch": 6.36, + "eval_loss": 0.6748619675636292, + "eval_runtime": 17.9802, + "eval_samples_per_second": 5.506, + "eval_wer": 0.4587628865979381, + "step": 22900 + }, + { + "epoch": 6.39, + "learning_rate": 9.872735356229856e-05, + "loss": 0.1906, + "step": 23000 + }, + { + "epoch": 6.39, + "eval_loss": 0.6207524538040161, + "eval_runtime": 17.8119, + "eval_samples_per_second": 5.558, + "eval_wer": 0.44072164948453607, + "step": 23000 + }, + { + "epoch": 6.42, + "learning_rate": 9.872179615427364e-05, + "loss": 0.1926, + "step": 23100 + }, + { + "epoch": 6.42, + "eval_loss": 0.7496910691261292, + "eval_runtime": 18.1906, + "eval_samples_per_second": 5.442, + "eval_wer": 0.4574742268041237, + "step": 23100 + }, + { + "epoch": 6.45, + "learning_rate": 9.871623874624876e-05, + "loss": 0.1854, + "step": 23200 + }, + { + "epoch": 6.45, + "eval_loss": 0.685153603553772, + "eval_runtime": 17.9086, + "eval_samples_per_second": 5.528, + "eval_wer": 0.46005154639175255, + "step": 23200 + }, + { + "epoch": 6.47, + "learning_rate": 9.871068133822386e-05, + "loss": 0.1576, + "step": 23300 + }, + { + "epoch": 6.47, + "eval_loss": 0.649712085723877, + "eval_runtime": 17.9237, + "eval_samples_per_second": 5.523, + "eval_wer": 0.4497422680412371, + "step": 23300 + }, + { + "epoch": 6.5, + "learning_rate": 9.870512393019896e-05, + "loss": 0.1823, + "step": 23400 + }, + { + "epoch": 6.5, + "eval_loss": 0.7309712767601013, + "eval_runtime": 18.1848, + "eval_samples_per_second": 5.444, + "eval_wer": 0.44329896907216493, + "step": 23400 + }, + { + "epoch": 6.53, + "learning_rate": 9.869956652217406e-05, + "loss": 0.1693, + "step": 23500 + }, + { + "epoch": 6.53, + "eval_loss": 0.7329779863357544, + "eval_runtime": 17.7531, + "eval_samples_per_second": 5.576, + "eval_wer": 0.4652061855670103, + "step": 23500 + }, + { + "epoch": 6.56, + "learning_rate": 9.869400911414916e-05, + "loss": 0.1861, + "step": 23600 + }, + { + "epoch": 6.56, + "eval_loss": 0.8161032795906067, + "eval_runtime": 17.6576, + "eval_samples_per_second": 5.607, + "eval_wer": 0.46649484536082475, + "step": 23600 + }, + { + "epoch": 6.59, + "learning_rate": 9.868845170612426e-05, + "loss": 0.1955, + "step": 23700 + }, + { + "epoch": 6.59, + "eval_loss": 0.7811844944953918, + "eval_runtime": 18.1639, + "eval_samples_per_second": 5.45, + "eval_wer": 0.4652061855670103, + "step": 23700 + }, + { + "epoch": 6.61, + "learning_rate": 9.868289429809938e-05, + "loss": 0.1801, + "step": 23800 + }, + { + "epoch": 6.61, + "eval_loss": 0.7747323513031006, + "eval_runtime": 17.4915, + "eval_samples_per_second": 5.66, + "eval_wer": 0.4652061855670103, + "step": 23800 + }, + { + "epoch": 6.64, + "learning_rate": 9.867733689007448e-05, + "loss": 0.1954, + "step": 23900 + }, + { + "epoch": 6.64, + "eval_loss": 0.8298807144165039, + "eval_runtime": 17.8544, + "eval_samples_per_second": 5.545, + "eval_wer": 0.4690721649484536, + "step": 23900 + }, + { + "epoch": 6.67, + "learning_rate": 9.867177948204958e-05, + "loss": 0.1976, + "step": 24000 + }, + { + "epoch": 6.67, + "eval_loss": 0.8623689413070679, + "eval_runtime": 17.5465, + "eval_samples_per_second": 5.642, + "eval_wer": 0.452319587628866, + "step": 24000 + }, + { + "epoch": 6.7, + "learning_rate": 9.866622207402468e-05, + "loss": 0.1839, + "step": 24100 + }, + { + "epoch": 6.7, + "eval_loss": 0.8633375763893127, + "eval_runtime": 17.7487, + "eval_samples_per_second": 5.578, + "eval_wer": 0.45103092783505155, + "step": 24100 + }, + { + "epoch": 6.72, + "learning_rate": 9.866066466599978e-05, + "loss": 0.1858, + "step": 24200 + }, + { + "epoch": 6.72, + "eval_loss": 1.0021711587905884, + "eval_runtime": 17.7581, + "eval_samples_per_second": 5.575, + "eval_wer": 0.4845360824742268, + "step": 24200 + }, + { + "epoch": 6.75, + "learning_rate": 9.865510725797489e-05, + "loss": 0.1753, + "step": 24300 + }, + { + "epoch": 6.75, + "eval_loss": 0.904293417930603, + "eval_runtime": 18.4007, + "eval_samples_per_second": 5.38, + "eval_wer": 0.46649484536082475, + "step": 24300 + }, + { + "epoch": 6.78, + "learning_rate": 9.864954984994998e-05, + "loss": 0.1829, + "step": 24400 + }, + { + "epoch": 6.78, + "eval_loss": 0.7328855991363525, + "eval_runtime": 17.5994, + "eval_samples_per_second": 5.625, + "eval_wer": 0.44458762886597936, + "step": 24400 + }, + { + "epoch": 6.81, + "learning_rate": 9.864399244192509e-05, + "loss": 0.1984, + "step": 24500 + }, + { + "epoch": 6.81, + "eval_loss": 0.7215154767036438, + "eval_runtime": 17.6361, + "eval_samples_per_second": 5.613, + "eval_wer": 0.43556701030927836, + "step": 24500 + }, + { + "epoch": 6.84, + "learning_rate": 9.863843503390019e-05, + "loss": 0.2195, + "step": 24600 + }, + { + "epoch": 6.84, + "eval_loss": 0.7022905945777893, + "eval_runtime": 17.8301, + "eval_samples_per_second": 5.552, + "eval_wer": 0.46005154639175255, + "step": 24600 + }, + { + "epoch": 6.86, + "learning_rate": 9.86328776258753e-05, + "loss": 0.2079, + "step": 24700 + }, + { + "epoch": 6.86, + "eval_loss": 0.7629209756851196, + "eval_runtime": 18.0665, + "eval_samples_per_second": 5.48, + "eval_wer": 0.4639175257731959, + "step": 24700 + }, + { + "epoch": 6.89, + "learning_rate": 9.86273202178504e-05, + "loss": 0.2118, + "step": 24800 + }, + { + "epoch": 6.89, + "eval_loss": 0.6994808316230774, + "eval_runtime": 17.5504, + "eval_samples_per_second": 5.641, + "eval_wer": 0.43556701030927836, + "step": 24800 + }, + { + "epoch": 6.92, + "learning_rate": 9.862176280982551e-05, + "loss": 0.2154, + "step": 24900 + }, + { + "epoch": 6.92, + "eval_loss": 0.6871984601020813, + "eval_runtime": 18.0511, + "eval_samples_per_second": 5.484, + "eval_wer": 0.4484536082474227, + "step": 24900 + }, + { + "epoch": 6.95, + "learning_rate": 9.861620540180061e-05, + "loss": 0.1823, + "step": 25000 + }, + { + "epoch": 6.95, + "eval_loss": 0.5884273052215576, + "eval_runtime": 17.6454, + "eval_samples_per_second": 5.611, + "eval_wer": 0.4420103092783505, + "step": 25000 + }, + { + "epoch": 6.97, + "learning_rate": 9.861064799377571e-05, + "loss": 0.1786, + "step": 25100 + }, + { + "epoch": 6.97, + "eval_loss": 0.7519210577011108, + "eval_runtime": 17.8606, + "eval_samples_per_second": 5.543, + "eval_wer": 0.46262886597938147, + "step": 25100 + }, + { + "epoch": 7.0, + "learning_rate": 9.860509058575081e-05, + "loss": 0.1841, + "step": 25200 + }, + { + "epoch": 7.0, + "eval_loss": 0.7630220651626587, + "eval_runtime": 17.5638, + "eval_samples_per_second": 5.637, + "eval_wer": 0.4420103092783505, + "step": 25200 + }, + { + "epoch": 7.03, + "learning_rate": 9.859953317772591e-05, + "loss": 0.1866, + "step": 25300 + }, + { + "epoch": 7.03, + "eval_loss": 0.7063058614730835, + "eval_runtime": 17.2492, + "eval_samples_per_second": 5.739, + "eval_wer": 0.45618556701030927, + "step": 25300 + }, + { + "epoch": 7.06, + "learning_rate": 9.859397576970102e-05, + "loss": 0.1756, + "step": 25400 + }, + { + "epoch": 7.06, + "eval_loss": 0.6924075484275818, + "eval_runtime": 18.1923, + "eval_samples_per_second": 5.442, + "eval_wer": 0.45618556701030927, + "step": 25400 + }, + { + "epoch": 7.09, + "learning_rate": 9.858841836167611e-05, + "loss": 0.1834, + "step": 25500 + }, + { + "epoch": 7.09, + "eval_loss": 0.7205408215522766, + "eval_runtime": 17.5655, + "eval_samples_per_second": 5.636, + "eval_wer": 0.4420103092783505, + "step": 25500 + }, + { + "epoch": 7.11, + "learning_rate": 9.858286095365123e-05, + "loss": 0.1556, + "step": 25600 + }, + { + "epoch": 7.11, + "eval_loss": 0.9185993671417236, + "eval_runtime": 17.8154, + "eval_samples_per_second": 5.557, + "eval_wer": 0.44458762886597936, + "step": 25600 + }, + { + "epoch": 7.14, + "learning_rate": 9.857730354562633e-05, + "loss": 0.1736, + "step": 25700 + }, + { + "epoch": 7.14, + "eval_loss": 0.7671197652816772, + "eval_runtime": 17.8195, + "eval_samples_per_second": 5.556, + "eval_wer": 0.44329896907216493, + "step": 25700 + }, + { + "epoch": 7.17, + "learning_rate": 9.857174613760143e-05, + "loss": 0.1535, + "step": 25800 + }, + { + "epoch": 7.17, + "eval_loss": 0.813725471496582, + "eval_runtime": 17.458, + "eval_samples_per_second": 5.671, + "eval_wer": 0.44716494845360827, + "step": 25800 + }, + { + "epoch": 7.2, + "learning_rate": 9.856618872957653e-05, + "loss": 0.1725, + "step": 25900 + }, + { + "epoch": 7.2, + "eval_loss": 0.860133707523346, + "eval_runtime": 17.7915, + "eval_samples_per_second": 5.564, + "eval_wer": 0.45618556701030927, + "step": 25900 + }, + { + "epoch": 7.22, + "learning_rate": 9.856063132155163e-05, + "loss": 0.1883, + "step": 26000 + }, + { + "epoch": 7.22, + "eval_loss": 0.846496045589447, + "eval_runtime": 17.5964, + "eval_samples_per_second": 5.626, + "eval_wer": 0.4690721649484536, + "step": 26000 + }, + { + "epoch": 7.25, + "learning_rate": 9.855507391352674e-05, + "loss": 0.1626, + "step": 26100 + }, + { + "epoch": 7.25, + "eval_loss": 0.6927329301834106, + "eval_runtime": 17.582, + "eval_samples_per_second": 5.631, + "eval_wer": 0.42783505154639173, + "step": 26100 + }, + { + "epoch": 7.28, + "learning_rate": 9.854951650550184e-05, + "loss": 0.1758, + "step": 26200 + }, + { + "epoch": 7.28, + "eval_loss": 0.7043600082397461, + "eval_runtime": 18.8361, + "eval_samples_per_second": 5.256, + "eval_wer": 0.4252577319587629, + "step": 26200 + }, + { + "epoch": 7.31, + "learning_rate": 9.854395909747694e-05, + "loss": 0.1568, + "step": 26300 + }, + { + "epoch": 7.31, + "eval_loss": 0.7357842326164246, + "eval_runtime": 18.3695, + "eval_samples_per_second": 5.389, + "eval_wer": 0.44587628865979384, + "step": 26300 + }, + { + "epoch": 7.34, + "learning_rate": 9.853840168945204e-05, + "loss": 0.1583, + "step": 26400 + }, + { + "epoch": 7.34, + "eval_loss": 0.7848875522613525, + "eval_runtime": 17.9559, + "eval_samples_per_second": 5.513, + "eval_wer": 0.4420103092783505, + "step": 26400 + }, + { + "epoch": 7.36, + "learning_rate": 9.853284428142714e-05, + "loss": 0.167, + "step": 26500 + }, + { + "epoch": 7.36, + "eval_loss": 0.7771514654159546, + "eval_runtime": 17.8217, + "eval_samples_per_second": 5.555, + "eval_wer": 0.4420103092783505, + "step": 26500 + }, + { + "epoch": 7.39, + "learning_rate": 9.852728687340224e-05, + "loss": 0.1659, + "step": 26600 + }, + { + "epoch": 7.39, + "eval_loss": 0.8126515746116638, + "eval_runtime": 18.1033, + "eval_samples_per_second": 5.469, + "eval_wer": 0.4420103092783505, + "step": 26600 + }, + { + "epoch": 7.42, + "learning_rate": 9.852172946537736e-05, + "loss": 0.1909, + "step": 26700 + }, + { + "epoch": 7.42, + "eval_loss": 0.7457703948020935, + "eval_runtime": 18.2622, + "eval_samples_per_second": 5.421, + "eval_wer": 0.43427835051546393, + "step": 26700 + }, + { + "epoch": 7.45, + "learning_rate": 9.851617205735245e-05, + "loss": 0.1842, + "step": 26800 + }, + { + "epoch": 7.45, + "eval_loss": 0.7543534636497498, + "eval_runtime": 18.2488, + "eval_samples_per_second": 5.425, + "eval_wer": 0.45103092783505155, + "step": 26800 + }, + { + "epoch": 7.47, + "learning_rate": 9.851061464932756e-05, + "loss": 0.1839, + "step": 26900 + }, + { + "epoch": 7.47, + "eval_loss": 0.7522377371788025, + "eval_runtime": 18.0753, + "eval_samples_per_second": 5.477, + "eval_wer": 0.43170103092783507, + "step": 26900 + }, + { + "epoch": 7.5, + "learning_rate": 9.850505724130266e-05, + "loss": 0.158, + "step": 27000 + }, + { + "epoch": 7.5, + "eval_loss": 0.7622743844985962, + "eval_runtime": 17.6407, + "eval_samples_per_second": 5.612, + "eval_wer": 0.4265463917525773, + "step": 27000 + }, + { + "epoch": 7.53, + "learning_rate": 9.849949983327776e-05, + "loss": 0.1685, + "step": 27100 + }, + { + "epoch": 7.53, + "eval_loss": 0.7140101194381714, + "eval_runtime": 17.3617, + "eval_samples_per_second": 5.702, + "eval_wer": 0.4368556701030928, + "step": 27100 + }, + { + "epoch": 7.56, + "learning_rate": 9.849394242525287e-05, + "loss": 0.1785, + "step": 27200 + }, + { + "epoch": 7.56, + "eval_loss": 0.7777717709541321, + "eval_runtime": 17.2778, + "eval_samples_per_second": 5.73, + "eval_wer": 0.4097938144329897, + "step": 27200 + }, + { + "epoch": 7.59, + "learning_rate": 9.848838501722798e-05, + "loss": 0.1633, + "step": 27300 + }, + { + "epoch": 7.59, + "eval_loss": 0.7742789387702942, + "eval_runtime": 17.358, + "eval_samples_per_second": 5.703, + "eval_wer": 0.41881443298969073, + "step": 27300 + }, + { + "epoch": 7.61, + "learning_rate": 9.848282760920308e-05, + "loss": 0.1841, + "step": 27400 + }, + { + "epoch": 7.61, + "eval_loss": 0.794254720211029, + "eval_runtime": 17.5933, + "eval_samples_per_second": 5.627, + "eval_wer": 0.4368556701030928, + "step": 27400 + }, + { + "epoch": 7.64, + "learning_rate": 9.847727020117818e-05, + "loss": 0.176, + "step": 27500 + }, + { + "epoch": 7.64, + "eval_loss": 0.7638439536094666, + "eval_runtime": 17.3793, + "eval_samples_per_second": 5.696, + "eval_wer": 0.45489690721649484, + "step": 27500 + }, + { + "epoch": 7.67, + "learning_rate": 9.847171279315328e-05, + "loss": 0.158, + "step": 27600 + }, + { + "epoch": 7.67, + "eval_loss": 0.7681997418403625, + "eval_runtime": 17.46, + "eval_samples_per_second": 5.67, + "eval_wer": 0.4574742268041237, + "step": 27600 + }, + { + "epoch": 7.7, + "learning_rate": 9.846615538512838e-05, + "loss": 0.1915, + "step": 27700 + }, + { + "epoch": 7.7, + "eval_loss": 0.7488833069801331, + "eval_runtime": 17.731, + "eval_samples_per_second": 5.583, + "eval_wer": 0.44072164948453607, + "step": 27700 + }, + { + "epoch": 7.72, + "learning_rate": 9.846059797710349e-05, + "loss": 0.1634, + "step": 27800 + }, + { + "epoch": 7.72, + "eval_loss": 0.7865298390388489, + "eval_runtime": 17.4124, + "eval_samples_per_second": 5.686, + "eval_wer": 0.43556701030927836, + "step": 27800 + }, + { + "epoch": 7.75, + "learning_rate": 9.845504056907858e-05, + "loss": 0.2035, + "step": 27900 + }, + { + "epoch": 7.75, + "eval_loss": 0.7207059860229492, + "eval_runtime": 17.7628, + "eval_samples_per_second": 5.573, + "eval_wer": 0.4252577319587629, + "step": 27900 + }, + { + "epoch": 7.78, + "learning_rate": 9.844948316105369e-05, + "loss": 0.1679, + "step": 28000 + }, + { + "epoch": 7.78, + "eval_loss": 0.7208133339881897, + "eval_runtime": 17.4884, + "eval_samples_per_second": 5.661, + "eval_wer": 0.4484536082474227, + "step": 28000 + }, + { + "epoch": 7.81, + "learning_rate": 9.84439257530288e-05, + "loss": 0.1646, + "step": 28100 + }, + { + "epoch": 7.81, + "eval_loss": 0.7599995136260986, + "eval_runtime": 17.4136, + "eval_samples_per_second": 5.685, + "eval_wer": 0.45103092783505155, + "step": 28100 + }, + { + "epoch": 7.84, + "learning_rate": 9.84383683450039e-05, + "loss": 0.1781, + "step": 28200 + }, + { + "epoch": 7.84, + "eval_loss": 0.7319245934486389, + "eval_runtime": 17.5926, + "eval_samples_per_second": 5.627, + "eval_wer": 0.4265463917525773, + "step": 28200 + }, + { + "epoch": 7.86, + "learning_rate": 9.843281093697901e-05, + "loss": 0.19, + "step": 28300 + }, + { + "epoch": 7.86, + "eval_loss": 0.7298288345336914, + "eval_runtime": 17.6158, + "eval_samples_per_second": 5.62, + "eval_wer": 0.43170103092783507, + "step": 28300 + }, + { + "epoch": 7.89, + "learning_rate": 9.84272535289541e-05, + "loss": 0.1792, + "step": 28400 + }, + { + "epoch": 7.89, + "eval_loss": 0.7053973078727722, + "eval_runtime": 17.3878, + "eval_samples_per_second": 5.694, + "eval_wer": 0.4381443298969072, + "step": 28400 + }, + { + "epoch": 7.92, + "learning_rate": 9.842169612092921e-05, + "loss": 0.1709, + "step": 28500 + }, + { + "epoch": 7.92, + "eval_loss": 0.8577209115028381, + "eval_runtime": 17.4901, + "eval_samples_per_second": 5.66, + "eval_wer": 0.4265463917525773, + "step": 28500 + }, + { + "epoch": 7.95, + "learning_rate": 9.841613871290431e-05, + "loss": 0.2003, + "step": 28600 + }, + { + "epoch": 7.95, + "eval_loss": 0.7145041227340698, + "eval_runtime": 17.3386, + "eval_samples_per_second": 5.71, + "eval_wer": 0.41881443298969073, + "step": 28600 + }, + { + "epoch": 7.97, + "learning_rate": 9.841058130487941e-05, + "loss": 0.1722, + "step": 28700 + }, + { + "epoch": 7.97, + "eval_loss": 0.7263432741165161, + "eval_runtime": 17.3569, + "eval_samples_per_second": 5.704, + "eval_wer": 0.4175257731958763, + "step": 28700 + }, + { + "epoch": 8.0, + "learning_rate": 9.840502389685451e-05, + "loss": 0.157, + "step": 28800 + }, + { + "epoch": 8.0, + "eval_loss": 0.7807848453521729, + "eval_runtime": 18.0075, + "eval_samples_per_second": 5.498, + "eval_wer": 0.41881443298969073, + "step": 28800 + }, + { + "epoch": 8.03, + "learning_rate": 9.839946648882961e-05, + "loss": 0.1728, + "step": 28900 + }, + { + "epoch": 8.03, + "eval_loss": 0.7600880861282349, + "eval_runtime": 17.8814, + "eval_samples_per_second": 5.536, + "eval_wer": 0.4329896907216495, + "step": 28900 + }, + { + "epoch": 8.06, + "learning_rate": 9.839390908080471e-05, + "loss": 0.1859, + "step": 29000 + }, + { + "epoch": 8.06, + "eval_loss": 0.7904886603355408, + "eval_runtime": 17.4997, + "eval_samples_per_second": 5.657, + "eval_wer": 0.41365979381443296, + "step": 29000 + }, + { + "epoch": 8.09, + "learning_rate": 9.838835167277983e-05, + "loss": 0.1759, + "step": 29100 + }, + { + "epoch": 8.09, + "eval_loss": 0.8925608396530151, + "eval_runtime": 17.4355, + "eval_samples_per_second": 5.678, + "eval_wer": 0.43556701030927836, + "step": 29100 + }, + { + "epoch": 8.11, + "learning_rate": 9.838279426475491e-05, + "loss": 0.1689, + "step": 29200 + }, + { + "epoch": 8.11, + "eval_loss": 0.7167654037475586, + "eval_runtime": 17.7948, + "eval_samples_per_second": 5.563, + "eval_wer": 0.43427835051546393, + "step": 29200 + }, + { + "epoch": 8.14, + "learning_rate": 9.837723685673003e-05, + "loss": 0.1708, + "step": 29300 + }, + { + "epoch": 8.14, + "eval_loss": 0.7209995985031128, + "eval_runtime": 17.5008, + "eval_samples_per_second": 5.657, + "eval_wer": 0.42912371134020616, + "step": 29300 + }, + { + "epoch": 8.17, + "learning_rate": 9.837167944870513e-05, + "loss": 0.1549, + "step": 29400 + }, + { + "epoch": 8.17, + "eval_loss": 0.7742015719413757, + "eval_runtime": 17.5354, + "eval_samples_per_second": 5.646, + "eval_wer": 0.4420103092783505, + "step": 29400 + }, + { + "epoch": 8.2, + "learning_rate": 9.836612204068023e-05, + "loss": 0.1605, + "step": 29500 + }, + { + "epoch": 8.2, + "eval_loss": 0.7685571312904358, + "eval_runtime": 17.5794, + "eval_samples_per_second": 5.632, + "eval_wer": 0.42783505154639173, + "step": 29500 + }, + { + "epoch": 8.22, + "learning_rate": 9.836056463265534e-05, + "loss": 0.1443, + "step": 29600 + }, + { + "epoch": 8.22, + "eval_loss": 0.8935885429382324, + "eval_runtime": 17.5375, + "eval_samples_per_second": 5.645, + "eval_wer": 0.43556701030927836, + "step": 29600 + }, + { + "epoch": 8.25, + "learning_rate": 9.835500722463043e-05, + "loss": 0.1492, + "step": 29700 + }, + { + "epoch": 8.25, + "eval_loss": 0.7365788221359253, + "eval_runtime": 17.3626, + "eval_samples_per_second": 5.702, + "eval_wer": 0.42912371134020616, + "step": 29700 + }, + { + "epoch": 8.28, + "learning_rate": 9.834944981660554e-05, + "loss": 0.1505, + "step": 29800 + }, + { + "epoch": 8.28, + "eval_loss": 0.7134827375411987, + "eval_runtime": 17.6924, + "eval_samples_per_second": 5.596, + "eval_wer": 0.42010309278350516, + "step": 29800 + }, + { + "epoch": 8.31, + "learning_rate": 9.834389240858064e-05, + "loss": 0.1662, + "step": 29900 + }, + { + "epoch": 8.31, + "eval_loss": 0.7517086863517761, + "eval_runtime": 17.6753, + "eval_samples_per_second": 5.601, + "eval_wer": 0.422680412371134, + "step": 29900 + }, + { + "epoch": 8.34, + "learning_rate": 9.833833500055574e-05, + "loss": 0.1557, + "step": 30000 + }, + { + "epoch": 8.34, + "eval_loss": 0.8542296290397644, + "eval_runtime": 17.6307, + "eval_samples_per_second": 5.615, + "eval_wer": 0.4368556701030928, + "step": 30000 + }, + { + "epoch": 8.36, + "learning_rate": 9.833277759253084e-05, + "loss": 0.1532, + "step": 30100 + }, + { + "epoch": 8.36, + "eval_loss": 0.7641463875770569, + "eval_runtime": 17.5001, + "eval_samples_per_second": 5.657, + "eval_wer": 0.42396907216494845, + "step": 30100 + }, + { + "epoch": 8.39, + "learning_rate": 9.832722018450596e-05, + "loss": 0.1636, + "step": 30200 + }, + { + "epoch": 8.39, + "eval_loss": 0.8011400699615479, + "eval_runtime": 17.3521, + "eval_samples_per_second": 5.705, + "eval_wer": 0.44458762886597936, + "step": 30200 + }, + { + "epoch": 8.42, + "learning_rate": 9.832166277648105e-05, + "loss": 0.1503, + "step": 30300 + }, + { + "epoch": 8.42, + "eval_loss": 0.7441977858543396, + "eval_runtime": 17.6318, + "eval_samples_per_second": 5.615, + "eval_wer": 0.42912371134020616, + "step": 30300 + }, + { + "epoch": 8.45, + "learning_rate": 9.831610536845616e-05, + "loss": 0.157, + "step": 30400 + }, + { + "epoch": 8.45, + "eval_loss": 0.7959823608398438, + "eval_runtime": 17.5355, + "eval_samples_per_second": 5.646, + "eval_wer": 0.43170103092783507, + "step": 30400 + }, + { + "epoch": 8.47, + "learning_rate": 9.831054796043126e-05, + "loss": 0.1934, + "step": 30500 + }, + { + "epoch": 8.47, + "eval_loss": 0.7789689898490906, + "eval_runtime": 17.4458, + "eval_samples_per_second": 5.675, + "eval_wer": 0.4497422680412371, + "step": 30500 + }, + { + "epoch": 8.5, + "learning_rate": 9.830499055240636e-05, + "loss": 0.1822, + "step": 30600 + }, + { + "epoch": 8.5, + "eval_loss": 0.6615021228790283, + "eval_runtime": 17.5369, + "eval_samples_per_second": 5.645, + "eval_wer": 0.4252577319587629, + "step": 30600 + }, + { + "epoch": 8.53, + "learning_rate": 9.829943314438148e-05, + "loss": 0.155, + "step": 30700 + }, + { + "epoch": 8.53, + "eval_loss": 0.7741401791572571, + "eval_runtime": 17.7325, + "eval_samples_per_second": 5.583, + "eval_wer": 0.43041237113402064, + "step": 30700 + }, + { + "epoch": 8.56, + "learning_rate": 9.829387573635656e-05, + "loss": 0.1626, + "step": 30800 + }, + { + "epoch": 8.56, + "eval_loss": 0.7389179468154907, + "eval_runtime": 17.6894, + "eval_samples_per_second": 5.597, + "eval_wer": 0.4381443298969072, + "step": 30800 + }, + { + "epoch": 8.59, + "learning_rate": 9.828831832833168e-05, + "loss": 0.1872, + "step": 30900 + }, + { + "epoch": 8.59, + "eval_loss": 0.6793811917304993, + "eval_runtime": 17.4718, + "eval_samples_per_second": 5.666, + "eval_wer": 0.4381443298969072, + "step": 30900 + }, + { + "epoch": 8.61, + "learning_rate": 9.828276092030678e-05, + "loss": 0.1521, + "step": 31000 + }, + { + "epoch": 8.61, + "eval_loss": 0.720003068447113, + "eval_runtime": 17.8272, + "eval_samples_per_second": 5.553, + "eval_wer": 0.42396907216494845, + "step": 31000 + }, + { + "epoch": 8.64, + "learning_rate": 9.827720351228188e-05, + "loss": 0.1776, + "step": 31100 + }, + { + "epoch": 8.64, + "eval_loss": 0.7978392243385315, + "eval_runtime": 17.9635, + "eval_samples_per_second": 5.511, + "eval_wer": 0.43427835051546393, + "step": 31100 + }, + { + "epoch": 8.67, + "learning_rate": 9.827164610425698e-05, + "loss": 0.1639, + "step": 31200 + }, + { + "epoch": 8.67, + "eval_loss": 0.6895660161972046, + "eval_runtime": 17.433, + "eval_samples_per_second": 5.679, + "eval_wer": 0.43170103092783507, + "step": 31200 + }, + { + "epoch": 8.7, + "learning_rate": 9.826608869623208e-05, + "loss": 0.1811, + "step": 31300 + }, + { + "epoch": 8.7, + "eval_loss": 0.6539278030395508, + "eval_runtime": 17.6188, + "eval_samples_per_second": 5.619, + "eval_wer": 0.4497422680412371, + "step": 31300 + }, + { + "epoch": 8.72, + "learning_rate": 9.826053128820718e-05, + "loss": 0.1783, + "step": 31400 + }, + { + "epoch": 8.72, + "eval_loss": 0.8889223337173462, + "eval_runtime": 17.4796, + "eval_samples_per_second": 5.664, + "eval_wer": 0.44458762886597936, + "step": 31400 + }, + { + "epoch": 8.75, + "learning_rate": 9.825497388018229e-05, + "loss": 0.1706, + "step": 31500 + }, + { + "epoch": 8.75, + "eval_loss": 0.7976836562156677, + "eval_runtime": 17.3817, + "eval_samples_per_second": 5.696, + "eval_wer": 0.42396907216494845, + "step": 31500 + }, + { + "epoch": 8.78, + "learning_rate": 9.824941647215738e-05, + "loss": 0.1666, + "step": 31600 + }, + { + "epoch": 8.78, + "eval_loss": 0.8039941787719727, + "eval_runtime": 17.7238, + "eval_samples_per_second": 5.586, + "eval_wer": 0.43556701030927836, + "step": 31600 + }, + { + "epoch": 8.81, + "learning_rate": 9.82438590641325e-05, + "loss": 0.1493, + "step": 31700 + }, + { + "epoch": 8.81, + "eval_loss": 0.9158120155334473, + "eval_runtime": 17.3559, + "eval_samples_per_second": 5.704, + "eval_wer": 0.4368556701030928, + "step": 31700 + }, + { + "epoch": 8.84, + "learning_rate": 9.82383016561076e-05, + "loss": 0.1558, + "step": 31800 + }, + { + "epoch": 8.84, + "eval_loss": 0.7148767113685608, + "eval_runtime": 17.5657, + "eval_samples_per_second": 5.636, + "eval_wer": 0.4213917525773196, + "step": 31800 + }, + { + "epoch": 8.86, + "learning_rate": 9.82327442480827e-05, + "loss": 0.1689, + "step": 31900 + }, + { + "epoch": 8.86, + "eval_loss": 0.6876005530357361, + "eval_runtime": 17.4155, + "eval_samples_per_second": 5.685, + "eval_wer": 0.43170103092783507, + "step": 31900 + }, + { + "epoch": 8.89, + "learning_rate": 9.822718684005781e-05, + "loss": 0.1657, + "step": 32000 + }, + { + "epoch": 8.89, + "eval_loss": 0.702477216720581, + "eval_runtime": 17.5273, + "eval_samples_per_second": 5.648, + "eval_wer": 0.44329896907216493, + "step": 32000 + }, + { + "epoch": 8.92, + "learning_rate": 9.82216294320329e-05, + "loss": 0.1887, + "step": 32100 + }, + { + "epoch": 8.92, + "eval_loss": 0.670263946056366, + "eval_runtime": 18.0974, + "eval_samples_per_second": 5.47, + "eval_wer": 0.4252577319587629, + "step": 32100 + }, + { + "epoch": 8.95, + "learning_rate": 9.821607202400801e-05, + "loss": 0.1743, + "step": 32200 + }, + { + "epoch": 8.95, + "eval_loss": 0.6662067174911499, + "eval_runtime": 17.5027, + "eval_samples_per_second": 5.656, + "eval_wer": 0.44072164948453607, + "step": 32200 + }, + { + "epoch": 8.97, + "learning_rate": 9.821051461598311e-05, + "loss": 0.1697, + "step": 32300 + }, + { + "epoch": 8.97, + "eval_loss": 0.6950443983078003, + "eval_runtime": 17.4463, + "eval_samples_per_second": 5.675, + "eval_wer": 0.42783505154639173, + "step": 32300 + }, + { + "epoch": 9.0, + "learning_rate": 9.820495720795821e-05, + "loss": 0.1565, + "step": 32400 + }, + { + "epoch": 9.0, + "eval_loss": 0.682771623134613, + "eval_runtime": 17.574, + "eval_samples_per_second": 5.633, + "eval_wer": 0.422680412371134, + "step": 32400 + }, + { + "epoch": 9.03, + "learning_rate": 9.819939979993331e-05, + "loss": 0.154, + "step": 32500 + }, + { + "epoch": 9.03, + "eval_loss": 0.7133552432060242, + "eval_runtime": 17.5006, + "eval_samples_per_second": 5.657, + "eval_wer": 0.4329896907216495, + "step": 32500 + }, + { + "epoch": 9.06, + "learning_rate": 9.819384239190843e-05, + "loss": 0.159, + "step": 32600 + }, + { + "epoch": 9.06, + "eval_loss": 0.7330553531646729, + "eval_runtime": 17.2801, + "eval_samples_per_second": 5.729, + "eval_wer": 0.4420103092783505, + "step": 32600 + }, + { + "epoch": 9.09, + "learning_rate": 9.818828498388351e-05, + "loss": 0.1585, + "step": 32700 + }, + { + "epoch": 9.09, + "eval_loss": 0.696050763130188, + "eval_runtime": 17.5298, + "eval_samples_per_second": 5.648, + "eval_wer": 0.4213917525773196, + "step": 32700 + }, + { + "epoch": 9.11, + "learning_rate": 9.818272757585863e-05, + "loss": 0.1595, + "step": 32800 + }, + { + "epoch": 9.11, + "eval_loss": 0.7466849088668823, + "eval_runtime": 17.3402, + "eval_samples_per_second": 5.709, + "eval_wer": 0.42783505154639173, + "step": 32800 + }, + { + "epoch": 9.14, + "learning_rate": 9.817717016783373e-05, + "loss": 0.1507, + "step": 32900 + }, + { + "epoch": 9.14, + "eval_loss": 0.7582687735557556, + "eval_runtime": 17.6824, + "eval_samples_per_second": 5.599, + "eval_wer": 0.43041237113402064, + "step": 32900 + }, + { + "epoch": 9.17, + "learning_rate": 9.817161275980883e-05, + "loss": 0.1586, + "step": 33000 + }, + { + "epoch": 9.17, + "eval_loss": 0.7383239269256592, + "eval_runtime": 17.5908, + "eval_samples_per_second": 5.628, + "eval_wer": 0.4265463917525773, + "step": 33000 + }, + { + "epoch": 9.2, + "learning_rate": 9.816605535178394e-05, + "loss": 0.1498, + "step": 33100 + }, + { + "epoch": 9.2, + "eval_loss": 0.9060437083244324, + "eval_runtime": 17.5173, + "eval_samples_per_second": 5.652, + "eval_wer": 0.43943298969072164, + "step": 33100 + }, + { + "epoch": 9.22, + "learning_rate": 9.816049794375903e-05, + "loss": 0.1415, + "step": 33200 + }, + { + "epoch": 9.22, + "eval_loss": 1.02446448802948, + "eval_runtime": 17.6833, + "eval_samples_per_second": 5.598, + "eval_wer": 0.46134020618556704, + "step": 33200 + }, + { + "epoch": 9.25, + "learning_rate": 9.815494053573414e-05, + "loss": 0.1465, + "step": 33300 + }, + { + "epoch": 9.25, + "eval_loss": 1.0142923593521118, + "eval_runtime": 17.6092, + "eval_samples_per_second": 5.622, + "eval_wer": 0.46005154639175255, + "step": 33300 + }, + { + "epoch": 9.28, + "learning_rate": 9.814938312770924e-05, + "loss": 0.155, + "step": 33400 + }, + { + "epoch": 9.28, + "eval_loss": 0.8718487620353699, + "eval_runtime": 17.6525, + "eval_samples_per_second": 5.608, + "eval_wer": 0.4536082474226804, + "step": 33400 + }, + { + "epoch": 9.31, + "learning_rate": 9.814382571968434e-05, + "loss": 0.1459, + "step": 33500 + }, + { + "epoch": 9.31, + "eval_loss": 0.6963269114494324, + "eval_runtime": 17.6886, + "eval_samples_per_second": 5.597, + "eval_wer": 0.42912371134020616, + "step": 33500 + }, + { + "epoch": 9.34, + "learning_rate": 9.813826831165944e-05, + "loss": 0.1598, + "step": 33600 + }, + { + "epoch": 9.34, + "eval_loss": 0.9281795024871826, + "eval_runtime": 17.3291, + "eval_samples_per_second": 5.713, + "eval_wer": 0.45103092783505155, + "step": 33600 + }, + { + "epoch": 9.36, + "learning_rate": 9.813271090363455e-05, + "loss": 0.1823, + "step": 33700 + }, + { + "epoch": 9.36, + "eval_loss": 0.9645785093307495, + "eval_runtime": 17.1301, + "eval_samples_per_second": 5.779, + "eval_wer": 0.4497422680412371, + "step": 33700 + }, + { + "epoch": 9.39, + "learning_rate": 9.812715349560965e-05, + "loss": 0.167, + "step": 33800 + }, + { + "epoch": 9.39, + "eval_loss": 0.9201110005378723, + "eval_runtime": 17.7043, + "eval_samples_per_second": 5.592, + "eval_wer": 0.4420103092783505, + "step": 33800 + }, + { + "epoch": 9.42, + "learning_rate": 9.812159608758476e-05, + "loss": 0.1381, + "step": 33900 + }, + { + "epoch": 9.42, + "eval_loss": 0.8799803853034973, + "eval_runtime": 17.5771, + "eval_samples_per_second": 5.632, + "eval_wer": 0.4420103092783505, + "step": 33900 + }, + { + "epoch": 9.45, + "learning_rate": 9.811603867955986e-05, + "loss": 0.1651, + "step": 34000 + }, + { + "epoch": 9.45, + "eval_loss": 0.8249523043632507, + "eval_runtime": 17.7685, + "eval_samples_per_second": 5.572, + "eval_wer": 0.44329896907216493, + "step": 34000 + }, + { + "epoch": 9.47, + "learning_rate": 9.811048127153496e-05, + "loss": 0.1583, + "step": 34100 + }, + { + "epoch": 9.47, + "eval_loss": 0.7931082248687744, + "eval_runtime": 17.569, + "eval_samples_per_second": 5.635, + "eval_wer": 0.42783505154639173, + "step": 34100 + }, + { + "epoch": 9.5, + "learning_rate": 9.810492386351006e-05, + "loss": 0.1443, + "step": 34200 + }, + { + "epoch": 9.5, + "eval_loss": 0.9122607111930847, + "eval_runtime": 17.381, + "eval_samples_per_second": 5.696, + "eval_wer": 0.44072164948453607, + "step": 34200 + }, + { + "epoch": 9.53, + "learning_rate": 9.809936645548516e-05, + "loss": 0.1597, + "step": 34300 + }, + { + "epoch": 9.53, + "eval_loss": 0.7589895725250244, + "eval_runtime": 17.8656, + "eval_samples_per_second": 5.541, + "eval_wer": 0.4162371134020619, + "step": 34300 + }, + { + "epoch": 9.56, + "learning_rate": 9.809380904746028e-05, + "loss": 0.1477, + "step": 34400 + }, + { + "epoch": 9.56, + "eval_loss": 0.7940624356269836, + "eval_runtime": 17.883, + "eval_samples_per_second": 5.536, + "eval_wer": 0.4420103092783505, + "step": 34400 + }, + { + "epoch": 9.59, + "learning_rate": 9.808825163943536e-05, + "loss": 0.1602, + "step": 34500 + }, + { + "epoch": 9.59, + "eval_loss": 0.8617969155311584, + "eval_runtime": 17.5334, + "eval_samples_per_second": 5.646, + "eval_wer": 0.4381443298969072, + "step": 34500 + }, + { + "epoch": 9.61, + "learning_rate": 9.808269423141048e-05, + "loss": 0.1788, + "step": 34600 + }, + { + "epoch": 9.61, + "eval_loss": 0.8317437767982483, + "eval_runtime": 17.4731, + "eval_samples_per_second": 5.666, + "eval_wer": 0.4175257731958763, + "step": 34600 + }, + { + "epoch": 9.64, + "learning_rate": 9.807713682338558e-05, + "loss": 0.1574, + "step": 34700 + }, + { + "epoch": 9.64, + "eval_loss": 0.8786133527755737, + "eval_runtime": 17.691, + "eval_samples_per_second": 5.596, + "eval_wer": 0.4420103092783505, + "step": 34700 + }, + { + "epoch": 9.67, + "learning_rate": 9.807157941536068e-05, + "loss": 0.1572, + "step": 34800 + }, + { + "epoch": 9.67, + "eval_loss": 0.9068703055381775, + "eval_runtime": 17.5185, + "eval_samples_per_second": 5.651, + "eval_wer": 0.46005154639175255, + "step": 34800 + }, + { + "epoch": 9.7, + "learning_rate": 9.806602200733578e-05, + "loss": 0.1644, + "step": 34900 + }, + { + "epoch": 9.7, + "eval_loss": 0.7928957939147949, + "eval_runtime": 17.6768, + "eval_samples_per_second": 5.601, + "eval_wer": 0.452319587628866, + "step": 34900 + }, + { + "epoch": 9.72, + "learning_rate": 9.806046459931088e-05, + "loss": 0.1592, + "step": 35000 + }, + { + "epoch": 9.72, + "eval_loss": 0.7851370573043823, + "eval_runtime": 17.4073, + "eval_samples_per_second": 5.687, + "eval_wer": 0.42783505154639173, + "step": 35000 + }, + { + "epoch": 9.75, + "learning_rate": 9.8054907191286e-05, + "loss": 0.1419, + "step": 35100 + }, + { + "epoch": 9.75, + "eval_loss": 0.7190160155296326, + "eval_runtime": 17.1768, + "eval_samples_per_second": 5.764, + "eval_wer": 0.42783505154639173, + "step": 35100 + }, + { + "epoch": 9.78, + "learning_rate": 9.80493497832611e-05, + "loss": 0.1658, + "step": 35200 + }, + { + "epoch": 9.78, + "eval_loss": 0.7918796539306641, + "eval_runtime": 17.3718, + "eval_samples_per_second": 5.699, + "eval_wer": 0.422680412371134, + "step": 35200 + }, + { + "epoch": 9.81, + "learning_rate": 9.80437923752362e-05, + "loss": 0.1711, + "step": 35300 + }, + { + "epoch": 9.81, + "eval_loss": 0.8889212012290955, + "eval_runtime": 17.1156, + "eval_samples_per_second": 5.784, + "eval_wer": 0.4652061855670103, + "step": 35300 + }, + { + "epoch": 9.84, + "learning_rate": 9.80382349672113e-05, + "loss": 0.162, + "step": 35400 + }, + { + "epoch": 9.84, + "eval_loss": 0.9033122062683105, + "eval_runtime": 17.4865, + "eval_samples_per_second": 5.662, + "eval_wer": 0.43943298969072164, + "step": 35400 + }, + { + "epoch": 9.86, + "learning_rate": 9.803267755918641e-05, + "loss": 0.1599, + "step": 35500 + }, + { + "epoch": 9.86, + "eval_loss": 0.7897907495498657, + "eval_runtime": 17.0639, + "eval_samples_per_second": 5.802, + "eval_wer": 0.45103092783505155, + "step": 35500 + }, + { + "epoch": 9.89, + "learning_rate": 9.80271201511615e-05, + "loss": 0.136, + "step": 35600 + }, + { + "epoch": 9.89, + "eval_loss": 0.8795129060745239, + "eval_runtime": 18.3203, + "eval_samples_per_second": 5.404, + "eval_wer": 0.43943298969072164, + "step": 35600 + }, + { + "epoch": 9.92, + "learning_rate": 9.802156274313661e-05, + "loss": 0.1543, + "step": 35700 + }, + { + "epoch": 9.92, + "eval_loss": 0.940313994884491, + "eval_runtime": 17.5084, + "eval_samples_per_second": 5.654, + "eval_wer": 0.4497422680412371, + "step": 35700 + }, + { + "epoch": 9.95, + "learning_rate": 9.801600533511171e-05, + "loss": 0.1531, + "step": 35800 + }, + { + "epoch": 9.95, + "eval_loss": 0.9860208034515381, + "eval_runtime": 17.6284, + "eval_samples_per_second": 5.616, + "eval_wer": 0.4484536082474227, + "step": 35800 + }, + { + "epoch": 9.97, + "learning_rate": 9.801044792708681e-05, + "loss": 0.1537, + "step": 35900 + }, + { + "epoch": 9.97, + "eval_loss": 0.910431444644928, + "eval_runtime": 17.5953, + "eval_samples_per_second": 5.626, + "eval_wer": 0.45489690721649484, + "step": 35900 + }, + { + "epoch": 10.0, + "learning_rate": 9.800489051906191e-05, + "loss": 0.1525, + "step": 36000 + }, + { + "epoch": 10.0, + "eval_loss": 0.9185177087783813, + "eval_runtime": 17.5837, + "eval_samples_per_second": 5.63, + "eval_wer": 0.4381443298969072, + "step": 36000 + }, + { + "epoch": 10.03, + "learning_rate": 9.799933311103701e-05, + "loss": 0.1323, + "step": 36100 + }, + { + "epoch": 10.03, + "eval_loss": 0.9509208798408508, + "eval_runtime": 17.3541, + "eval_samples_per_second": 5.705, + "eval_wer": 0.4265463917525773, + "step": 36100 + }, + { + "epoch": 10.06, + "learning_rate": 9.799377570301213e-05, + "loss": 0.1411, + "step": 36200 + }, + { + "epoch": 10.06, + "eval_loss": 0.9488706588745117, + "eval_runtime": 17.624, + "eval_samples_per_second": 5.617, + "eval_wer": 0.4420103092783505, + "step": 36200 + }, + { + "epoch": 10.09, + "learning_rate": 9.798821829498723e-05, + "loss": 0.1376, + "step": 36300 + }, + { + "epoch": 10.09, + "eval_loss": 0.9858886003494263, + "eval_runtime": 17.6205, + "eval_samples_per_second": 5.618, + "eval_wer": 0.47164948453608246, + "step": 36300 + }, + { + "epoch": 10.11, + "learning_rate": 9.798266088696233e-05, + "loss": 0.1711, + "step": 36400 + }, + { + "epoch": 10.11, + "eval_loss": 0.9317906498908997, + "eval_runtime": 17.6122, + "eval_samples_per_second": 5.621, + "eval_wer": 0.4587628865979381, + "step": 36400 + }, + { + "epoch": 10.14, + "learning_rate": 9.797710347893743e-05, + "loss": 0.138, + "step": 36500 + }, + { + "epoch": 10.14, + "eval_loss": 1.0478296279907227, + "eval_runtime": 17.614, + "eval_samples_per_second": 5.621, + "eval_wer": 0.45618556701030927, + "step": 36500 + }, + { + "epoch": 10.17, + "learning_rate": 9.797154607091253e-05, + "loss": 0.1456, + "step": 36600 + }, + { + "epoch": 10.17, + "eval_loss": 0.9326837062835693, + "eval_runtime": 17.7144, + "eval_samples_per_second": 5.589, + "eval_wer": 0.44587628865979384, + "step": 36600 + }, + { + "epoch": 10.2, + "learning_rate": 9.796598866288763e-05, + "loss": 0.1486, + "step": 36700 + }, + { + "epoch": 10.2, + "eval_loss": 0.9639229774475098, + "eval_runtime": 17.5424, + "eval_samples_per_second": 5.643, + "eval_wer": 0.44072164948453607, + "step": 36700 + }, + { + "epoch": 10.23, + "learning_rate": 9.796043125486274e-05, + "loss": 0.1385, + "step": 36800 + }, + { + "epoch": 10.23, + "eval_loss": 0.9051303863525391, + "eval_runtime": 17.5669, + "eval_samples_per_second": 5.636, + "eval_wer": 0.4329896907216495, + "step": 36800 + }, + { + "epoch": 10.25, + "learning_rate": 9.795487384683783e-05, + "loss": 0.1397, + "step": 36900 + }, + { + "epoch": 10.25, + "eval_loss": 0.9713443517684937, + "eval_runtime": 17.6453, + "eval_samples_per_second": 5.611, + "eval_wer": 0.4497422680412371, + "step": 36900 + }, + { + "epoch": 10.28, + "learning_rate": 9.794931643881294e-05, + "loss": 0.155, + "step": 37000 + }, + { + "epoch": 10.28, + "eval_loss": 0.9461785554885864, + "eval_runtime": 17.6547, + "eval_samples_per_second": 5.608, + "eval_wer": 0.44587628865979384, + "step": 37000 + }, + { + "epoch": 10.31, + "learning_rate": 9.794375903078805e-05, + "loss": 0.1484, + "step": 37100 + }, + { + "epoch": 10.31, + "eval_loss": 1.0771350860595703, + "eval_runtime": 17.4288, + "eval_samples_per_second": 5.68, + "eval_wer": 0.43943298969072164, + "step": 37100 + }, + { + "epoch": 10.34, + "learning_rate": 9.793820162276315e-05, + "loss": 0.134, + "step": 37200 + }, + { + "epoch": 10.34, + "eval_loss": 0.9590903520584106, + "eval_runtime": 17.6468, + "eval_samples_per_second": 5.61, + "eval_wer": 0.4265463917525773, + "step": 37200 + }, + { + "epoch": 10.36, + "learning_rate": 9.793264421473826e-05, + "loss": 0.1372, + "step": 37300 + }, + { + "epoch": 10.36, + "eval_loss": 0.9968072772026062, + "eval_runtime": 17.5496, + "eval_samples_per_second": 5.641, + "eval_wer": 0.43427835051546393, + "step": 37300 + }, + { + "epoch": 10.39, + "learning_rate": 9.792708680671335e-05, + "loss": 0.1412, + "step": 37400 + }, + { + "epoch": 10.39, + "eval_loss": 0.921562910079956, + "eval_runtime": 17.5184, + "eval_samples_per_second": 5.651, + "eval_wer": 0.4574742268041237, + "step": 37400 + }, + { + "epoch": 10.42, + "learning_rate": 9.792152939868846e-05, + "loss": 0.134, + "step": 37500 + }, + { + "epoch": 10.42, + "eval_loss": 0.9161884784698486, + "eval_runtime": 17.7692, + "eval_samples_per_second": 5.571, + "eval_wer": 0.46649484536082475, + "step": 37500 + }, + { + "epoch": 10.45, + "learning_rate": 9.791597199066356e-05, + "loss": 0.1467, + "step": 37600 + }, + { + "epoch": 10.45, + "eval_loss": 0.9519623517990112, + "eval_runtime": 17.501, + "eval_samples_per_second": 5.657, + "eval_wer": 0.44458762886597936, + "step": 37600 + }, + { + "epoch": 10.48, + "learning_rate": 9.791041458263866e-05, + "loss": 0.1297, + "step": 37700 + }, + { + "epoch": 10.48, + "eval_loss": 0.9233236312866211, + "eval_runtime": 17.6622, + "eval_samples_per_second": 5.605, + "eval_wer": 0.44458762886597936, + "step": 37700 + }, + { + "epoch": 10.5, + "learning_rate": 9.790485717461376e-05, + "loss": 0.1428, + "step": 37800 + }, + { + "epoch": 10.5, + "eval_loss": 0.9528768658638, + "eval_runtime": 17.5775, + "eval_samples_per_second": 5.632, + "eval_wer": 0.44329896907216493, + "step": 37800 + }, + { + "epoch": 10.53, + "learning_rate": 9.789929976658888e-05, + "loss": 0.1499, + "step": 37900 + }, + { + "epoch": 10.53, + "eval_loss": 0.8795115351676941, + "eval_runtime": 17.4947, + "eval_samples_per_second": 5.659, + "eval_wer": 0.45489690721649484, + "step": 37900 + }, + { + "epoch": 10.56, + "learning_rate": 9.789374235856396e-05, + "loss": 0.1492, + "step": 38000 + }, + { + "epoch": 10.56, + "eval_loss": 0.9267066121101379, + "eval_runtime": 17.6159, + "eval_samples_per_second": 5.62, + "eval_wer": 0.45103092783505155, + "step": 38000 + }, + { + "epoch": 10.59, + "learning_rate": 9.788818495053908e-05, + "loss": 0.1476, + "step": 38100 + }, + { + "epoch": 10.59, + "eval_loss": 0.9196488261222839, + "eval_runtime": 17.564, + "eval_samples_per_second": 5.637, + "eval_wer": 0.4690721649484536, + "step": 38100 + }, + { + "epoch": 10.61, + "learning_rate": 9.788262754251416e-05, + "loss": 0.1398, + "step": 38200 + }, + { + "epoch": 10.61, + "eval_loss": 0.928520143032074, + "eval_runtime": 17.5698, + "eval_samples_per_second": 5.635, + "eval_wer": 0.46005154639175255, + "step": 38200 + }, + { + "epoch": 10.64, + "learning_rate": 9.787707013448928e-05, + "loss": 0.1512, + "step": 38300 + }, + { + "epoch": 10.64, + "eval_loss": 0.840891420841217, + "eval_runtime": 17.5719, + "eval_samples_per_second": 5.634, + "eval_wer": 0.43556701030927836, + "step": 38300 + }, + { + "epoch": 10.67, + "learning_rate": 9.787151272646439e-05, + "loss": 0.1627, + "step": 38400 + }, + { + "epoch": 10.67, + "eval_loss": 0.8385064601898193, + "eval_runtime": 17.6499, + "eval_samples_per_second": 5.609, + "eval_wer": 0.44716494845360827, + "step": 38400 + }, + { + "epoch": 10.7, + "learning_rate": 9.786595531843948e-05, + "loss": 0.1418, + "step": 38500 + }, + { + "epoch": 10.7, + "eval_loss": 0.8606293797492981, + "eval_runtime": 17.9059, + "eval_samples_per_second": 5.529, + "eval_wer": 0.44329896907216493, + "step": 38500 + }, + { + "epoch": 10.73, + "learning_rate": 9.78603979104146e-05, + "loss": 0.1587, + "step": 38600 + }, + { + "epoch": 10.73, + "eval_loss": 0.776897132396698, + "eval_runtime": 17.5532, + "eval_samples_per_second": 5.64, + "eval_wer": 0.45103092783505155, + "step": 38600 + }, + { + "epoch": 10.75, + "learning_rate": 9.78548405023897e-05, + "loss": 0.1416, + "step": 38700 + }, + { + "epoch": 10.75, + "eval_loss": 0.7967720627784729, + "eval_runtime": 17.409, + "eval_samples_per_second": 5.687, + "eval_wer": 0.4420103092783505, + "step": 38700 + }, + { + "epoch": 10.78, + "learning_rate": 9.78492830943648e-05, + "loss": 0.1651, + "step": 38800 + }, + { + "epoch": 10.78, + "eval_loss": 0.8126049637794495, + "eval_runtime": 17.6952, + "eval_samples_per_second": 5.595, + "eval_wer": 0.4368556701030928, + "step": 38800 + }, + { + "epoch": 10.81, + "learning_rate": 9.78437256863399e-05, + "loss": 0.1439, + "step": 38900 + }, + { + "epoch": 10.81, + "eval_loss": 0.8487725853919983, + "eval_runtime": 17.6223, + "eval_samples_per_second": 5.618, + "eval_wer": 0.4252577319587629, + "step": 38900 + }, + { + "epoch": 10.84, + "learning_rate": 9.7838168278315e-05, + "loss": 0.129, + "step": 39000 + }, + { + "epoch": 10.84, + "eval_loss": 0.9903653860092163, + "eval_runtime": 17.4638, + "eval_samples_per_second": 5.669, + "eval_wer": 0.43556701030927836, + "step": 39000 + }, + { + "epoch": 10.86, + "learning_rate": 9.78326108702901e-05, + "loss": 0.1299, + "step": 39100 + }, + { + "epoch": 10.86, + "eval_loss": 0.9441640973091125, + "eval_runtime": 17.6194, + "eval_samples_per_second": 5.619, + "eval_wer": 0.4381443298969072, + "step": 39100 + }, + { + "epoch": 10.89, + "learning_rate": 9.782705346226521e-05, + "loss": 0.1521, + "step": 39200 + }, + { + "epoch": 10.89, + "eval_loss": 0.9177586436271667, + "eval_runtime": 17.6014, + "eval_samples_per_second": 5.625, + "eval_wer": 0.452319587628866, + "step": 39200 + }, + { + "epoch": 10.92, + "learning_rate": 9.78214960542403e-05, + "loss": 0.1651, + "step": 39300 + }, + { + "epoch": 10.92, + "eval_loss": 0.7855709195137024, + "eval_runtime": 17.36, + "eval_samples_per_second": 5.703, + "eval_wer": 0.4484536082474227, + "step": 39300 + }, + { + "epoch": 10.95, + "learning_rate": 9.781593864621541e-05, + "loss": 0.16, + "step": 39400 + }, + { + "epoch": 10.95, + "eval_loss": 0.8589774370193481, + "eval_runtime": 17.4597, + "eval_samples_per_second": 5.67, + "eval_wer": 0.44587628865979384, + "step": 39400 + }, + { + "epoch": 10.98, + "learning_rate": 9.781038123819051e-05, + "loss": 0.1551, + "step": 39500 + }, + { + "epoch": 10.98, + "eval_loss": 0.8536927103996277, + "eval_runtime": 17.5722, + "eval_samples_per_second": 5.634, + "eval_wer": 0.4574742268041237, + "step": 39500 + }, + { + "epoch": 11.0, + "learning_rate": 9.780482383016561e-05, + "loss": 0.1656, + "step": 39600 + }, + { + "epoch": 11.0, + "eval_loss": 0.7709180116653442, + "eval_runtime": 17.5544, + "eval_samples_per_second": 5.64, + "eval_wer": 0.45103092783505155, + "step": 39600 + }, + { + "epoch": 11.03, + "learning_rate": 9.779926642214073e-05, + "loss": 0.1348, + "step": 39700 + }, + { + "epoch": 11.03, + "eval_loss": 0.8829686045646667, + "eval_runtime": 17.4954, + "eval_samples_per_second": 5.659, + "eval_wer": 0.43556701030927836, + "step": 39700 + }, + { + "epoch": 11.06, + "learning_rate": 9.779370901411581e-05, + "loss": 0.1344, + "step": 39800 + }, + { + "epoch": 11.06, + "eval_loss": 0.8350869417190552, + "eval_runtime": 17.6252, + "eval_samples_per_second": 5.617, + "eval_wer": 0.44716494845360827, + "step": 39800 + }, + { + "epoch": 11.09, + "learning_rate": 9.778815160609093e-05, + "loss": 0.1484, + "step": 39900 + }, + { + "epoch": 11.09, + "eval_loss": 0.8020666241645813, + "eval_runtime": 17.8124, + "eval_samples_per_second": 5.558, + "eval_wer": 0.4484536082474227, + "step": 39900 + }, + { + "epoch": 11.11, + "learning_rate": 9.778259419806603e-05, + "loss": 0.1294, + "step": 40000 + }, + { + "epoch": 11.11, + "eval_loss": 0.8609241247177124, + "eval_runtime": 17.6098, + "eval_samples_per_second": 5.622, + "eval_wer": 0.44329896907216493, + "step": 40000 + }, + { + "epoch": 11.14, + "learning_rate": 9.777703679004113e-05, + "loss": 0.1339, + "step": 40100 + }, + { + "epoch": 11.14, + "eval_loss": 0.9225992560386658, + "eval_runtime": 18.105, + "eval_samples_per_second": 5.468, + "eval_wer": 0.4652061855670103, + "step": 40100 + }, + { + "epoch": 11.17, + "learning_rate": 9.777147938201623e-05, + "loss": 0.1405, + "step": 40200 + }, + { + "epoch": 11.17, + "eval_loss": 0.8729308247566223, + "eval_runtime": 17.978, + "eval_samples_per_second": 5.507, + "eval_wer": 0.4484536082474227, + "step": 40200 + }, + { + "epoch": 11.2, + "learning_rate": 9.776592197399133e-05, + "loss": 0.1463, + "step": 40300 + }, + { + "epoch": 11.2, + "eval_loss": 0.8339123725891113, + "eval_runtime": 17.6199, + "eval_samples_per_second": 5.619, + "eval_wer": 0.45103092783505155, + "step": 40300 + }, + { + "epoch": 11.23, + "learning_rate": 9.776036456596643e-05, + "loss": 0.1476, + "step": 40400 + }, + { + "epoch": 11.23, + "eval_loss": 0.8812620639801025, + "eval_runtime": 17.7803, + "eval_samples_per_second": 5.568, + "eval_wer": 0.45618556701030927, + "step": 40400 + }, + { + "epoch": 11.25, + "learning_rate": 9.775480715794154e-05, + "loss": 0.1436, + "step": 40500 + }, + { + "epoch": 11.25, + "eval_loss": 0.8837606906890869, + "eval_runtime": 17.5897, + "eval_samples_per_second": 5.628, + "eval_wer": 0.45618556701030927, + "step": 40500 + }, + { + "epoch": 11.28, + "learning_rate": 9.774924974991663e-05, + "loss": 0.1536, + "step": 40600 + }, + { + "epoch": 11.28, + "eval_loss": 0.8110833168029785, + "eval_runtime": 17.6617, + "eval_samples_per_second": 5.605, + "eval_wer": 0.47680412371134023, + "step": 40600 + }, + { + "epoch": 11.31, + "learning_rate": 9.774369234189175e-05, + "loss": 0.1281, + "step": 40700 + }, + { + "epoch": 11.31, + "eval_loss": 0.9150132536888123, + "eval_runtime": 17.6707, + "eval_samples_per_second": 5.602, + "eval_wer": 0.4639175257731959, + "step": 40700 + }, + { + "epoch": 11.34, + "learning_rate": 9.773813493386686e-05, + "loss": 0.1399, + "step": 40800 + }, + { + "epoch": 11.34, + "eval_loss": 0.8512896299362183, + "eval_runtime": 17.4246, + "eval_samples_per_second": 5.682, + "eval_wer": 0.46005154639175255, + "step": 40800 + }, + { + "epoch": 11.36, + "learning_rate": 9.773257752584195e-05, + "loss": 0.133, + "step": 40900 + }, + { + "epoch": 11.36, + "eval_loss": 0.8384860754013062, + "eval_runtime": 17.5781, + "eval_samples_per_second": 5.632, + "eval_wer": 0.45489690721649484, + "step": 40900 + }, + { + "epoch": 11.39, + "learning_rate": 9.772702011781706e-05, + "loss": 0.1477, + "step": 41000 + }, + { + "epoch": 11.39, + "eval_loss": 0.8938087821006775, + "eval_runtime": 17.8894, + "eval_samples_per_second": 5.534, + "eval_wer": 0.4484536082474227, + "step": 41000 + }, + { + "epoch": 11.42, + "learning_rate": 9.772146270979216e-05, + "loss": 0.1478, + "step": 41100 + }, + { + "epoch": 11.42, + "eval_loss": 0.8160294890403748, + "eval_runtime": 17.6392, + "eval_samples_per_second": 5.613, + "eval_wer": 0.46005154639175255, + "step": 41100 + }, + { + "epoch": 11.45, + "learning_rate": 9.771590530176726e-05, + "loss": 0.1505, + "step": 41200 + }, + { + "epoch": 11.45, + "eval_loss": 0.7812536358833313, + "eval_runtime": 17.5733, + "eval_samples_per_second": 5.634, + "eval_wer": 0.46262886597938147, + "step": 41200 + }, + { + "epoch": 11.48, + "learning_rate": 9.771034789374236e-05, + "loss": 0.1545, + "step": 41300 + }, + { + "epoch": 11.48, + "eval_loss": 0.8860114216804504, + "eval_runtime": 17.7418, + "eval_samples_per_second": 5.58, + "eval_wer": 0.47036082474226804, + "step": 41300 + }, + { + "epoch": 11.5, + "learning_rate": 9.770479048571746e-05, + "loss": 0.1266, + "step": 41400 + }, + { + "epoch": 11.5, + "eval_loss": 0.8299418091773987, + "eval_runtime": 17.8271, + "eval_samples_per_second": 5.553, + "eval_wer": 0.4587628865979381, + "step": 41400 + }, + { + "epoch": 11.53, + "learning_rate": 9.769923307769256e-05, + "loss": 0.1405, + "step": 41500 + }, + { + "epoch": 11.53, + "eval_loss": 0.7701277136802673, + "eval_runtime": 17.5493, + "eval_samples_per_second": 5.641, + "eval_wer": 0.44329896907216493, + "step": 41500 + }, + { + "epoch": 11.56, + "learning_rate": 9.769367566966768e-05, + "loss": 0.1499, + "step": 41600 + }, + { + "epoch": 11.56, + "eval_loss": 0.7627600431442261, + "eval_runtime": 17.7427, + "eval_samples_per_second": 5.58, + "eval_wer": 0.45103092783505155, + "step": 41600 + }, + { + "epoch": 11.59, + "learning_rate": 9.768811826164276e-05, + "loss": 0.1362, + "step": 41700 + }, + { + "epoch": 11.59, + "eval_loss": 0.8455436825752258, + "eval_runtime": 17.8944, + "eval_samples_per_second": 5.532, + "eval_wer": 0.44458762886597936, + "step": 41700 + }, + { + "epoch": 11.61, + "learning_rate": 9.768256085361788e-05, + "loss": 0.1539, + "step": 41800 + }, + { + "epoch": 11.61, + "eval_loss": 0.7182540893554688, + "eval_runtime": 17.7016, + "eval_samples_per_second": 5.593, + "eval_wer": 0.44072164948453607, + "step": 41800 + }, + { + "epoch": 11.64, + "learning_rate": 9.767700344559298e-05, + "loss": 0.1471, + "step": 41900 + }, + { + "epoch": 11.64, + "eval_loss": 0.6807606816291809, + "eval_runtime": 17.7241, + "eval_samples_per_second": 5.586, + "eval_wer": 0.42783505154639173, + "step": 41900 + }, + { + "epoch": 11.67, + "learning_rate": 9.767144603756808e-05, + "loss": 0.135, + "step": 42000 + }, + { + "epoch": 11.67, + "eval_loss": 0.8377964496612549, + "eval_runtime": 17.7805, + "eval_samples_per_second": 5.568, + "eval_wer": 0.43556701030927836, + "step": 42000 + }, + { + "epoch": 11.7, + "learning_rate": 9.76658886295432e-05, + "loss": 0.1406, + "step": 42100 + }, + { + "epoch": 11.7, + "eval_loss": 0.8310317397117615, + "eval_runtime": 17.8675, + "eval_samples_per_second": 5.541, + "eval_wer": 0.4536082474226804, + "step": 42100 + }, + { + "epoch": 11.73, + "learning_rate": 9.766033122151828e-05, + "loss": 0.1544, + "step": 42200 + }, + { + "epoch": 11.73, + "eval_loss": 0.8470320105552673, + "eval_runtime": 17.6266, + "eval_samples_per_second": 5.617, + "eval_wer": 0.45618556701030927, + "step": 42200 + }, + { + "epoch": 11.75, + "learning_rate": 9.76547738134934e-05, + "loss": 0.1445, + "step": 42300 + }, + { + "epoch": 11.75, + "eval_loss": 0.9373657703399658, + "eval_runtime": 17.6007, + "eval_samples_per_second": 5.625, + "eval_wer": 0.44458762886597936, + "step": 42300 + }, + { + "epoch": 11.78, + "learning_rate": 9.76492164054685e-05, + "loss": 0.1409, + "step": 42400 + }, + { + "epoch": 11.78, + "eval_loss": 0.9654198884963989, + "eval_runtime": 17.6901, + "eval_samples_per_second": 5.596, + "eval_wer": 0.452319587628866, + "step": 42400 + }, + { + "epoch": 11.81, + "learning_rate": 9.76436589974436e-05, + "loss": 0.1332, + "step": 42500 + }, + { + "epoch": 11.81, + "eval_loss": 0.8946043252944946, + "eval_runtime": 17.6063, + "eval_samples_per_second": 5.623, + "eval_wer": 0.43427835051546393, + "step": 42500 + }, + { + "epoch": 11.84, + "learning_rate": 9.76381015894187e-05, + "loss": 0.1525, + "step": 42600 + }, + { + "epoch": 11.84, + "eval_loss": 1.005324363708496, + "eval_runtime": 17.5394, + "eval_samples_per_second": 5.644, + "eval_wer": 0.45103092783505155, + "step": 42600 + }, + { + "epoch": 11.86, + "learning_rate": 9.76325441813938e-05, + "loss": 0.1331, + "step": 42700 + }, + { + "epoch": 11.86, + "eval_loss": 0.7600377202033997, + "eval_runtime": 17.3487, + "eval_samples_per_second": 5.706, + "eval_wer": 0.42912371134020616, + "step": 42700 + }, + { + "epoch": 11.89, + "learning_rate": 9.76269867733689e-05, + "loss": 0.1375, + "step": 42800 + }, + { + "epoch": 11.89, + "eval_loss": 0.9018005132675171, + "eval_runtime": 17.6205, + "eval_samples_per_second": 5.618, + "eval_wer": 0.42783505154639173, + "step": 42800 + }, + { + "epoch": 11.92, + "learning_rate": 9.762142936534401e-05, + "loss": 0.1654, + "step": 42900 + }, + { + "epoch": 11.92, + "eval_loss": 0.8960022330284119, + "eval_runtime": 17.6311, + "eval_samples_per_second": 5.615, + "eval_wer": 0.4368556701030928, + "step": 42900 + }, + { + "epoch": 11.95, + "learning_rate": 9.761587195731911e-05, + "loss": 0.1514, + "step": 43000 + }, + { + "epoch": 11.95, + "eval_loss": 0.9692587852478027, + "eval_runtime": 17.8495, + "eval_samples_per_second": 5.546, + "eval_wer": 0.43041237113402064, + "step": 43000 + }, + { + "epoch": 11.98, + "learning_rate": 9.761031454929421e-05, + "loss": 0.1396, + "step": 43100 + }, + { + "epoch": 11.98, + "eval_loss": 1.0123811960220337, + "eval_runtime": 17.4191, + "eval_samples_per_second": 5.683, + "eval_wer": 0.44587628865979384, + "step": 43100 + }, + { + "epoch": 12.0, + "learning_rate": 9.760475714126933e-05, + "loss": 0.1542, + "step": 43200 + }, + { + "epoch": 12.0, + "eval_loss": 1.1317671537399292, + "eval_runtime": 17.8602, + "eval_samples_per_second": 5.543, + "eval_wer": 0.43556701030927836, + "step": 43200 + }, + { + "epoch": 12.03, + "learning_rate": 9.759919973324441e-05, + "loss": 0.1317, + "step": 43300 + }, + { + "epoch": 12.03, + "eval_loss": 0.9830509424209595, + "eval_runtime": 17.6547, + "eval_samples_per_second": 5.608, + "eval_wer": 0.4536082474226804, + "step": 43300 + }, + { + "epoch": 12.06, + "learning_rate": 9.759364232521953e-05, + "loss": 0.1245, + "step": 43400 + }, + { + "epoch": 12.06, + "eval_loss": 0.8731426000595093, + "eval_runtime": 17.5203, + "eval_samples_per_second": 5.651, + "eval_wer": 0.44329896907216493, + "step": 43400 + }, + { + "epoch": 12.09, + "learning_rate": 9.758808491719462e-05, + "loss": 0.1514, + "step": 43500 + }, + { + "epoch": 12.09, + "eval_loss": 0.9377870559692383, + "eval_runtime": 17.9338, + "eval_samples_per_second": 5.52, + "eval_wer": 0.452319587628866, + "step": 43500 + }, + { + "epoch": 12.11, + "learning_rate": 9.758252750916973e-05, + "loss": 0.1446, + "step": 43600 + }, + { + "epoch": 12.11, + "eval_loss": 0.7838338017463684, + "eval_runtime": 17.4422, + "eval_samples_per_second": 5.676, + "eval_wer": 0.42783505154639173, + "step": 43600 + }, + { + "epoch": 12.14, + "learning_rate": 9.757697010114483e-05, + "loss": 0.121, + "step": 43700 + }, + { + "epoch": 12.14, + "eval_loss": 0.9419594407081604, + "eval_runtime": 17.4214, + "eval_samples_per_second": 5.683, + "eval_wer": 0.43943298969072164, + "step": 43700 + }, + { + "epoch": 12.17, + "learning_rate": 9.757141269311993e-05, + "loss": 0.1423, + "step": 43800 + }, + { + "epoch": 12.17, + "eval_loss": 1.0655540227890015, + "eval_runtime": 17.57, + "eval_samples_per_second": 5.635, + "eval_wer": 0.4574742268041237, + "step": 43800 + }, + { + "epoch": 12.2, + "learning_rate": 9.756585528509503e-05, + "loss": 0.1337, + "step": 43900 + }, + { + "epoch": 12.2, + "eval_loss": 0.8492249250411987, + "eval_runtime": 17.7159, + "eval_samples_per_second": 5.588, + "eval_wer": 0.44716494845360827, + "step": 43900 + }, + { + "epoch": 12.23, + "learning_rate": 9.756029787707015e-05, + "loss": 0.1456, + "step": 44000 + }, + { + "epoch": 12.23, + "eval_loss": 0.9107276201248169, + "eval_runtime": 17.6083, + "eval_samples_per_second": 5.622, + "eval_wer": 0.47036082474226804, + "step": 44000 + }, + { + "epoch": 12.25, + "learning_rate": 9.755474046904525e-05, + "loss": 0.1489, + "step": 44100 + }, + { + "epoch": 12.25, + "eval_loss": 0.7715519070625305, + "eval_runtime": 17.578, + "eval_samples_per_second": 5.632, + "eval_wer": 0.44716494845360827, + "step": 44100 + }, + { + "epoch": 12.28, + "learning_rate": 9.754918306102035e-05, + "loss": 0.1377, + "step": 44200 + }, + { + "epoch": 12.28, + "eval_loss": 0.7675387263298035, + "eval_runtime": 17.6393, + "eval_samples_per_second": 5.612, + "eval_wer": 0.452319587628866, + "step": 44200 + }, + { + "epoch": 12.31, + "learning_rate": 9.754362565299545e-05, + "loss": 0.1372, + "step": 44300 + }, + { + "epoch": 12.31, + "eval_loss": 0.8274447321891785, + "eval_runtime": 18.0346, + "eval_samples_per_second": 5.489, + "eval_wer": 0.45103092783505155, + "step": 44300 + }, + { + "epoch": 12.34, + "learning_rate": 9.753806824497055e-05, + "loss": 0.1293, + "step": 44400 + }, + { + "epoch": 12.34, + "eval_loss": 0.7182275652885437, + "eval_runtime": 17.8809, + "eval_samples_per_second": 5.537, + "eval_wer": 0.44458762886597936, + "step": 44400 + }, + { + "epoch": 12.36, + "learning_rate": 9.753251083694566e-05, + "loss": 0.1372, + "step": 44500 + }, + { + "epoch": 12.36, + "eval_loss": 0.7243654727935791, + "eval_runtime": 17.4045, + "eval_samples_per_second": 5.688, + "eval_wer": 0.4484536082474227, + "step": 44500 + }, + { + "epoch": 12.39, + "learning_rate": 9.752695342892075e-05, + "loss": 0.137, + "step": 44600 + }, + { + "epoch": 12.39, + "eval_loss": 0.9591490030288696, + "eval_runtime": 17.8398, + "eval_samples_per_second": 5.549, + "eval_wer": 0.44716494845360827, + "step": 44600 + }, + { + "epoch": 12.42, + "learning_rate": 9.752139602089586e-05, + "loss": 0.1402, + "step": 44700 + }, + { + "epoch": 12.42, + "eval_loss": 0.8182889223098755, + "eval_runtime": 17.7667, + "eval_samples_per_second": 5.572, + "eval_wer": 0.44458762886597936, + "step": 44700 + }, + { + "epoch": 12.45, + "learning_rate": 9.751583861287096e-05, + "loss": 0.1433, + "step": 44800 + }, + { + "epoch": 12.45, + "eval_loss": 0.8458079099655151, + "eval_runtime": 17.7774, + "eval_samples_per_second": 5.569, + "eval_wer": 0.4587628865979381, + "step": 44800 + }, + { + "epoch": 12.48, + "learning_rate": 9.751028120484606e-05, + "loss": 0.1507, + "step": 44900 + }, + { + "epoch": 12.48, + "eval_loss": 0.7557888627052307, + "eval_runtime": 17.5593, + "eval_samples_per_second": 5.638, + "eval_wer": 0.43943298969072164, + "step": 44900 + }, + { + "epoch": 12.5, + "learning_rate": 9.750472379682116e-05, + "loss": 0.1364, + "step": 45000 + }, + { + "epoch": 12.5, + "eval_loss": 0.7761731147766113, + "eval_runtime": 17.2076, + "eval_samples_per_second": 5.753, + "eval_wer": 0.43170103092783507, + "step": 45000 + }, + { + "epoch": 12.53, + "learning_rate": 9.749916638879626e-05, + "loss": 0.1352, + "step": 45100 + }, + { + "epoch": 12.53, + "eval_loss": 0.8945127725601196, + "eval_runtime": 17.1857, + "eval_samples_per_second": 5.761, + "eval_wer": 0.4497422680412371, + "step": 45100 + }, + { + "epoch": 12.56, + "learning_rate": 9.749360898077138e-05, + "loss": 0.1617, + "step": 45200 + }, + { + "epoch": 12.56, + "eval_loss": 0.9693708419799805, + "eval_runtime": 17.6296, + "eval_samples_per_second": 5.616, + "eval_wer": 0.4497422680412371, + "step": 45200 + }, + { + "epoch": 12.59, + "learning_rate": 9.748805157274648e-05, + "loss": 0.1391, + "step": 45300 + }, + { + "epoch": 12.59, + "eval_loss": 0.8889138102531433, + "eval_runtime": 17.7851, + "eval_samples_per_second": 5.566, + "eval_wer": 0.45618556701030927, + "step": 45300 + }, + { + "epoch": 12.61, + "learning_rate": 9.748249416472158e-05, + "loss": 0.1356, + "step": 45400 + }, + { + "epoch": 12.61, + "eval_loss": 0.8959171175956726, + "eval_runtime": 18.0488, + "eval_samples_per_second": 5.485, + "eval_wer": 0.4574742268041237, + "step": 45400 + }, + { + "epoch": 12.64, + "learning_rate": 9.747693675669668e-05, + "loss": 0.1316, + "step": 45500 + }, + { + "epoch": 12.64, + "eval_loss": 0.9146299362182617, + "eval_runtime": 17.9338, + "eval_samples_per_second": 5.52, + "eval_wer": 0.4497422680412371, + "step": 45500 + }, + { + "epoch": 12.67, + "learning_rate": 9.747137934867178e-05, + "loss": 0.1398, + "step": 45600 + }, + { + "epoch": 12.67, + "eval_loss": 0.9133784174919128, + "eval_runtime": 17.7605, + "eval_samples_per_second": 5.574, + "eval_wer": 0.4587628865979381, + "step": 45600 + }, + { + "epoch": 12.7, + "learning_rate": 9.746582194064688e-05, + "loss": 0.1508, + "step": 45700 + }, + { + "epoch": 12.7, + "eval_loss": 1.0588983297348022, + "eval_runtime": 17.9533, + "eval_samples_per_second": 5.514, + "eval_wer": 0.45618556701030927, + "step": 45700 + }, + { + "epoch": 12.73, + "learning_rate": 9.7460264532622e-05, + "loss": 0.1404, + "step": 45800 + }, + { + "epoch": 12.73, + "eval_loss": 0.902584433555603, + "eval_runtime": 17.8614, + "eval_samples_per_second": 5.543, + "eval_wer": 0.44072164948453607, + "step": 45800 + }, + { + "epoch": 12.75, + "learning_rate": 9.745470712459708e-05, + "loss": 0.1375, + "step": 45900 + }, + { + "epoch": 12.75, + "eval_loss": 0.8664600849151611, + "eval_runtime": 18.0529, + "eval_samples_per_second": 5.484, + "eval_wer": 0.44458762886597936, + "step": 45900 + }, + { + "epoch": 12.78, + "learning_rate": 9.74491497165722e-05, + "loss": 0.1189, + "step": 46000 + }, + { + "epoch": 12.78, + "eval_loss": 0.8664206266403198, + "eval_runtime": 17.4467, + "eval_samples_per_second": 5.674, + "eval_wer": 0.44329896907216493, + "step": 46000 + }, + { + "epoch": 12.81, + "learning_rate": 9.74435923085473e-05, + "loss": 0.1285, + "step": 46100 + }, + { + "epoch": 12.81, + "eval_loss": 0.7403653264045715, + "eval_runtime": 17.6209, + "eval_samples_per_second": 5.618, + "eval_wer": 0.4420103092783505, + "step": 46100 + }, + { + "epoch": 12.84, + "learning_rate": 9.74380349005224e-05, + "loss": 0.1276, + "step": 46200 + }, + { + "epoch": 12.84, + "eval_loss": 0.8062552213668823, + "eval_runtime": 18.0006, + "eval_samples_per_second": 5.5, + "eval_wer": 0.4639175257731959, + "step": 46200 + }, + { + "epoch": 12.86, + "learning_rate": 9.743247749249751e-05, + "loss": 0.1404, + "step": 46300 + }, + { + "epoch": 12.86, + "eval_loss": 0.8171700239181519, + "eval_runtime": 17.6983, + "eval_samples_per_second": 5.594, + "eval_wer": 0.4690721649484536, + "step": 46300 + }, + { + "epoch": 12.89, + "learning_rate": 9.742692008447261e-05, + "loss": 0.1425, + "step": 46400 + }, + { + "epoch": 12.89, + "eval_loss": 0.8227722644805908, + "eval_runtime": 17.5604, + "eval_samples_per_second": 5.638, + "eval_wer": 0.45103092783505155, + "step": 46400 + }, + { + "epoch": 12.92, + "learning_rate": 9.742136267644771e-05, + "loss": 0.1366, + "step": 46500 + }, + { + "epoch": 12.92, + "eval_loss": 0.904529869556427, + "eval_runtime": 18.125, + "eval_samples_per_second": 5.462, + "eval_wer": 0.44458762886597936, + "step": 46500 + }, + { + "epoch": 12.95, + "learning_rate": 9.741580526842281e-05, + "loss": 0.1278, + "step": 46600 + }, + { + "epoch": 12.95, + "eval_loss": 0.8617892265319824, + "eval_runtime": 17.7415, + "eval_samples_per_second": 5.58, + "eval_wer": 0.4574742268041237, + "step": 46600 + }, + { + "epoch": 12.98, + "learning_rate": 9.741024786039791e-05, + "loss": 0.1359, + "step": 46700 + }, + { + "epoch": 12.98, + "eval_loss": 0.9559828639030457, + "eval_runtime": 17.6272, + "eval_samples_per_second": 5.616, + "eval_wer": 0.4742268041237113, + "step": 46700 + }, + { + "epoch": 13.0, + "learning_rate": 9.740469045237301e-05, + "loss": 0.139, + "step": 46800 + }, + { + "epoch": 13.0, + "eval_loss": 0.8375121355056763, + "eval_runtime": 17.6913, + "eval_samples_per_second": 5.596, + "eval_wer": 0.4587628865979381, + "step": 46800 + }, + { + "epoch": 13.03, + "learning_rate": 9.739913304434813e-05, + "loss": 0.1354, + "step": 46900 + }, + { + "epoch": 13.03, + "eval_loss": 0.8707177639007568, + "eval_runtime": 17.7257, + "eval_samples_per_second": 5.585, + "eval_wer": 0.46262886597938147, + "step": 46900 + }, + { + "epoch": 13.06, + "learning_rate": 9.739357563632322e-05, + "loss": 0.1175, + "step": 47000 + }, + { + "epoch": 13.06, + "eval_loss": 0.8792176842689514, + "eval_runtime": 17.6797, + "eval_samples_per_second": 5.6, + "eval_wer": 0.45489690721649484, + "step": 47000 + }, + { + "epoch": 13.09, + "learning_rate": 9.738801822829833e-05, + "loss": 0.137, + "step": 47100 + }, + { + "epoch": 13.09, + "eval_loss": 0.9775089025497437, + "eval_runtime": 17.5385, + "eval_samples_per_second": 5.645, + "eval_wer": 0.4574742268041237, + "step": 47100 + }, + { + "epoch": 13.11, + "learning_rate": 9.738246082027343e-05, + "loss": 0.1223, + "step": 47200 + }, + { + "epoch": 13.11, + "eval_loss": 1.057368516921997, + "eval_runtime": 17.6222, + "eval_samples_per_second": 5.618, + "eval_wer": 0.46005154639175255, + "step": 47200 + }, + { + "epoch": 13.14, + "learning_rate": 9.737690341224853e-05, + "loss": 0.12, + "step": 47300 + }, + { + "epoch": 13.14, + "eval_loss": 0.9751449227333069, + "eval_runtime": 18.8995, + "eval_samples_per_second": 5.238, + "eval_wer": 0.4690721649484536, + "step": 47300 + }, + { + "epoch": 13.17, + "learning_rate": 9.737134600422364e-05, + "loss": 0.1428, + "step": 47400 + }, + { + "epoch": 13.17, + "eval_loss": 0.9404999017715454, + "eval_runtime": 18.2253, + "eval_samples_per_second": 5.432, + "eval_wer": 0.4484536082474227, + "step": 47400 + }, + { + "epoch": 13.2, + "learning_rate": 9.736578859619873e-05, + "loss": 0.1241, + "step": 47500 + }, + { + "epoch": 13.2, + "eval_loss": 0.849004328250885, + "eval_runtime": 18.7361, + "eval_samples_per_second": 5.284, + "eval_wer": 0.43943298969072164, + "step": 47500 + }, + { + "epoch": 13.23, + "learning_rate": 9.736023118817385e-05, + "loss": 0.1182, + "step": 47600 + }, + { + "epoch": 13.23, + "eval_loss": 0.9481346607208252, + "eval_runtime": 18.3385, + "eval_samples_per_second": 5.398, + "eval_wer": 0.4381443298969072, + "step": 47600 + }, + { + "epoch": 13.25, + "learning_rate": 9.735467378014895e-05, + "loss": 0.1358, + "step": 47700 + }, + { + "epoch": 13.25, + "eval_loss": 0.8224361538887024, + "eval_runtime": 18.1961, + "eval_samples_per_second": 5.441, + "eval_wer": 0.4329896907216495, + "step": 47700 + }, + { + "epoch": 13.28, + "learning_rate": 9.734911637212405e-05, + "loss": 0.1396, + "step": 47800 + }, + { + "epoch": 13.28, + "eval_loss": 0.8473471403121948, + "eval_runtime": 17.9527, + "eval_samples_per_second": 5.514, + "eval_wer": 0.46005154639175255, + "step": 47800 + }, + { + "epoch": 13.31, + "learning_rate": 9.734355896409915e-05, + "loss": 0.1267, + "step": 47900 + }, + { + "epoch": 13.31, + "eval_loss": 0.9468744993209839, + "eval_runtime": 17.4889, + "eval_samples_per_second": 5.661, + "eval_wer": 0.44072164948453607, + "step": 47900 + }, + { + "epoch": 13.34, + "learning_rate": 9.733800155607425e-05, + "loss": 0.1252, + "step": 48000 + }, + { + "epoch": 13.34, + "eval_loss": 0.8264307379722595, + "eval_runtime": 18.0995, + "eval_samples_per_second": 5.47, + "eval_wer": 0.45103092783505155, + "step": 48000 + }, + { + "epoch": 13.36, + "learning_rate": 9.733244414804935e-05, + "loss": 0.1226, + "step": 48100 + }, + { + "epoch": 13.36, + "eval_loss": 0.8667508363723755, + "eval_runtime": 18.589, + "eval_samples_per_second": 5.326, + "eval_wer": 0.44716494845360827, + "step": 48100 + }, + { + "epoch": 13.39, + "learning_rate": 9.732688674002446e-05, + "loss": 0.1328, + "step": 48200 + }, + { + "epoch": 13.39, + "eval_loss": 0.8937565088272095, + "eval_runtime": 18.255, + "eval_samples_per_second": 5.423, + "eval_wer": 0.4536082474226804, + "step": 48200 + }, + { + "epoch": 13.42, + "learning_rate": 9.732132933199955e-05, + "loss": 0.1425, + "step": 48300 + }, + { + "epoch": 13.42, + "eval_loss": 0.9718654155731201, + "eval_runtime": 18.0435, + "eval_samples_per_second": 5.487, + "eval_wer": 0.4639175257731959, + "step": 48300 + }, + { + "epoch": 13.45, + "learning_rate": 9.731577192397466e-05, + "loss": 0.114, + "step": 48400 + }, + { + "epoch": 13.45, + "eval_loss": 0.9460931420326233, + "eval_runtime": 18.0945, + "eval_samples_per_second": 5.471, + "eval_wer": 0.46262886597938147, + "step": 48400 + }, + { + "epoch": 13.48, + "learning_rate": 9.731021451594976e-05, + "loss": 0.1425, + "step": 48500 + }, + { + "epoch": 13.48, + "eval_loss": 0.7326005697250366, + "eval_runtime": 17.9853, + "eval_samples_per_second": 5.504, + "eval_wer": 0.44587628865979384, + "step": 48500 + }, + { + "epoch": 13.5, + "learning_rate": 9.730465710792486e-05, + "loss": 0.1164, + "step": 48600 + }, + { + "epoch": 13.5, + "eval_loss": 0.7906768321990967, + "eval_runtime": 18.2994, + "eval_samples_per_second": 5.41, + "eval_wer": 0.4536082474226804, + "step": 48600 + }, + { + "epoch": 13.53, + "learning_rate": 9.729909969989998e-05, + "loss": 0.1334, + "step": 48700 + }, + { + "epoch": 13.53, + "eval_loss": 0.8335945010185242, + "eval_runtime": 18.0063, + "eval_samples_per_second": 5.498, + "eval_wer": 0.4536082474226804, + "step": 48700 + }, + { + "epoch": 13.56, + "learning_rate": 9.729354229187507e-05, + "loss": 0.1213, + "step": 48800 + }, + { + "epoch": 13.56, + "eval_loss": 1.0961216688156128, + "eval_runtime": 18.2967, + "eval_samples_per_second": 5.411, + "eval_wer": 0.4793814432989691, + "step": 48800 + }, + { + "epoch": 13.59, + "learning_rate": 9.728798488385018e-05, + "loss": 0.1186, + "step": 48900 + }, + { + "epoch": 13.59, + "eval_loss": 1.0261573791503906, + "eval_runtime": 17.874, + "eval_samples_per_second": 5.539, + "eval_wer": 0.47551546391752575, + "step": 48900 + }, + { + "epoch": 13.61, + "learning_rate": 9.728242747582528e-05, + "loss": 0.1313, + "step": 49000 + }, + { + "epoch": 13.61, + "eval_loss": 0.9995627403259277, + "eval_runtime": 17.8346, + "eval_samples_per_second": 5.551, + "eval_wer": 0.44716494845360827, + "step": 49000 + }, + { + "epoch": 13.64, + "learning_rate": 9.727687006780038e-05, + "loss": 0.1372, + "step": 49100 + }, + { + "epoch": 13.64, + "eval_loss": 1.0337309837341309, + "eval_runtime": 17.768, + "eval_samples_per_second": 5.572, + "eval_wer": 0.46005154639175255, + "step": 49100 + }, + { + "epoch": 13.67, + "learning_rate": 9.727131265977548e-05, + "loss": 0.1183, + "step": 49200 + }, + { + "epoch": 13.67, + "eval_loss": 0.9927868247032166, + "eval_runtime": 18.1061, + "eval_samples_per_second": 5.468, + "eval_wer": 0.48195876288659795, + "step": 49200 + }, + { + "epoch": 13.7, + "learning_rate": 9.72657552517506e-05, + "loss": 0.1167, + "step": 49300 + }, + { + "epoch": 13.7, + "eval_loss": 0.9940055012702942, + "eval_runtime": 17.6771, + "eval_samples_per_second": 5.6, + "eval_wer": 0.49097938144329895, + "step": 49300 + }, + { + "epoch": 13.73, + "learning_rate": 9.726019784372568e-05, + "loss": 0.1324, + "step": 49400 + }, + { + "epoch": 13.73, + "eval_loss": 0.9435777068138123, + "eval_runtime": 17.8591, + "eval_samples_per_second": 5.543, + "eval_wer": 0.4729381443298969, + "step": 49400 + }, + { + "epoch": 13.75, + "learning_rate": 9.72546404357008e-05, + "loss": 0.1353, + "step": 49500 + }, + { + "epoch": 13.75, + "eval_loss": 1.0063272714614868, + "eval_runtime": 17.8941, + "eval_samples_per_second": 5.533, + "eval_wer": 0.4961340206185567, + "step": 49500 + }, + { + "epoch": 13.78, + "learning_rate": 9.72490830276759e-05, + "loss": 0.1193, + "step": 49600 + }, + { + "epoch": 13.78, + "eval_loss": 0.9747934341430664, + "eval_runtime": 17.8823, + "eval_samples_per_second": 5.536, + "eval_wer": 0.46134020618556704, + "step": 49600 + }, + { + "epoch": 13.81, + "learning_rate": 9.7243525619651e-05, + "loss": 0.132, + "step": 49700 + }, + { + "epoch": 13.81, + "eval_loss": 1.1134113073349, + "eval_runtime": 17.6443, + "eval_samples_per_second": 5.611, + "eval_wer": 0.4536082474226804, + "step": 49700 + }, + { + "epoch": 13.84, + "learning_rate": 9.723796821162611e-05, + "loss": 0.1244, + "step": 49800 + }, + { + "epoch": 13.84, + "eval_loss": 0.9971640706062317, + "eval_runtime": 17.5696, + "eval_samples_per_second": 5.635, + "eval_wer": 0.48195876288659795, + "step": 49800 + }, + { + "epoch": 13.86, + "learning_rate": 9.72324108036012e-05, + "loss": 0.1502, + "step": 49900 + }, + { + "epoch": 13.86, + "eval_loss": 1.0188100337982178, + "eval_runtime": 17.5476, + "eval_samples_per_second": 5.642, + "eval_wer": 0.47164948453608246, + "step": 49900 + }, + { + "epoch": 13.89, + "learning_rate": 9.722685339557631e-05, + "loss": 0.1361, + "step": 50000 + }, + { + "epoch": 13.89, + "eval_loss": 1.0230387449264526, + "eval_runtime": 17.5085, + "eval_samples_per_second": 5.654, + "eval_wer": 0.46649484536082475, + "step": 50000 + }, + { + "epoch": 13.92, + "learning_rate": 9.722129598755141e-05, + "loss": 0.1449, + "step": 50100 + }, + { + "epoch": 13.92, + "eval_loss": 0.9599841833114624, + "eval_runtime": 17.6089, + "eval_samples_per_second": 5.622, + "eval_wer": 0.46262886597938147, + "step": 50100 + }, + { + "epoch": 13.95, + "learning_rate": 9.721573857952651e-05, + "loss": 0.1295, + "step": 50200 + }, + { + "epoch": 13.95, + "eval_loss": 1.113866925239563, + "eval_runtime": 17.8779, + "eval_samples_per_second": 5.538, + "eval_wer": 0.45489690721649484, + "step": 50200 + }, + { + "epoch": 13.98, + "learning_rate": 9.721018117150161e-05, + "loss": 0.1299, + "step": 50300 + }, + { + "epoch": 13.98, + "eval_loss": 0.9001206159591675, + "eval_runtime": 17.7999, + "eval_samples_per_second": 5.562, + "eval_wer": 0.46134020618556704, + "step": 50300 + }, + { + "epoch": 14.0, + "learning_rate": 9.720462376347672e-05, + "loss": 0.1217, + "step": 50400 + }, + { + "epoch": 14.0, + "eval_loss": 1.0081254243850708, + "eval_runtime": 17.6755, + "eval_samples_per_second": 5.601, + "eval_wer": 0.4690721649484536, + "step": 50400 + }, + { + "epoch": 14.03, + "learning_rate": 9.719906635545182e-05, + "loss": 0.1383, + "step": 50500 + }, + { + "epoch": 14.03, + "eval_loss": 0.9827317595481873, + "eval_runtime": 17.7559, + "eval_samples_per_second": 5.576, + "eval_wer": 0.4536082474226804, + "step": 50500 + }, + { + "epoch": 14.06, + "learning_rate": 9.719350894742693e-05, + "loss": 0.1154, + "step": 50600 + }, + { + "epoch": 14.06, + "eval_loss": 1.0788767337799072, + "eval_runtime": 17.8636, + "eval_samples_per_second": 5.542, + "eval_wer": 0.47164948453608246, + "step": 50600 + } + ], + "max_steps": 1799500, + "num_train_epochs": 500, + "total_flos": 2.6466141630383727e+19, + "trial_name": null, + "trial_params": null +}