diff --git "a/trainer_state.json" "b/trainer_state.json" new file mode 100644--- /dev/null +++ "b/trainer_state.json" @@ -0,0 +1,8476 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 14.999909559555032, + "global_step": 82920, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.02, + "eval_loss": 6.646472930908203, + "eval_runtime": 693.7508, + "eval_samples_per_second": 21.75, + "eval_steps_per_second": 2.72, + "eval_wer": 1.0, + "step": 100 + }, + { + "epoch": 0.04, + "eval_loss": 3.0149917602539062, + "eval_runtime": 593.4559, + "eval_samples_per_second": 25.426, + "eval_steps_per_second": 3.18, + "eval_wer": 1.0, + "step": 200 + }, + { + "epoch": 0.05, + "eval_loss": 2.8622469902038574, + "eval_runtime": 589.8045, + "eval_samples_per_second": 25.583, + "eval_steps_per_second": 3.199, + "eval_wer": 1.0003352779454167, + "step": 300 + }, + { + "epoch": 0.07, + "eval_loss": 0.9505894780158997, + "eval_runtime": 590.9695, + "eval_samples_per_second": 25.533, + "eval_steps_per_second": 3.193, + "eval_wer": 0.9770547966082064, + "step": 400 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002988, + "loss": 5.1598, + "step": 500 + }, + { + "epoch": 0.09, + "eval_loss": 0.4883461594581604, + "eval_runtime": 589.517, + "eval_samples_per_second": 25.596, + "eval_steps_per_second": 3.201, + "eval_wer": 1.0009143943965912, + "step": 500 + }, + { + "epoch": 0.11, + "eval_loss": 0.3893147110939026, + "eval_runtime": 590.0583, + "eval_samples_per_second": 25.572, + "eval_steps_per_second": 3.198, + "eval_wer": 1.0202507879031717, + "step": 600 + }, + { + "epoch": 0.13, + "eval_loss": 0.3416591286659241, + "eval_runtime": 591.5909, + "eval_samples_per_second": 25.506, + "eval_steps_per_second": 3.19, + "eval_wer": 1.0283218424437495, + "step": 700 + }, + { + "epoch": 0.14, + "eval_loss": 0.33519014716148376, + "eval_runtime": 589.9365, + "eval_samples_per_second": 25.577, + "eval_steps_per_second": 3.199, + "eval_wer": 1.033539986466963, + "step": 800 + }, + { + "epoch": 0.16, + "eval_loss": 0.29870787262916565, + "eval_runtime": 587.4241, + "eval_samples_per_second": 25.687, + "eval_steps_per_second": 3.212, + "eval_wer": 1.0167699932334815, + "step": 900 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029818733317156027, + "loss": 0.3671, + "step": 1000 + }, + { + "epoch": 0.18, + "eval_loss": 0.2921440303325653, + "eval_runtime": 590.6258, + "eval_samples_per_second": 25.547, + "eval_steps_per_second": 3.195, + "eval_wer": 1.0159104625006858, + "step": 1000 + }, + { + "epoch": 0.2, + "eval_loss": 0.27703604102134705, + "eval_runtime": 589.3558, + "eval_samples_per_second": 25.603, + "eval_steps_per_second": 3.202, + "eval_wer": 1.009595045201563, + "step": 1100 + }, + { + "epoch": 0.22, + "eval_loss": 0.2790297865867615, + "eval_runtime": 590.1481, + "eval_samples_per_second": 25.568, + "eval_steps_per_second": 3.198, + "eval_wer": 1.039812732027578, + "step": 1200 + }, + { + "epoch": 0.24, + "eval_loss": 0.2659136652946472, + "eval_runtime": 597.7345, + "eval_samples_per_second": 25.244, + "eval_steps_per_second": 3.157, + "eval_wer": 1.0189706357479442, + "step": 1300 + }, + { + "epoch": 0.25, + "eval_loss": 0.26571863889694214, + "eval_runtime": 588.3253, + "eval_samples_per_second": 25.647, + "eval_steps_per_second": 3.207, + "eval_wer": 1.0527727486085965, + "step": 1400 + }, + { + "epoch": 0.27, + "learning_rate": 0.000296367386556661, + "loss": 0.289, + "step": 1500 + }, + { + "epoch": 0.27, + "eval_loss": 0.25557756423950195, + "eval_runtime": 589.1568, + "eval_samples_per_second": 25.611, + "eval_steps_per_second": 3.203, + "eval_wer": 1.0300530958346288, + "step": 1500 + }, + { + "epoch": 0.29, + "eval_loss": 0.251380980014801, + "eval_runtime": 588.0098, + "eval_samples_per_second": 25.661, + "eval_steps_per_second": 3.209, + "eval_wer": 1.0192693379174973, + "step": 1600 + }, + { + "epoch": 0.31, + "eval_loss": 0.2708043158054352, + "eval_runtime": 587.7443, + "eval_samples_per_second": 25.673, + "eval_steps_per_second": 3.211, + "eval_wer": 1.0698658278622069, + "step": 1700 + }, + { + "epoch": 0.33, + "eval_loss": 0.2454645037651062, + "eval_runtime": 588.52, + "eval_samples_per_second": 25.639, + "eval_steps_per_second": 3.206, + "eval_wer": 1.0723468846582909, + "step": 1800 + }, + { + "epoch": 0.34, + "eval_loss": 0.2456223964691162, + "eval_runtime": 588.2037, + "eval_samples_per_second": 25.653, + "eval_steps_per_second": 3.208, + "eval_wer": 1.0099851868107752, + "step": 1900 + }, + { + "epoch": 0.36, + "learning_rate": 0.00029454743994176166, + "loss": 0.271, + "step": 2000 + }, + { + "epoch": 0.36, + "eval_loss": 0.23379947245121002, + "eval_runtime": 589.0243, + "eval_samples_per_second": 25.617, + "eval_steps_per_second": 3.204, + "eval_wer": 1.0532665215827557, + "step": 2000 + }, + { + "epoch": 0.38, + "eval_loss": 0.24785736203193665, + "eval_runtime": 589.1749, + "eval_samples_per_second": 25.61, + "eval_steps_per_second": 3.203, + "eval_wer": 1.012795425589632, + "step": 2100 + }, + { + "epoch": 0.4, + "eval_loss": 0.2482644021511078, + "eval_runtime": 588.4854, + "eval_samples_per_second": 25.64, + "eval_steps_per_second": 3.207, + "eval_wer": 1.0385691556482142, + "step": 2200 + }, + { + "epoch": 0.42, + "eval_loss": 0.2435576617717743, + "eval_runtime": 588.7455, + "eval_samples_per_second": 25.629, + "eval_steps_per_second": 3.205, + "eval_wer": 1.052827612272392, + "step": 2300 + }, + { + "epoch": 0.43, + "eval_loss": 0.23819999396800995, + "eval_runtime": 588.1659, + "eval_samples_per_second": 25.654, + "eval_steps_per_second": 3.208, + "eval_wer": 1.0476094682491786, + "step": 2400 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002927274933268624, + "loss": 0.2634, + "step": 2500 + }, + { + "epoch": 0.45, + "eval_loss": 0.23290811479091644, + "eval_runtime": 586.0097, + "eval_samples_per_second": 25.749, + "eval_steps_per_second": 3.22, + "eval_wer": 1.0680492309943124, + "step": 2500 + }, + { + "epoch": 0.47, + "eval_loss": 0.24330949783325195, + "eval_runtime": 588.1907, + "eval_samples_per_second": 25.653, + "eval_steps_per_second": 3.208, + "eval_wer": 1.0581067159220447, + "step": 2600 + }, + { + "epoch": 0.49, + "eval_loss": 0.23539048433303833, + "eval_runtime": 586.7811, + "eval_samples_per_second": 25.715, + "eval_steps_per_second": 3.216, + "eval_wer": 1.0640990472010388, + "step": 2700 + }, + { + "epoch": 0.51, + "eval_loss": 0.23182104527950287, + "eval_runtime": 587.761, + "eval_samples_per_second": 25.672, + "eval_steps_per_second": 3.21, + "eval_wer": 1.0504197070280354, + "step": 2800 + }, + { + "epoch": 0.52, + "eval_loss": 0.2324739396572113, + "eval_runtime": 586.8577, + "eval_samples_per_second": 25.712, + "eval_steps_per_second": 3.215, + "eval_wer": 1.0500112775308912, + "step": 2900 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002909075467119631, + "loss": 0.2522, + "step": 3000 + }, + { + "epoch": 0.54, + "eval_loss": 0.23437276482582092, + "eval_runtime": 587.0455, + "eval_samples_per_second": 25.703, + "eval_steps_per_second": 3.214, + "eval_wer": 1.0380083270849716, + "step": 3000 + }, + { + "epoch": 0.56, + "eval_loss": 0.22438600659370422, + "eval_runtime": 586.7245, + "eval_samples_per_second": 25.717, + "eval_steps_per_second": 3.216, + "eval_wer": 1.0662996897155015, + "step": 3100 + }, + { + "epoch": 0.58, + "eval_loss": 0.23398412764072418, + "eval_runtime": 612.4912, + "eval_samples_per_second": 24.635, + "eval_steps_per_second": 3.081, + "eval_wer": 1.0646781636522131, + "step": 3200 + }, + { + "epoch": 0.6, + "eval_loss": 0.22881384193897247, + "eval_runtime": 585.7737, + "eval_samples_per_second": 25.759, + "eval_steps_per_second": 3.221, + "eval_wer": 1.053760294556915, + "step": 3300 + }, + { + "epoch": 0.61, + "eval_loss": 0.22119460999965668, + "eval_runtime": 586.2268, + "eval_samples_per_second": 25.739, + "eval_steps_per_second": 3.219, + "eval_wer": 1.0614473034509244, + "step": 3400 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002890876000970638, + "loss": 0.2468, + "step": 3500 + }, + { + "epoch": 0.63, + "eval_loss": 0.24868042767047882, + "eval_runtime": 586.4723, + "eval_samples_per_second": 25.728, + "eval_steps_per_second": 3.218, + "eval_wer": 1.0557414824161957, + "step": 3500 + }, + { + "epoch": 0.65, + "eval_loss": 0.23298682272434235, + "eval_runtime": 585.8307, + "eval_samples_per_second": 25.757, + "eval_steps_per_second": 3.221, + "eval_wer": 1.0509561517407022, + "step": 3600 + }, + { + "epoch": 0.67, + "eval_loss": 0.230791836977005, + "eval_runtime": 585.3799, + "eval_samples_per_second": 25.776, + "eval_steps_per_second": 3.224, + "eval_wer": 1.0506330657205734, + "step": 3700 + }, + { + "epoch": 0.69, + "eval_loss": 0.2320248782634735, + "eval_runtime": 583.445, + "eval_samples_per_second": 25.862, + "eval_steps_per_second": 3.234, + "eval_wer": 1.0450796437519432, + "step": 3800 + }, + { + "epoch": 0.71, + "eval_loss": 0.22605428099632263, + "eval_runtime": 586.6782, + "eval_samples_per_second": 25.719, + "eval_steps_per_second": 3.216, + "eval_wer": 1.0701462421438281, + "step": 3900 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002872676534821645, + "loss": 0.2505, + "step": 4000 + }, + { + "epoch": 0.72, + "eval_loss": 0.22813868522644043, + "eval_runtime": 585.3181, + "eval_samples_per_second": 25.779, + "eval_steps_per_second": 3.224, + "eval_wer": 1.0713288588967527, + "step": 4000 + }, + { + "epoch": 0.74, + "eval_loss": 0.22771993279457092, + "eval_runtime": 585.9383, + "eval_samples_per_second": 25.752, + "eval_steps_per_second": 3.22, + "eval_wer": 1.0741147138250338, + "step": 4100 + }, + { + "epoch": 0.76, + "eval_loss": 0.2253136932849884, + "eval_runtime": 586.3951, + "eval_samples_per_second": 25.732, + "eval_steps_per_second": 3.218, + "eval_wer": 1.0814237730351188, + "step": 4200 + }, + { + "epoch": 0.78, + "eval_loss": 0.22151607275009155, + "eval_runtime": 585.0731, + "eval_samples_per_second": 25.79, + "eval_steps_per_second": 3.225, + "eval_wer": 1.0437141481197003, + "step": 4300 + }, + { + "epoch": 0.8, + "eval_loss": 0.2219705879688263, + "eval_runtime": 585.6079, + "eval_samples_per_second": 25.766, + "eval_steps_per_second": 3.222, + "eval_wer": 1.0557475783788397, + "step": 4400 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002854477068672652, + "loss": 0.2434, + "step": 4500 + }, + { + "epoch": 0.81, + "eval_loss": 0.21836136281490326, + "eval_runtime": 585.1783, + "eval_samples_per_second": 25.785, + "eval_steps_per_second": 3.225, + "eval_wer": 1.053327481209195, + "step": 4500 + }, + { + "epoch": 0.83, + "eval_loss": 0.22221527993679047, + "eval_runtime": 585.7348, + "eval_samples_per_second": 25.761, + "eval_steps_per_second": 3.222, + "eval_wer": 1.0818809702334145, + "step": 4600 + }, + { + "epoch": 0.85, + "eval_loss": 0.21622225642204285, + "eval_runtime": 583.8059, + "eval_samples_per_second": 25.846, + "eval_steps_per_second": 3.232, + "eval_wer": 1.0237681583487257, + "step": 4700 + }, + { + "epoch": 0.87, + "eval_loss": 0.21315866708755493, + "eval_runtime": 586.2817, + "eval_samples_per_second": 25.737, + "eval_steps_per_second": 3.219, + "eval_wer": 1.0456831440536933, + "step": 4800 + }, + { + "epoch": 0.89, + "eval_loss": 0.2067827582359314, + "eval_runtime": 586.0493, + "eval_samples_per_second": 25.747, + "eval_steps_per_second": 3.22, + "eval_wer": 1.0611425053187273, + "step": 4900 + }, + { + "epoch": 0.9, + "learning_rate": 0.00028362776025236594, + "loss": 0.2347, + "step": 5000 + }, + { + "epoch": 0.9, + "eval_loss": 0.21656368672847748, + "eval_runtime": 587.7097, + "eval_samples_per_second": 25.674, + "eval_steps_per_second": 3.211, + "eval_wer": 1.033229092372122, + "step": 5000 + }, + { + "epoch": 0.92, + "eval_loss": 0.20866595208644867, + "eval_runtime": 584.4202, + "eval_samples_per_second": 25.819, + "eval_steps_per_second": 3.229, + "eval_wer": 1.043324006510488, + "step": 5100 + }, + { + "epoch": 0.94, + "eval_loss": 0.20998135209083557, + "eval_runtime": 584.1559, + "eval_samples_per_second": 25.83, + "eval_steps_per_second": 3.23, + "eval_wer": 1.0291813731765451, + "step": 5200 + }, + { + "epoch": 0.96, + "eval_loss": 0.20666413009166718, + "eval_runtime": 596.9283, + "eval_samples_per_second": 25.278, + "eval_steps_per_second": 3.161, + "eval_wer": 1.0733892942704046, + "step": 5300 + }, + { + "epoch": 0.98, + "eval_loss": 0.21476301550865173, + "eval_runtime": 586.1885, + "eval_samples_per_second": 25.741, + "eval_steps_per_second": 3.219, + "eval_wer": 1.0278646452454538, + "step": 5400 + }, + { + "epoch": 0.99, + "learning_rate": 0.0002818078136374666, + "loss": 0.2333, + "step": 5500 + }, + { + "epoch": 0.99, + "eval_loss": 0.21248245239257812, + "eval_runtime": 583.9808, + "eval_samples_per_second": 25.838, + "eval_steps_per_second": 3.231, + "eval_wer": 1.0276695744408477, + "step": 5500 + }, + { + "epoch": 1.01, + "eval_loss": 0.20541033148765564, + "eval_runtime": 585.3036, + "eval_samples_per_second": 25.78, + "eval_steps_per_second": 3.224, + "eval_wer": 1.0453234822577007, + "step": 5600 + }, + { + "epoch": 1.03, + "eval_loss": 0.20914313197135925, + "eval_runtime": 587.377, + "eval_samples_per_second": 25.689, + "eval_steps_per_second": 3.213, + "eval_wer": 1.0556927147150443, + "step": 5700 + }, + { + "epoch": 1.05, + "eval_loss": 0.20860984921455383, + "eval_runtime": 586.6064, + "eval_samples_per_second": 25.723, + "eval_steps_per_second": 3.217, + "eval_wer": 1.0238900776016044, + "step": 5800 + }, + { + "epoch": 1.07, + "eval_loss": 0.20505470037460327, + "eval_runtime": 585.9549, + "eval_samples_per_second": 25.751, + "eval_steps_per_second": 3.22, + "eval_wer": 1.0645074766981828, + "step": 5900 + }, + { + "epoch": 1.09, + "learning_rate": 0.0002799878670225673, + "loss": 0.2087, + "step": 6000 + }, + { + "epoch": 1.09, + "eval_loss": 0.21026617288589478, + "eval_runtime": 586.0996, + "eval_samples_per_second": 25.745, + "eval_steps_per_second": 3.22, + "eval_wer": 1.0239876130039076, + "step": 6000 + }, + { + "epoch": 1.1, + "eval_loss": 0.21449421346187592, + "eval_runtime": 637.0564, + "eval_samples_per_second": 23.686, + "eval_steps_per_second": 2.962, + "eval_wer": 1.019726535115793, + "step": 6100 + }, + { + "epoch": 1.12, + "eval_loss": 0.21362827718257904, + "eval_runtime": 584.7089, + "eval_samples_per_second": 25.806, + "eval_steps_per_second": 3.227, + "eval_wer": 1.024761800259688, + "step": 6200 + }, + { + "epoch": 1.14, + "eval_loss": 0.20446062088012695, + "eval_runtime": 585.0534, + "eval_samples_per_second": 25.791, + "eval_steps_per_second": 3.225, + "eval_wer": 1.0443359363093823, + "step": 6300 + }, + { + "epoch": 1.16, + "eval_loss": 0.20893406867980957, + "eval_runtime": 584.0987, + "eval_samples_per_second": 25.833, + "eval_steps_per_second": 3.231, + "eval_wer": 1.0396969087373433, + "step": 6400 + }, + { + "epoch": 1.18, + "learning_rate": 0.000278167920407668, + "loss": 0.2013, + "step": 6500 + }, + { + "epoch": 1.18, + "eval_loss": 0.20124834775924683, + "eval_runtime": 590.5862, + "eval_samples_per_second": 25.549, + "eval_steps_per_second": 3.195, + "eval_wer": 1.06541577513213, + "step": 6500 + }, + { + "epoch": 1.19, + "eval_loss": 0.20543764531612396, + "eval_runtime": 586.1833, + "eval_samples_per_second": 25.741, + "eval_steps_per_second": 3.219, + "eval_wer": 1.0414342580908664, + "step": 6600 + }, + { + "epoch": 1.21, + "eval_loss": 0.20810039341449738, + "eval_runtime": 584.4277, + "eval_samples_per_second": 25.818, + "eval_steps_per_second": 3.229, + "eval_wer": 1.0631846528044475, + "step": 6700 + }, + { + "epoch": 1.23, + "eval_loss": 0.21040508151054382, + "eval_runtime": 584.8815, + "eval_samples_per_second": 25.798, + "eval_steps_per_second": 3.226, + "eval_wer": 1.0189645397853002, + "step": 6800 + }, + { + "epoch": 1.25, + "eval_loss": 0.20450659096240997, + "eval_runtime": 650.9655, + "eval_samples_per_second": 23.179, + "eval_steps_per_second": 2.899, + "eval_wer": 1.0812835658943083, + "step": 6900 + }, + { + "epoch": 1.27, + "learning_rate": 0.00027634797379276873, + "loss": 0.2092, + "step": 7000 + }, + { + "epoch": 1.27, + "eval_loss": 0.20958924293518066, + "eval_runtime": 584.7926, + "eval_samples_per_second": 25.802, + "eval_steps_per_second": 3.227, + "eval_wer": 1.0751449315118597, + "step": 7000 + }, + { + "epoch": 1.28, + "eval_loss": 0.21034906804561615, + "eval_runtime": 585.9876, + "eval_samples_per_second": 25.75, + "eval_steps_per_second": 3.22, + "eval_wer": 1.0327597032485385, + "step": 7100 + }, + { + "epoch": 1.3, + "eval_loss": 0.20439012348651886, + "eval_runtime": 584.5735, + "eval_samples_per_second": 25.812, + "eval_steps_per_second": 3.228, + "eval_wer": 1.0011094652011971, + "step": 7200 + }, + { + "epoch": 1.32, + "eval_loss": 0.20891864597797394, + "eval_runtime": 600.6694, + "eval_samples_per_second": 25.12, + "eval_steps_per_second": 3.141, + "eval_wer": 1.0259748968258322, + "step": 7300 + }, + { + "epoch": 1.34, + "eval_loss": 0.20627248287200928, + "eval_runtime": 585.2007, + "eval_samples_per_second": 25.784, + "eval_steps_per_second": 3.225, + "eval_wer": 1.0550648305627184, + "step": 7400 + }, + { + "epoch": 1.36, + "learning_rate": 0.00027452802717786945, + "loss": 0.2076, + "step": 7500 + }, + { + "epoch": 1.36, + "eval_loss": 0.20286831259727478, + "eval_runtime": 584.7246, + "eval_samples_per_second": 25.805, + "eval_steps_per_second": 3.227, + "eval_wer": 1.0074919380894034, + "step": 7500 + }, + { + "epoch": 1.37, + "eval_loss": 0.20403894782066345, + "eval_runtime": 583.776, + "eval_samples_per_second": 25.847, + "eval_steps_per_second": 3.232, + "eval_wer": 1.05280932438446, + "step": 7600 + }, + { + "epoch": 1.39, + "eval_loss": 0.20745955407619476, + "eval_runtime": 604.3868, + "eval_samples_per_second": 24.966, + "eval_steps_per_second": 3.122, + "eval_wer": 1.039824923952866, + "step": 7700 + }, + { + "epoch": 1.41, + "eval_loss": 0.20228976011276245, + "eval_runtime": 585.3687, + "eval_samples_per_second": 25.777, + "eval_steps_per_second": 3.224, + "eval_wer": 1.0231280822711117, + "step": 7800 + }, + { + "epoch": 1.43, + "eval_loss": 0.20485945045948029, + "eval_runtime": 583.728, + "eval_samples_per_second": 25.849, + "eval_steps_per_second": 3.233, + "eval_wer": 1.0318331169266595, + "step": 7900 + }, + { + "epoch": 1.45, + "learning_rate": 0.0002727080805629701, + "loss": 0.2028, + "step": 8000 + }, + { + "epoch": 1.45, + "eval_loss": 0.20722831785678864, + "eval_runtime": 583.7841, + "eval_samples_per_second": 25.847, + "eval_steps_per_second": 3.232, + "eval_wer": 1.0762909724889207, + "step": 8000 + }, + { + "epoch": 1.47, + "eval_loss": 0.20749975740909576, + "eval_runtime": 584.061, + "eval_samples_per_second": 25.835, + "eval_steps_per_second": 3.231, + "eval_wer": 1.07615076534811, + "step": 8100 + }, + { + "epoch": 1.48, + "eval_loss": 0.20522591471672058, + "eval_runtime": 584.4057, + "eval_samples_per_second": 25.819, + "eval_steps_per_second": 3.229, + "eval_wer": 1.0838072944288997, + "step": 8200 + }, + { + "epoch": 1.5, + "eval_loss": 0.20528368651866913, + "eval_runtime": 585.178, + "eval_samples_per_second": 25.785, + "eval_steps_per_second": 3.225, + "eval_wer": 1.0407088385362375, + "step": 8300 + }, + { + "epoch": 1.52, + "eval_loss": 0.20656365156173706, + "eval_runtime": 582.9655, + "eval_samples_per_second": 25.883, + "eval_steps_per_second": 3.237, + "eval_wer": 1.0265844930902264, + "step": 8400 + }, + { + "epoch": 1.54, + "learning_rate": 0.00027089177384130066, + "loss": 0.2025, + "step": 8500 + }, + { + "epoch": 1.54, + "eval_loss": 0.20365557074546814, + "eval_runtime": 618.5483, + "eval_samples_per_second": 24.394, + "eval_steps_per_second": 3.051, + "eval_wer": 1.0628432788963869, + "step": 8500 + }, + { + "epoch": 1.56, + "eval_loss": 0.20097516477108002, + "eval_runtime": 587.6824, + "eval_samples_per_second": 25.675, + "eval_steps_per_second": 3.211, + "eval_wer": 1.0351432246423193, + "step": 8600 + }, + { + "epoch": 1.57, + "eval_loss": 0.19610826671123505, + "eval_runtime": 622.9403, + "eval_samples_per_second": 24.222, + "eval_steps_per_second": 3.029, + "eval_wer": 1.0811799345293611, + "step": 8700 + }, + { + "epoch": 1.59, + "eval_loss": 0.19632692635059357, + "eval_runtime": 575.4893, + "eval_samples_per_second": 26.219, + "eval_steps_per_second": 3.279, + "eval_wer": 1.0867516443859233, + "step": 8800 + }, + { + "epoch": 1.61, + "eval_loss": 0.20223282277584076, + "eval_runtime": 608.9116, + "eval_samples_per_second": 24.78, + "eval_steps_per_second": 3.099, + "eval_wer": 1.0710118688392678, + "step": 8900 + }, + { + "epoch": 1.63, + "learning_rate": 0.0002690718272264013, + "loss": 0.1997, + "step": 9000 + }, + { + "epoch": 1.63, + "eval_loss": 0.20513388514518738, + "eval_runtime": 598.4671, + "eval_samples_per_second": 25.213, + "eval_steps_per_second": 3.153, + "eval_wer": 1.076449467517663, + "step": 9000 + }, + { + "epoch": 1.65, + "eval_loss": 0.19871561229228973, + "eval_runtime": 590.1203, + "eval_samples_per_second": 25.569, + "eval_steps_per_second": 3.198, + "eval_wer": 1.0580579482208934, + "step": 9100 + }, + { + "epoch": 1.66, + "eval_loss": 0.2050638645887375, + "eval_runtime": 605.4186, + "eval_samples_per_second": 24.923, + "eval_steps_per_second": 3.117, + "eval_wer": 1.0611425053187273, + "step": 9200 + }, + { + "epoch": 1.68, + "eval_loss": 0.19992168247699738, + "eval_runtime": 583.3088, + "eval_samples_per_second": 25.868, + "eval_steps_per_second": 3.235, + "eval_wer": 1.0808263686960127, + "step": 9300 + }, + { + "epoch": 1.7, + "eval_loss": 0.19722315669059753, + "eval_runtime": 584.2218, + "eval_samples_per_second": 25.828, + "eval_steps_per_second": 3.23, + "eval_wer": 1.0703230250605025, + "step": 9400 + }, + { + "epoch": 1.72, + "learning_rate": 0.00026725552050473186, + "loss": 0.1983, + "step": 9500 + }, + { + "epoch": 1.72, + "eval_loss": 0.19610898196697235, + "eval_runtime": 595.3314, + "eval_samples_per_second": 25.346, + "eval_steps_per_second": 3.17, + "eval_wer": 1.0583749382783783, + "step": 9500 + }, + { + "epoch": 1.74, + "eval_loss": 0.20308014750480652, + "eval_runtime": 581.8181, + "eval_samples_per_second": 25.934, + "eval_steps_per_second": 3.243, + "eval_wer": 1.0938107691276069, + "step": 9600 + }, + { + "epoch": 1.75, + "eval_loss": 0.20190203189849854, + "eval_runtime": 587.8215, + "eval_samples_per_second": 25.669, + "eval_steps_per_second": 3.21, + "eval_wer": 1.0891229738544161, + "step": 9700 + }, + { + "epoch": 1.77, + "eval_loss": 0.20063284039497375, + "eval_runtime": 584.1697, + "eval_samples_per_second": 25.83, + "eval_steps_per_second": 3.23, + "eval_wer": 1.0542418756057863, + "step": 9800 + }, + { + "epoch": 1.79, + "eval_loss": 0.19250920414924622, + "eval_runtime": 585.7179, + "eval_samples_per_second": 25.762, + "eval_steps_per_second": 3.222, + "eval_wer": 1.0627091677182203, + "step": 9900 + }, + { + "epoch": 1.81, + "learning_rate": 0.00026543557388983253, + "loss": 0.1961, + "step": 10000 + }, + { + "epoch": 1.81, + "eval_loss": 0.19760142266750336, + "eval_runtime": 583.2305, + "eval_samples_per_second": 25.871, + "eval_steps_per_second": 3.235, + "eval_wer": 1.0750595880348446, + "step": 10000 + }, + { + "epoch": 1.83, + "eval_loss": 0.20509831607341766, + "eval_runtime": 591.9667, + "eval_samples_per_second": 25.49, + "eval_steps_per_second": 3.188, + "eval_wer": 1.0611120255055078, + "step": 10100 + }, + { + "epoch": 1.85, + "eval_loss": 0.20372095704078674, + "eval_runtime": 583.6045, + "eval_samples_per_second": 25.855, + "eval_steps_per_second": 3.233, + "eval_wer": 1.0655986540114482, + "step": 10200 + }, + { + "epoch": 1.86, + "eval_loss": 0.20245492458343506, + "eval_runtime": 583.3003, + "eval_samples_per_second": 25.868, + "eval_steps_per_second": 3.235, + "eval_wer": 1.0291326054753935, + "step": 10300 + }, + { + "epoch": 1.88, + "eval_loss": 0.1976877748966217, + "eval_runtime": 583.6653, + "eval_samples_per_second": 25.852, + "eval_steps_per_second": 3.233, + "eval_wer": 1.052510622214907, + "step": 10400 + }, + { + "epoch": 1.9, + "learning_rate": 0.00026361562727493325, + "loss": 0.2025, + "step": 10500 + }, + { + "epoch": 1.9, + "eval_loss": 0.2030467540025711, + "eval_runtime": 587.811, + "eval_samples_per_second": 25.67, + "eval_steps_per_second": 3.21, + "eval_wer": 1.0669885334942668, + "step": 10500 + }, + { + "epoch": 1.92, + "eval_loss": 0.1979692280292511, + "eval_runtime": 584.4024, + "eval_samples_per_second": 25.82, + "eval_steps_per_second": 3.229, + "eval_wer": 1.0765165231067464, + "step": 10600 + }, + { + "epoch": 1.94, + "eval_loss": 0.19752389192581177, + "eval_runtime": 584.2228, + "eval_samples_per_second": 25.827, + "eval_steps_per_second": 3.23, + "eval_wer": 1.0254140682625896, + "step": 10700 + }, + { + "epoch": 1.95, + "eval_loss": 0.19863851368427277, + "eval_runtime": 584.6885, + "eval_samples_per_second": 25.807, + "eval_steps_per_second": 3.227, + "eval_wer": 1.0636052742268796, + "step": 10800 + }, + { + "epoch": 1.97, + "eval_loss": 0.19562380015850067, + "eval_runtime": 584.0348, + "eval_samples_per_second": 25.836, + "eval_steps_per_second": 3.231, + "eval_wer": 1.0351676084928951, + "step": 10900 + }, + { + "epoch": 1.99, + "learning_rate": 0.000261795680660034, + "loss": 0.2025, + "step": 11000 + }, + { + "epoch": 1.99, + "eval_loss": 0.19542592763900757, + "eval_runtime": 583.716, + "eval_samples_per_second": 25.85, + "eval_steps_per_second": 3.233, + "eval_wer": 1.0265479173143628, + "step": 11000 + }, + { + "epoch": 2.01, + "eval_loss": 0.19573526084423065, + "eval_runtime": 585.187, + "eval_samples_per_second": 25.785, + "eval_steps_per_second": 3.225, + "eval_wer": 1.075218083063587, + "step": 11100 + }, + { + "epoch": 2.03, + "eval_loss": 0.19426105916500092, + "eval_runtime": 582.8174, + "eval_samples_per_second": 25.89, + "eval_steps_per_second": 3.238, + "eval_wer": 1.0783818876757922, + "step": 11200 + }, + { + "epoch": 2.04, + "eval_loss": 0.1898316591978073, + "eval_runtime": 614.8974, + "eval_samples_per_second": 24.539, + "eval_steps_per_second": 3.069, + "eval_wer": 1.0341130069554934, + "step": 11300 + }, + { + "epoch": 2.06, + "eval_loss": 0.19210608303546906, + "eval_runtime": 584.1617, + "eval_samples_per_second": 25.83, + "eval_steps_per_second": 3.23, + "eval_wer": 1.0301445352742877, + "step": 11400 + }, + { + "epoch": 2.08, + "learning_rate": 0.00025997573404513464, + "loss": 0.1805, + "step": 11500 + }, + { + "epoch": 2.08, + "eval_loss": 0.19096077978610992, + "eval_runtime": 581.9805, + "eval_samples_per_second": 25.927, + "eval_steps_per_second": 3.242, + "eval_wer": 1.023006163018233, + "step": 11500 + }, + { + "epoch": 2.1, + "eval_loss": 0.19605235755443573, + "eval_runtime": 582.7853, + "eval_samples_per_second": 25.891, + "eval_steps_per_second": 3.238, + "eval_wer": 1.020311747529611, + "step": 11600 + }, + { + "epoch": 2.12, + "eval_loss": 0.1973300278186798, + "eval_runtime": 673.0903, + "eval_samples_per_second": 22.417, + "eval_steps_per_second": 2.803, + "eval_wer": 1.0776198923452998, + "step": 11700 + }, + { + "epoch": 2.13, + "eval_loss": 0.18762777745723724, + "eval_runtime": 583.2234, + "eval_samples_per_second": 25.872, + "eval_steps_per_second": 3.235, + "eval_wer": 1.0787598373597167, + "step": 11800 + }, + { + "epoch": 2.15, + "eval_loss": 0.19344566762447357, + "eval_runtime": 590.5519, + "eval_samples_per_second": 25.551, + "eval_steps_per_second": 3.195, + "eval_wer": 1.0251153660930366, + "step": 11900 + }, + { + "epoch": 2.17, + "learning_rate": 0.00025815578743023537, + "loss": 0.177, + "step": 12000 + }, + { + "epoch": 2.17, + "eval_loss": 0.1967364251613617, + "eval_runtime": 582.7068, + "eval_samples_per_second": 25.895, + "eval_steps_per_second": 3.238, + "eval_wer": 1.0339971836652584, + "step": 12000 + }, + { + "epoch": 2.19, + "eval_loss": 0.19323694705963135, + "eval_runtime": 614.0473, + "eval_samples_per_second": 24.573, + "eval_steps_per_second": 3.073, + "eval_wer": 1.0131428954603365, + "step": 12100 + }, + { + "epoch": 2.21, + "eval_loss": 0.19259363412857056, + "eval_runtime": 583.7904, + "eval_samples_per_second": 25.847, + "eval_steps_per_second": 3.232, + "eval_wer": 1.0077784483336687, + "step": 12200 + }, + { + "epoch": 2.23, + "eval_loss": 0.19467875361442566, + "eval_runtime": 592.864, + "eval_samples_per_second": 25.451, + "eval_steps_per_second": 3.183, + "eval_wer": 0.9991404692672043, + "step": 12300 + }, + { + "epoch": 2.24, + "eval_loss": 0.191410094499588, + "eval_runtime": 584.2417, + "eval_samples_per_second": 25.827, + "eval_steps_per_second": 3.23, + "eval_wer": 1.021262717702066, + "step": 12400 + }, + { + "epoch": 2.26, + "learning_rate": 0.00025633584081533603, + "loss": 0.1782, + "step": 12500 + }, + { + "epoch": 2.26, + "eval_loss": 0.19619227945804596, + "eval_runtime": 633.7228, + "eval_samples_per_second": 23.81, + "eval_steps_per_second": 2.978, + "eval_wer": 0.9882469840224819, + "step": 12500 + }, + { + "epoch": 2.28, + "eval_loss": 0.19596128165721893, + "eval_runtime": 581.5084, + "eval_samples_per_second": 25.948, + "eval_steps_per_second": 3.245, + "eval_wer": 1.0562230634650671, + "step": 12600 + }, + { + "epoch": 2.3, + "eval_loss": 0.20055778324604034, + "eval_runtime": 584.0758, + "eval_samples_per_second": 25.834, + "eval_steps_per_second": 3.231, + "eval_wer": 1.0400687624586236, + "step": 12700 + }, + { + "epoch": 2.32, + "eval_loss": 0.19500796496868134, + "eval_runtime": 582.9458, + "eval_samples_per_second": 25.884, + "eval_steps_per_second": 3.237, + "eval_wer": 1.0687502666983657, + "step": 12800 + }, + { + "epoch": 2.33, + "eval_loss": 0.19202886521816254, + "eval_runtime": 667.6773, + "eval_samples_per_second": 22.599, + "eval_steps_per_second": 2.826, + "eval_wer": 1.0435312692403822, + "step": 12900 + }, + { + "epoch": 2.35, + "learning_rate": 0.00025451589420043676, + "loss": 0.1796, + "step": 13000 + }, + { + "epoch": 2.35, + "eval_loss": 0.19256320595741272, + "eval_runtime": 583.0382, + "eval_samples_per_second": 25.88, + "eval_steps_per_second": 3.236, + "eval_wer": 1.0667081192126455, + "step": 13000 + }, + { + "epoch": 2.37, + "eval_loss": 0.19494299590587616, + "eval_runtime": 594.068, + "eval_samples_per_second": 25.399, + "eval_steps_per_second": 3.176, + "eval_wer": 1.0858799217278396, + "step": 13100 + }, + { + "epoch": 2.39, + "eval_loss": 0.19322112202644348, + "eval_runtime": 583.3591, + "eval_samples_per_second": 25.866, + "eval_steps_per_second": 3.235, + "eval_wer": 1.0670373011954182, + "step": 13200 + }, + { + "epoch": 2.41, + "eval_loss": 0.1882387101650238, + "eval_runtime": 593.7714, + "eval_samples_per_second": 25.412, + "eval_steps_per_second": 3.178, + "eval_wer": 1.0663484574166529, + "step": 13300 + }, + { + "epoch": 2.42, + "eval_loss": 0.18768326938152313, + "eval_runtime": 583.1762, + "eval_samples_per_second": 25.874, + "eval_steps_per_second": 3.236, + "eval_wer": 1.0759983662820114, + "step": 13400 + }, + { + "epoch": 2.44, + "learning_rate": 0.00025269958747876724, + "loss": 0.1775, + "step": 13500 + }, + { + "epoch": 2.44, + "eval_loss": 0.18931668996810913, + "eval_runtime": 582.2322, + "eval_samples_per_second": 25.916, + "eval_steps_per_second": 3.241, + "eval_wer": 1.0858799217278396, + "step": 13500 + }, + { + "epoch": 2.46, + "eval_loss": 0.19357560575008392, + "eval_runtime": 582.3494, + "eval_samples_per_second": 25.911, + "eval_steps_per_second": 3.24, + "eval_wer": 1.0702315856208433, + "step": 13600 + }, + { + "epoch": 2.48, + "eval_loss": 0.18714427947998047, + "eval_runtime": 729.8014, + "eval_samples_per_second": 20.675, + "eval_steps_per_second": 2.586, + "eval_wer": 1.0413854903897148, + "step": 13700 + }, + { + "epoch": 2.5, + "eval_loss": 0.19174307584762573, + "eval_runtime": 582.2533, + "eval_samples_per_second": 25.915, + "eval_steps_per_second": 3.241, + "eval_wer": 1.0430009204903592, + "step": 13800 + }, + { + "epoch": 2.51, + "eval_loss": 0.19221140444278717, + "eval_runtime": 582.224, + "eval_samples_per_second": 25.916, + "eval_steps_per_second": 3.241, + "eval_wer": 1.042208445346647, + "step": 13900 + }, + { + "epoch": 2.53, + "learning_rate": 0.00025087964086386796, + "loss": 0.1778, + "step": 14000 + }, + { + "epoch": 2.53, + "eval_loss": 0.1874552071094513, + "eval_runtime": 584.0031, + "eval_samples_per_second": 25.837, + "eval_steps_per_second": 3.231, + "eval_wer": 1.0584846656059692, + "step": 14000 + }, + { + "epoch": 2.55, + "eval_loss": 0.18758933246135712, + "eval_runtime": 585.1267, + "eval_samples_per_second": 25.788, + "eval_steps_per_second": 3.225, + "eval_wer": 1.0603195503617955, + "step": 14100 + }, + { + "epoch": 2.57, + "eval_loss": 0.18875516951084137, + "eval_runtime": 581.9395, + "eval_samples_per_second": 25.929, + "eval_steps_per_second": 3.243, + "eval_wer": 1.062837182933743, + "step": 14200 + }, + { + "epoch": 2.59, + "eval_loss": 0.1948392391204834, + "eval_runtime": 583.5666, + "eval_samples_per_second": 25.857, + "eval_steps_per_second": 3.234, + "eval_wer": 1.078217296684406, + "step": 14300 + }, + { + "epoch": 2.6, + "eval_loss": 0.19421540200710297, + "eval_runtime": 583.5382, + "eval_samples_per_second": 25.858, + "eval_steps_per_second": 3.234, + "eval_wer": 1.069536645879434, + "step": 14400 + }, + { + "epoch": 2.62, + "learning_rate": 0.0002490596942489687, + "loss": 0.1784, + "step": 14500 + }, + { + "epoch": 2.62, + "eval_loss": 0.18421576917171478, + "eval_runtime": 702.5128, + "eval_samples_per_second": 21.479, + "eval_steps_per_second": 2.686, + "eval_wer": 1.086276159299696, + "step": 14500 + }, + { + "epoch": 2.64, + "eval_loss": 0.18499960005283356, + "eval_runtime": 582.6097, + "eval_samples_per_second": 25.899, + "eval_steps_per_second": 3.239, + "eval_wer": 1.0542784513816499, + "step": 14600 + }, + { + "epoch": 2.66, + "eval_loss": 0.18243639171123505, + "eval_runtime": 582.7743, + "eval_samples_per_second": 25.892, + "eval_steps_per_second": 3.238, + "eval_wer": 1.0683479331638657, + "step": 14700 + }, + { + "epoch": 2.68, + "eval_loss": 0.1887967884540558, + "eval_runtime": 584.0929, + "eval_samples_per_second": 25.833, + "eval_steps_per_second": 3.231, + "eval_wer": 1.0693110952616083, + "step": 14800 + }, + { + "epoch": 2.7, + "eval_loss": 0.1871066838502884, + "eval_runtime": 649.9925, + "eval_samples_per_second": 23.214, + "eval_steps_per_second": 2.903, + "eval_wer": 1.0174771249001786, + "step": 14900 + }, + { + "epoch": 2.71, + "learning_rate": 0.00024723974763406935, + "loss": 0.1753, + "step": 15000 + }, + { + "epoch": 2.71, + "eval_loss": 0.1888967603445053, + "eval_runtime": 583.1751, + "eval_samples_per_second": 25.874, + "eval_steps_per_second": 3.236, + "eval_wer": 1.0548636637954683, + "step": 15000 + }, + { + "epoch": 2.73, + "eval_loss": 0.18651245534420013, + "eval_runtime": 582.2511, + "eval_samples_per_second": 25.915, + "eval_steps_per_second": 3.241, + "eval_wer": 1.0543881787092408, + "step": 15100 + }, + { + "epoch": 2.75, + "eval_loss": 0.19178926944732666, + "eval_runtime": 582.2685, + "eval_samples_per_second": 25.914, + "eval_steps_per_second": 3.241, + "eval_wer": 1.0725907231640484, + "step": 15200 + }, + { + "epoch": 2.77, + "eval_loss": 0.19644701480865479, + "eval_runtime": 591.4992, + "eval_samples_per_second": 25.51, + "eval_steps_per_second": 3.19, + "eval_wer": 1.0915003992855532, + "step": 15300 + }, + { + "epoch": 2.79, + "eval_loss": 0.1900092214345932, + "eval_runtime": 582.3923, + "eval_samples_per_second": 25.909, + "eval_steps_per_second": 3.24, + "eval_wer": 1.0610205860658486, + "step": 15400 + }, + { + "epoch": 2.8, + "learning_rate": 0.0002454198010191701, + "loss": 0.1768, + "step": 15500 + }, + { + "epoch": 2.8, + "eval_loss": 0.1893770694732666, + "eval_runtime": 581.8947, + "eval_samples_per_second": 25.931, + "eval_steps_per_second": 3.243, + "eval_wer": 1.076254396713057, + "step": 15500 + }, + { + "epoch": 2.82, + "eval_loss": 0.18816040456295013, + "eval_runtime": 582.1192, + "eval_samples_per_second": 25.921, + "eval_steps_per_second": 3.242, + "eval_wer": 1.0547905122437409, + "step": 15600 + }, + { + "epoch": 2.84, + "eval_loss": 0.18607495725154877, + "eval_runtime": 677.7124, + "eval_samples_per_second": 22.265, + "eval_steps_per_second": 2.784, + "eval_wer": 1.0901531915412421, + "step": 15700 + }, + { + "epoch": 2.86, + "eval_loss": 0.18599402904510498, + "eval_runtime": 582.8742, + "eval_samples_per_second": 25.887, + "eval_steps_per_second": 3.237, + "eval_wer": 1.0551379821144455, + "step": 15800 + }, + { + "epoch": 2.88, + "eval_loss": 0.1878904402256012, + "eval_runtime": 583.6205, + "eval_samples_per_second": 25.854, + "eval_steps_per_second": 3.233, + "eval_wer": 1.058094523996757, + "step": 15900 + }, + { + "epoch": 2.89, + "learning_rate": 0.0002435998544042708, + "loss": 0.1761, + "step": 16000 + }, + { + "epoch": 2.89, + "eval_loss": 0.18994924426078796, + "eval_runtime": 582.1435, + "eval_samples_per_second": 25.92, + "eval_steps_per_second": 3.241, + "eval_wer": 1.0544369464103924, + "step": 16000 + }, + { + "epoch": 2.91, + "eval_loss": 0.18596774339675903, + "eval_runtime": 667.4862, + "eval_samples_per_second": 22.606, + "eval_steps_per_second": 2.827, + "eval_wer": 1.0530226830769982, + "step": 16100 + }, + { + "epoch": 2.93, + "eval_loss": 0.1893654614686966, + "eval_runtime": 582.0917, + "eval_samples_per_second": 25.922, + "eval_steps_per_second": 3.242, + "eval_wer": 1.0595697469565906, + "step": 16200 + }, + { + "epoch": 2.95, + "eval_loss": 0.18347308039665222, + "eval_runtime": 583.0288, + "eval_samples_per_second": 25.88, + "eval_steps_per_second": 3.237, + "eval_wer": 1.039404302530434, + "step": 16300 + }, + { + "epoch": 2.97, + "eval_loss": 0.18515755236148834, + "eval_runtime": 582.7168, + "eval_samples_per_second": 25.894, + "eval_steps_per_second": 3.238, + "eval_wer": 1.0444883353754808, + "step": 16400 + }, + { + "epoch": 2.98, + "learning_rate": 0.00024178354768260128, + "loss": 0.1754, + "step": 16500 + }, + { + "epoch": 2.98, + "eval_loss": 0.1847403347492218, + "eval_runtime": 639.6413, + "eval_samples_per_second": 23.59, + "eval_steps_per_second": 2.95, + "eval_wer": 1.0389836811080022, + "step": 16500 + }, + { + "epoch": 3.0, + "eval_loss": 0.1828482747077942, + "eval_runtime": 584.2229, + "eval_samples_per_second": 25.827, + "eval_steps_per_second": 3.23, + "eval_wer": 1.0440311381771852, + "step": 16600 + }, + { + "epoch": 3.02, + "eval_loss": 0.18693839013576508, + "eval_runtime": 595.3259, + "eval_samples_per_second": 25.346, + "eval_steps_per_second": 3.17, + "eval_wer": 1.0559792249593094, + "step": 16700 + }, + { + "epoch": 3.04, + "eval_loss": 0.18819798529148102, + "eval_runtime": 594.2234, + "eval_samples_per_second": 25.393, + "eval_steps_per_second": 3.176, + "eval_wer": 1.057277665002469, + "step": 16800 + }, + { + "epoch": 3.06, + "eval_loss": 0.19123658537864685, + "eval_runtime": 595.6382, + "eval_samples_per_second": 25.332, + "eval_steps_per_second": 3.168, + "eval_wer": 1.0600269441548862, + "step": 16900 + }, + { + "epoch": 3.08, + "learning_rate": 0.000239963601067702, + "loss": 0.1592, + "step": 17000 + }, + { + "epoch": 3.08, + "eval_loss": 0.19209939241409302, + "eval_runtime": 581.7293, + "eval_samples_per_second": 25.938, + "eval_steps_per_second": 3.244, + "eval_wer": 1.0528702840108997, + "step": 17000 + }, + { + "epoch": 3.09, + "eval_loss": 0.18810659646987915, + "eval_runtime": 589.251, + "eval_samples_per_second": 25.607, + "eval_steps_per_second": 3.202, + "eval_wer": 1.0175137006760422, + "step": 17100 + }, + { + "epoch": 3.11, + "eval_loss": 0.18914476037025452, + "eval_runtime": 582.5239, + "eval_samples_per_second": 25.903, + "eval_steps_per_second": 3.239, + "eval_wer": 1.06541577513213, + "step": 17200 + }, + { + "epoch": 3.13, + "eval_loss": 0.18887841701507568, + "eval_runtime": 611.0926, + "eval_samples_per_second": 24.692, + "eval_steps_per_second": 3.088, + "eval_wer": 1.06872588284779, + "step": 17300 + }, + { + "epoch": 3.15, + "eval_loss": 0.19159947335720062, + "eval_runtime": 582.2026, + "eval_samples_per_second": 25.917, + "eval_steps_per_second": 3.241, + "eval_wer": 1.0641661027901221, + "step": 17400 + }, + { + "epoch": 3.17, + "learning_rate": 0.0002381436544528027, + "loss": 0.1556, + "step": 17500 + }, + { + "epoch": 3.17, + "eval_loss": 0.1849842667579651, + "eval_runtime": 593.9614, + "eval_samples_per_second": 25.404, + "eval_steps_per_second": 3.177, + "eval_wer": 1.0295471309351816, + "step": 17500 + }, + { + "epoch": 3.18, + "eval_loss": 0.18748754262924194, + "eval_runtime": 582.3741, + "eval_samples_per_second": 25.909, + "eval_steps_per_second": 3.24, + "eval_wer": 1.0272794328316357, + "step": 17600 + }, + { + "epoch": 3.2, + "eval_loss": 0.1894107609987259, + "eval_runtime": 613.1677, + "eval_samples_per_second": 24.608, + "eval_steps_per_second": 3.077, + "eval_wer": 1.0051449924714861, + "step": 17700 + }, + { + "epoch": 3.22, + "eval_loss": 0.18696586787700653, + "eval_runtime": 581.7614, + "eval_samples_per_second": 25.937, + "eval_steps_per_second": 3.244, + "eval_wer": 1.046201300878428, + "step": 17800 + }, + { + "epoch": 3.24, + "eval_loss": 0.1830950528383255, + "eval_runtime": 584.1829, + "eval_samples_per_second": 25.829, + "eval_steps_per_second": 3.23, + "eval_wer": 1.0308272830904093, + "step": 17900 + }, + { + "epoch": 3.26, + "learning_rate": 0.0002363237078379034, + "loss": 0.1557, + "step": 18000 + }, + { + "epoch": 3.26, + "eval_loss": 0.18782374262809753, + "eval_runtime": 581.3732, + "eval_samples_per_second": 25.954, + "eval_steps_per_second": 3.246, + "eval_wer": 1.0602829745859317, + "step": 18000 + }, + { + "epoch": 3.27, + "eval_loss": 0.18500719964504242, + "eval_runtime": 608.8148, + "eval_samples_per_second": 24.784, + "eval_steps_per_second": 3.099, + "eval_wer": 1.0565644373731278, + "step": 18100 + }, + { + "epoch": 3.29, + "eval_loss": 0.18434764444828033, + "eval_runtime": 581.6725, + "eval_samples_per_second": 25.941, + "eval_steps_per_second": 3.244, + "eval_wer": 1.0629225264107582, + "step": 18200 + }, + { + "epoch": 3.31, + "eval_loss": 0.18864037096500397, + "eval_runtime": 592.2707, + "eval_samples_per_second": 25.477, + "eval_steps_per_second": 3.186, + "eval_wer": 1.037776680504502, + "step": 18300 + }, + { + "epoch": 3.33, + "eval_loss": 0.18917690217494965, + "eval_runtime": 582.1854, + "eval_samples_per_second": 25.918, + "eval_steps_per_second": 3.241, + "eval_wer": 1.038081478636699, + "step": 18400 + }, + { + "epoch": 3.35, + "learning_rate": 0.0002345074011162339, + "loss": 0.159, + "step": 18500 + }, + { + "epoch": 3.35, + "eval_loss": 0.19416740536689758, + "eval_runtime": 606.7386, + "eval_samples_per_second": 24.869, + "eval_steps_per_second": 3.11, + "eval_wer": 1.0519497936516644, + "step": 18500 + }, + { + "epoch": 3.36, + "eval_loss": 0.1828826367855072, + "eval_runtime": 583.2506, + "eval_samples_per_second": 25.871, + "eval_steps_per_second": 3.235, + "eval_wer": 1.0621910108934853, + "step": 18600 + }, + { + "epoch": 3.38, + "eval_loss": 0.18944011628627777, + "eval_runtime": 584.8676, + "eval_samples_per_second": 25.799, + "eval_steps_per_second": 3.226, + "eval_wer": 1.0556683308644685, + "step": 18700 + }, + { + "epoch": 3.4, + "eval_loss": 0.1894686222076416, + "eval_runtime": 583.4404, + "eval_samples_per_second": 25.862, + "eval_steps_per_second": 3.234, + "eval_wer": 1.0626543040544247, + "step": 18800 + }, + { + "epoch": 3.42, + "eval_loss": 0.1863497793674469, + "eval_runtime": 667.2283, + "eval_samples_per_second": 22.614, + "eval_steps_per_second": 2.828, + "eval_wer": 1.0361917302170773, + "step": 18900 + }, + { + "epoch": 3.44, + "learning_rate": 0.0002326874545013346, + "loss": 0.1582, + "step": 19000 + }, + { + "epoch": 3.44, + "eval_loss": 0.1887533962726593, + "eval_runtime": 583.1359, + "eval_samples_per_second": 25.876, + "eval_steps_per_second": 3.236, + "eval_wer": 1.0491029790969442, + "step": 19000 + }, + { + "epoch": 3.46, + "eval_loss": 0.18543538451194763, + "eval_runtime": 602.1626, + "eval_samples_per_second": 25.058, + "eval_steps_per_second": 3.134, + "eval_wer": 1.0483287918411637, + "step": 19100 + }, + { + "epoch": 3.47, + "eval_loss": 0.17971904575824738, + "eval_runtime": 582.7463, + "eval_samples_per_second": 25.893, + "eval_steps_per_second": 3.238, + "eval_wer": 0.9786580347835628, + "step": 19200 + }, + { + "epoch": 3.49, + "eval_loss": 0.17851972579956055, + "eval_runtime": 599.5376, + "eval_samples_per_second": 25.168, + "eval_steps_per_second": 3.147, + "eval_wer": 1.0086440750291081, + "step": 19300 + }, + { + "epoch": 3.51, + "eval_loss": 0.17966009676456451, + "eval_runtime": 582.3922, + "eval_samples_per_second": 25.909, + "eval_steps_per_second": 3.24, + "eval_wer": 0.9914778442237706, + "step": 19400 + }, + { + "epoch": 3.53, + "learning_rate": 0.00023086750788643532, + "loss": 0.1507, + "step": 19500 + }, + { + "epoch": 3.53, + "eval_loss": 0.18731391429901123, + "eval_runtime": 592.8938, + "eval_samples_per_second": 25.45, + "eval_steps_per_second": 3.183, + "eval_wer": 1.026627164828734, + "step": 19500 + }, + { + "epoch": 3.55, + "eval_loss": 0.18384875357151031, + "eval_runtime": 582.4778, + "eval_samples_per_second": 25.905, + "eval_steps_per_second": 3.24, + "eval_wer": 1.0298946008058862, + "step": 19600 + }, + { + "epoch": 3.56, + "eval_loss": 0.1817297637462616, + "eval_runtime": 651.5542, + "eval_samples_per_second": 23.158, + "eval_steps_per_second": 2.896, + "eval_wer": 1.035496790475668, + "step": 19700 + }, + { + "epoch": 3.58, + "eval_loss": 0.1819145381450653, + "eval_runtime": 584.5774, + "eval_samples_per_second": 25.812, + "eval_steps_per_second": 3.228, + "eval_wer": 1.0271209378028932, + "step": 19800 + }, + { + "epoch": 3.6, + "eval_loss": 0.1882605254650116, + "eval_runtime": 584.3669, + "eval_samples_per_second": 25.821, + "eval_steps_per_second": 3.229, + "eval_wer": 1.0248410477740593, + "step": 19900 + }, + { + "epoch": 3.62, + "learning_rate": 0.00022904756127153602, + "loss": 0.1601, + "step": 20000 + }, + { + "epoch": 3.62, + "eval_loss": 0.18232683837413788, + "eval_runtime": 583.0799, + "eval_samples_per_second": 25.878, + "eval_steps_per_second": 3.236, + "eval_wer": 1.040556439470139, + "step": 20000 + }, + { + "epoch": 3.64, + "eval_loss": 0.1801084280014038, + "eval_runtime": 752.5425, + "eval_samples_per_second": 20.051, + "eval_steps_per_second": 2.507, + "eval_wer": 1.0260541443402036, + "step": 20100 + }, + { + "epoch": 3.65, + "eval_loss": 0.17828203737735748, + "eval_runtime": 584.7605, + "eval_samples_per_second": 25.804, + "eval_steps_per_second": 3.227, + "eval_wer": 1.032899910389349, + "step": 20200 + }, + { + "epoch": 3.67, + "eval_loss": 0.18572643399238586, + "eval_runtime": 592.41, + "eval_samples_per_second": 25.471, + "eval_steps_per_second": 3.185, + "eval_wer": 1.0161908767823071, + "step": 20300 + }, + { + "epoch": 3.69, + "eval_loss": 0.18137747049331665, + "eval_runtime": 584.2029, + "eval_samples_per_second": 25.828, + "eval_steps_per_second": 3.23, + "eval_wer": 1.0211956621129825, + "step": 20400 + }, + { + "epoch": 3.71, + "learning_rate": 0.0002272276146566367, + "loss": 0.1552, + "step": 20500 + }, + { + "epoch": 3.71, + "eval_loss": 0.18369783461093903, + "eval_runtime": 679.994, + "eval_samples_per_second": 22.19, + "eval_steps_per_second": 2.775, + "eval_wer": 1.0231768499722633, + "step": 20500 + }, + { + "epoch": 3.73, + "eval_loss": 0.18426425755023956, + "eval_runtime": 583.2731, + "eval_samples_per_second": 25.87, + "eval_steps_per_second": 3.235, + "eval_wer": 1.031357631840432, + "step": 20600 + }, + { + "epoch": 3.74, + "eval_loss": 0.18420319259166718, + "eval_runtime": 584.6255, + "eval_samples_per_second": 25.81, + "eval_steps_per_second": 3.228, + "eval_wer": 1.0258042098718019, + "step": 20700 + }, + { + "epoch": 3.76, + "eval_loss": 0.1821189969778061, + "eval_runtime": 583.3576, + "eval_samples_per_second": 25.866, + "eval_steps_per_second": 3.235, + "eval_wer": 1.0479386502319514, + "step": 20800 + }, + { + "epoch": 3.78, + "eval_loss": 0.18640317022800446, + "eval_runtime": 583.5933, + "eval_samples_per_second": 25.855, + "eval_steps_per_second": 3.233, + "eval_wer": 1.045920886596807, + "step": 20900 + }, + { + "epoch": 3.8, + "learning_rate": 0.0002254076680417374, + "loss": 0.1576, + "step": 21000 + }, + { + "epoch": 3.8, + "eval_loss": 0.18312126398086548, + "eval_runtime": 584.1144, + "eval_samples_per_second": 25.832, + "eval_steps_per_second": 3.231, + "eval_wer": 1.0364294727601908, + "step": 21000 + }, + { + "epoch": 3.82, + "eval_loss": 0.18524977564811707, + "eval_runtime": 583.1667, + "eval_samples_per_second": 25.874, + "eval_steps_per_second": 3.236, + "eval_wer": 1.0271148418402491, + "step": 21100 + }, + { + "epoch": 3.83, + "eval_loss": 0.18645203113555908, + "eval_runtime": 582.2828, + "eval_samples_per_second": 25.914, + "eval_steps_per_second": 3.241, + "eval_wer": 1.0204458587077778, + "step": 21200 + }, + { + "epoch": 3.85, + "eval_loss": 0.1793699860572815, + "eval_runtime": 644.1191, + "eval_samples_per_second": 23.426, + "eval_steps_per_second": 2.93, + "eval_wer": 1.0324305212657656, + "step": 21300 + }, + { + "epoch": 3.87, + "eval_loss": 0.18262524902820587, + "eval_runtime": 583.8148, + "eval_samples_per_second": 25.846, + "eval_steps_per_second": 3.232, + "eval_wer": 1.0315039349438866, + "step": 21400 + }, + { + "epoch": 3.89, + "learning_rate": 0.0002235877214268381, + "loss": 0.1585, + "step": 21500 + }, + { + "epoch": 3.89, + "eval_loss": 0.18238940834999084, + "eval_runtime": 588.9702, + "eval_samples_per_second": 25.619, + "eval_steps_per_second": 3.204, + "eval_wer": 1.0326804557341673, + "step": 21500 + }, + { + "epoch": 3.91, + "eval_loss": 0.18375591933727264, + "eval_runtime": 583.1374, + "eval_samples_per_second": 25.876, + "eval_steps_per_second": 3.236, + "eval_wer": 1.0207811366531947, + "step": 21600 + }, + { + "epoch": 3.93, + "eval_loss": 0.1849592924118042, + "eval_runtime": 583.4937, + "eval_samples_per_second": 25.86, + "eval_steps_per_second": 3.234, + "eval_wer": 1.019909413995111, + "step": 21700 + }, + { + "epoch": 3.94, + "eval_loss": 0.1841159164905548, + "eval_runtime": 584.0991, + "eval_samples_per_second": 25.833, + "eval_steps_per_second": 3.231, + "eval_wer": 1.0050352651438952, + "step": 21800 + }, + { + "epoch": 3.96, + "eval_loss": 0.178331658244133, + "eval_runtime": 583.3943, + "eval_samples_per_second": 25.864, + "eval_steps_per_second": 3.235, + "eval_wer": 1.0003352779454167, + "step": 21900 + }, + { + "epoch": 3.98, + "learning_rate": 0.00022176777481193883, + "loss": 0.1572, + "step": 22000 + }, + { + "epoch": 3.98, + "eval_loss": 0.17869696021080017, + "eval_runtime": 582.8458, + "eval_samples_per_second": 25.888, + "eval_steps_per_second": 3.238, + "eval_wer": 1.0114726016958968, + "step": 22000 + }, + { + "epoch": 4.0, + "eval_loss": 0.180954247713089, + "eval_runtime": 583.446, + "eval_samples_per_second": 25.862, + "eval_steps_per_second": 3.234, + "eval_wer": 1.0235426077308998, + "step": 22100 + }, + { + "epoch": 4.02, + "eval_loss": 0.17629148066043854, + "eval_runtime": 584.1606, + "eval_samples_per_second": 25.83, + "eval_steps_per_second": 3.23, + "eval_wer": 1.019092555000823, + "step": 22200 + }, + { + "epoch": 4.03, + "eval_loss": 0.1763954758644104, + "eval_runtime": 583.2857, + "eval_samples_per_second": 25.869, + "eval_steps_per_second": 3.235, + "eval_wer": 1.033222996409478, + "step": 22300 + }, + { + "epoch": 4.05, + "eval_loss": 0.1793549805879593, + "eval_runtime": 582.3125, + "eval_samples_per_second": 25.912, + "eval_steps_per_second": 3.241, + "eval_wer": 1.0428972891254122, + "step": 22400 + }, + { + "epoch": 4.07, + "learning_rate": 0.00021994782819703953, + "loss": 0.1406, + "step": 22500 + }, + { + "epoch": 4.07, + "eval_loss": 0.1905169039964676, + "eval_runtime": 671.5465, + "eval_samples_per_second": 22.469, + "eval_steps_per_second": 2.81, + "eval_wer": 1.0287546557914693, + "step": 22500 + }, + { + "epoch": 4.09, + "eval_loss": 0.17760008573532104, + "eval_runtime": 582.5998, + "eval_samples_per_second": 25.899, + "eval_steps_per_second": 3.239, + "eval_wer": 1.0244265223142712, + "step": 22600 + }, + { + "epoch": 4.11, + "eval_loss": 0.17820368707180023, + "eval_runtime": 595.3661, + "eval_samples_per_second": 25.344, + "eval_steps_per_second": 3.169, + "eval_wer": 1.045085739714587, + "step": 22700 + }, + { + "epoch": 4.12, + "eval_loss": 0.17709559202194214, + "eval_runtime": 582.1208, + "eval_samples_per_second": 25.921, + "eval_steps_per_second": 3.242, + "eval_wer": 1.0387276506769567, + "step": 22800 + }, + { + "epoch": 4.14, + "eval_loss": 0.17884837090969086, + "eval_runtime": 645.9188, + "eval_samples_per_second": 23.361, + "eval_steps_per_second": 2.921, + "eval_wer": 1.0434581176886548, + "step": 22900 + }, + { + "epoch": 4.16, + "learning_rate": 0.00021812788158214025, + "loss": 0.14, + "step": 23000 + }, + { + "epoch": 4.16, + "eval_loss": 0.17918579280376434, + "eval_runtime": 581.9318, + "eval_samples_per_second": 25.929, + "eval_steps_per_second": 3.243, + "eval_wer": 1.0420804301311242, + "step": 23000 + }, + { + "epoch": 4.18, + "eval_loss": 0.18405954539775848, + "eval_runtime": 588.3849, + "eval_samples_per_second": 25.645, + "eval_steps_per_second": 3.207, + "eval_wer": 1.0240546685929908, + "step": 23100 + }, + { + "epoch": 4.2, + "eval_loss": 0.17691761255264282, + "eval_runtime": 581.3629, + "eval_samples_per_second": 25.955, + "eval_steps_per_second": 3.246, + "eval_wer": 1.0545588656632712, + "step": 23200 + }, + { + "epoch": 4.21, + "eval_loss": 0.18145306408405304, + "eval_runtime": 719.2259, + "eval_samples_per_second": 20.979, + "eval_steps_per_second": 2.624, + "eval_wer": 1.0601915351462727, + "step": 23300 + }, + { + "epoch": 4.23, + "eval_loss": 0.1783633530139923, + "eval_runtime": 581.7307, + "eval_samples_per_second": 25.938, + "eval_steps_per_second": 3.244, + "eval_wer": 1.0368683820705547, + "step": 23400 + }, + { + "epoch": 4.25, + "learning_rate": 0.00021630793496724095, + "loss": 0.1394, + "step": 23500 + }, + { + "epoch": 4.25, + "eval_loss": 0.1808551549911499, + "eval_runtime": 594.0637, + "eval_samples_per_second": 25.4, + "eval_steps_per_second": 3.176, + "eval_wer": 1.0406356869845101, + "step": 23500 + }, + { + "epoch": 4.27, + "eval_loss": 0.17443229258060455, + "eval_runtime": 582.3112, + "eval_samples_per_second": 25.912, + "eval_steps_per_second": 3.241, + "eval_wer": 1.0132831026011473, + "step": 23600 + }, + { + "epoch": 4.29, + "eval_loss": 0.17706982791423798, + "eval_runtime": 624.4614, + "eval_samples_per_second": 24.163, + "eval_steps_per_second": 3.022, + "eval_wer": 1.021354157141725, + "step": 23700 + }, + { + "epoch": 4.31, + "eval_loss": 0.17652854323387146, + "eval_runtime": 582.3415, + "eval_samples_per_second": 25.911, + "eval_steps_per_second": 3.24, + "eval_wer": 1.006394664813494, + "step": 23800 + }, + { + "epoch": 4.32, + "eval_loss": 0.1792861521244049, + "eval_runtime": 610.5223, + "eval_samples_per_second": 24.715, + "eval_steps_per_second": 3.091, + "eval_wer": 1.0200008534347702, + "step": 23900 + }, + { + "epoch": 4.34, + "learning_rate": 0.00021448798835234167, + "loss": 0.14, + "step": 24000 + }, + { + "epoch": 4.34, + "eval_loss": 0.1775696575641632, + "eval_runtime": 582.2567, + "eval_samples_per_second": 25.915, + "eval_steps_per_second": 3.241, + "eval_wer": 1.0351737044555391, + "step": 24000 + }, + { + "epoch": 4.36, + "eval_loss": 0.1774866282939911, + "eval_runtime": 589.1918, + "eval_samples_per_second": 25.61, + "eval_steps_per_second": 3.203, + "eval_wer": 1.0294252116823028, + "step": 24100 + }, + { + "epoch": 4.38, + "eval_loss": 0.1763463169336319, + "eval_runtime": 582.7316, + "eval_samples_per_second": 25.894, + "eval_steps_per_second": 3.238, + "eval_wer": 1.0212810055899977, + "step": 24200 + }, + { + "epoch": 4.4, + "eval_loss": 0.1697307527065277, + "eval_runtime": 594.6072, + "eval_samples_per_second": 25.376, + "eval_steps_per_second": 3.174, + "eval_wer": 1.0302237827886591, + "step": 24300 + }, + { + "epoch": 4.41, + "eval_loss": 0.17706170678138733, + "eval_runtime": 581.6621, + "eval_samples_per_second": 25.941, + "eval_steps_per_second": 3.244, + "eval_wer": 1.025901745274105, + "step": 24400 + }, + { + "epoch": 4.43, + "learning_rate": 0.00021267532152390194, + "loss": 0.1408, + "step": 24500 + }, + { + "epoch": 4.43, + "eval_loss": 0.17474128305912018, + "eval_runtime": 600.4729, + "eval_samples_per_second": 25.129, + "eval_steps_per_second": 3.143, + "eval_wer": 1.0409100053034874, + "step": 24500 + }, + { + "epoch": 4.45, + "eval_loss": 0.17691320180892944, + "eval_runtime": 580.8883, + "eval_samples_per_second": 25.976, + "eval_steps_per_second": 3.248, + "eval_wer": 1.0278341654322343, + "step": 24600 + }, + { + "epoch": 4.47, + "eval_loss": 0.17671321332454681, + "eval_runtime": 581.8233, + "eval_samples_per_second": 25.934, + "eval_steps_per_second": 3.243, + "eval_wer": 1.0189950195985198, + "step": 24700 + }, + { + "epoch": 4.49, + "eval_loss": 0.17452046275138855, + "eval_runtime": 581.5649, + "eval_samples_per_second": 25.946, + "eval_steps_per_second": 3.245, + "eval_wer": 1.0280962918259238, + "step": 24800 + }, + { + "epoch": 4.5, + "eval_loss": 0.17375342547893524, + "eval_runtime": 581.0408, + "eval_samples_per_second": 25.969, + "eval_steps_per_second": 3.248, + "eval_wer": 1.0355577501021074, + "step": 24900 + }, + { + "epoch": 4.52, + "learning_rate": 0.00021085537490900266, + "loss": 0.1391, + "step": 25000 + }, + { + "epoch": 4.52, + "eval_loss": 0.1780717819929123, + "eval_runtime": 581.6537, + "eval_samples_per_second": 25.942, + "eval_steps_per_second": 3.244, + "eval_wer": 1.0429399608639198, + "step": 25000 + }, + { + "epoch": 4.54, + "eval_loss": 0.17844460904598236, + "eval_runtime": 588.6313, + "eval_samples_per_second": 25.634, + "eval_steps_per_second": 3.206, + "eval_wer": 1.0075894734917064, + "step": 25100 + }, + { + "epoch": 4.56, + "eval_loss": 0.1770990788936615, + "eval_runtime": 581.2924, + "eval_samples_per_second": 25.958, + "eval_steps_per_second": 3.246, + "eval_wer": 1.0156666239949281, + "step": 25200 + }, + { + "epoch": 4.58, + "eval_loss": 0.17579950392246246, + "eval_runtime": 591.9028, + "eval_samples_per_second": 25.492, + "eval_steps_per_second": 3.188, + "eval_wer": 1.033728961308925, + "step": 25300 + }, + { + "epoch": 4.59, + "eval_loss": 0.1758110374212265, + "eval_runtime": 581.3785, + "eval_samples_per_second": 25.954, + "eval_steps_per_second": 3.246, + "eval_wer": 1.0466036344129284, + "step": 25400 + }, + { + "epoch": 4.61, + "learning_rate": 0.00020903542829410336, + "loss": 0.1398, + "step": 25500 + }, + { + "epoch": 4.61, + "eval_loss": 0.1723676174879074, + "eval_runtime": 614.5901, + "eval_samples_per_second": 24.551, + "eval_steps_per_second": 3.07, + "eval_wer": 1.040330888852313, + "step": 25500 + }, + { + "epoch": 4.63, + "eval_loss": 0.17654301226139069, + "eval_runtime": 580.7681, + "eval_samples_per_second": 25.981, + "eval_steps_per_second": 3.249, + "eval_wer": 1.0480727614101182, + "step": 25600 + }, + { + "epoch": 4.65, + "eval_loss": 0.17569170892238617, + "eval_runtime": 619.4473, + "eval_samples_per_second": 24.359, + "eval_steps_per_second": 3.046, + "eval_wer": 1.031979420030114, + "step": 25700 + }, + { + "epoch": 4.67, + "eval_loss": 0.18143196403980255, + "eval_runtime": 581.9906, + "eval_samples_per_second": 25.927, + "eval_steps_per_second": 3.242, + "eval_wer": 1.047877690605512, + "step": 25800 + }, + { + "epoch": 4.69, + "eval_loss": 0.17128212749958038, + "eval_runtime": 607.3729, + "eval_samples_per_second": 24.843, + "eval_steps_per_second": 3.107, + "eval_wer": 1.0251092701303925, + "step": 25900 + }, + { + "epoch": 4.7, + "learning_rate": 0.00020721548167920408, + "loss": 0.1427, + "step": 26000 + }, + { + "epoch": 4.7, + "eval_loss": 0.1734877973794937, + "eval_runtime": 581.7467, + "eval_samples_per_second": 25.937, + "eval_steps_per_second": 3.244, + "eval_wer": 1.0339971836652584, + "step": 26000 + }, + { + "epoch": 4.72, + "eval_loss": 0.1765192449092865, + "eval_runtime": 590.7316, + "eval_samples_per_second": 25.543, + "eval_steps_per_second": 3.194, + "eval_wer": 1.0358198764957969, + "step": 26100 + }, + { + "epoch": 4.74, + "eval_loss": 0.17305831611156464, + "eval_runtime": 582.6945, + "eval_samples_per_second": 25.895, + "eval_steps_per_second": 3.238, + "eval_wer": 1.021975945331407, + "step": 26200 + }, + { + "epoch": 4.76, + "eval_loss": 0.17689305543899536, + "eval_runtime": 596.8319, + "eval_samples_per_second": 25.282, + "eval_steps_per_second": 3.162, + "eval_wer": 1.0261394878172188, + "step": 26300 + }, + { + "epoch": 4.78, + "eval_loss": 0.1746763437986374, + "eval_runtime": 580.7187, + "eval_samples_per_second": 25.983, + "eval_steps_per_second": 3.249, + "eval_wer": 1.013923178678761, + "step": 26400 + }, + { + "epoch": 4.79, + "learning_rate": 0.00020539553506430477, + "loss": 0.1424, + "step": 26500 + }, + { + "epoch": 4.79, + "eval_loss": 0.17905060946941376, + "eval_runtime": 612.0357, + "eval_samples_per_second": 24.654, + "eval_steps_per_second": 3.083, + "eval_wer": 1.040550343507495, + "step": 26500 + }, + { + "epoch": 4.81, + "eval_loss": 0.17353174090385437, + "eval_runtime": 581.1951, + "eval_samples_per_second": 25.962, + "eval_steps_per_second": 3.247, + "eval_wer": 1.0496577116975427, + "step": 26600 + }, + { + "epoch": 4.83, + "eval_loss": 0.17099276185035706, + "eval_runtime": 582.2823, + "eval_samples_per_second": 25.914, + "eval_steps_per_second": 3.241, + "eval_wer": 1.043250854958761, + "step": 26700 + }, + { + "epoch": 4.85, + "eval_loss": 0.1770693063735962, + "eval_runtime": 581.9174, + "eval_samples_per_second": 25.93, + "eval_steps_per_second": 3.243, + "eval_wer": 1.0001828788793183, + "step": 26800 + }, + { + "epoch": 4.87, + "eval_loss": 0.17479608952999115, + "eval_runtime": 605.5155, + "eval_samples_per_second": 24.919, + "eval_steps_per_second": 3.116, + "eval_wer": 1.004645123534683, + "step": 26900 + }, + { + "epoch": 4.88, + "learning_rate": 0.00020357558844940547, + "loss": 0.1419, + "step": 27000 + }, + { + "epoch": 4.88, + "eval_loss": 0.1793585568666458, + "eval_runtime": 579.9597, + "eval_samples_per_second": 26.017, + "eval_steps_per_second": 3.254, + "eval_wer": 1.03324128429741, + "step": 27000 + }, + { + "epoch": 4.9, + "eval_loss": 0.17716261744499207, + "eval_runtime": 589.6493, + "eval_samples_per_second": 25.59, + "eval_steps_per_second": 3.2, + "eval_wer": 1.0557780581920595, + "step": 27100 + }, + { + "epoch": 4.92, + "eval_loss": 0.1757478266954422, + "eval_runtime": 580.361, + "eval_samples_per_second": 25.999, + "eval_steps_per_second": 3.251, + "eval_wer": 1.0477496753899893, + "step": 27200 + }, + { + "epoch": 4.94, + "eval_loss": 0.17353762686252594, + "eval_runtime": 625.2736, + "eval_samples_per_second": 24.132, + "eval_steps_per_second": 3.018, + "eval_wer": 1.0324122333778338, + "step": 27300 + }, + { + "epoch": 4.96, + "eval_loss": 0.17579859495162964, + "eval_runtime": 581.3776, + "eval_samples_per_second": 25.954, + "eval_steps_per_second": 3.246, + "eval_wer": 1.025999280676408, + "step": 27400 + }, + { + "epoch": 4.97, + "learning_rate": 0.00020175564183450617, + "loss": 0.1433, + "step": 27500 + }, + { + "epoch": 4.97, + "eval_loss": 0.17672304809093475, + "eval_runtime": 580.2867, + "eval_samples_per_second": 26.003, + "eval_steps_per_second": 3.252, + "eval_wer": 1.0421535816828515, + "step": 27500 + }, + { + "epoch": 4.99, + "eval_loss": 0.1695006638765335, + "eval_runtime": 579.8433, + "eval_samples_per_second": 26.023, + "eval_steps_per_second": 3.254, + "eval_wer": 1.038587443536146, + "step": 27600 + }, + { + "epoch": 5.01, + "eval_loss": 0.1763276606798172, + "eval_runtime": 691.6775, + "eval_samples_per_second": 21.815, + "eval_steps_per_second": 2.728, + "eval_wer": 1.057052114384643, + "step": 27700 + }, + { + "epoch": 5.03, + "eval_loss": 0.17430032789707184, + "eval_runtime": 582.2365, + "eval_samples_per_second": 25.916, + "eval_steps_per_second": 3.241, + "eval_wer": 1.0366672153033045, + "step": 27800 + }, + { + "epoch": 5.05, + "eval_loss": 0.1804419308900833, + "eval_runtime": 589.7736, + "eval_samples_per_second": 25.584, + "eval_steps_per_second": 3.2, + "eval_wer": 1.0254689319263852, + "step": 27900 + }, + { + "epoch": 5.07, + "learning_rate": 0.00019993933511283668, + "loss": 0.1306, + "step": 28000 + }, + { + "epoch": 5.07, + "eval_loss": 0.1802925318479538, + "eval_runtime": 581.8829, + "eval_samples_per_second": 25.931, + "eval_steps_per_second": 3.243, + "eval_wer": 1.037673049139555, + "step": 28000 + }, + { + "epoch": 5.08, + "eval_loss": 0.17504069209098816, + "eval_runtime": 581.7334, + "eval_samples_per_second": 25.938, + "eval_steps_per_second": 3.244, + "eval_wer": 1.055211133666173, + "step": 28100 + }, + { + "epoch": 5.1, + "eval_loss": 0.17433439195156097, + "eval_runtime": 581.8045, + "eval_samples_per_second": 25.935, + "eval_steps_per_second": 3.243, + "eval_wer": 1.0511573185079521, + "step": 28200 + }, + { + "epoch": 5.12, + "eval_loss": 0.1777062863111496, + "eval_runtime": 581.1315, + "eval_samples_per_second": 25.965, + "eval_steps_per_second": 3.247, + "eval_wer": 1.0583627463530902, + "step": 28300 + }, + { + "epoch": 5.14, + "eval_loss": 0.1725868433713913, + "eval_runtime": 572.8216, + "eval_samples_per_second": 26.342, + "eval_steps_per_second": 3.294, + "eval_wer": 1.0373682510073579, + "step": 28400 + }, + { + "epoch": 5.16, + "learning_rate": 0.0001981193884979374, + "loss": 0.123, + "step": 28500 + }, + { + "epoch": 5.16, + "eval_loss": 0.17764069139957428, + "eval_runtime": 580.2271, + "eval_samples_per_second": 26.005, + "eval_steps_per_second": 3.252, + "eval_wer": 1.0439214108495942, + "step": 28500 + }, + { + "epoch": 5.17, + "eval_loss": 0.17592105269432068, + "eval_runtime": 581.0221, + "eval_samples_per_second": 25.97, + "eval_steps_per_second": 3.248, + "eval_wer": 1.0681955340977671, + "step": 28600 + }, + { + "epoch": 5.19, + "eval_loss": 0.17235223948955536, + "eval_runtime": 580.265, + "eval_samples_per_second": 26.004, + "eval_steps_per_second": 3.252, + "eval_wer": 1.0511207427320886, + "step": 28700 + }, + { + "epoch": 5.21, + "eval_loss": 0.16769592463970184, + "eval_runtime": 590.3886, + "eval_samples_per_second": 25.558, + "eval_steps_per_second": 3.196, + "eval_wer": 1.0559670330340216, + "step": 28800 + }, + { + "epoch": 5.23, + "eval_loss": 0.16985873878002167, + "eval_runtime": 580.2765, + "eval_samples_per_second": 26.003, + "eval_steps_per_second": 3.252, + "eval_wer": 1.0420682382058364, + "step": 28900 + }, + { + "epoch": 5.25, + "learning_rate": 0.00019629944188303807, + "loss": 0.1217, + "step": 29000 + }, + { + "epoch": 5.25, + "eval_loss": 0.18032023310661316, + "eval_runtime": 580.8131, + "eval_samples_per_second": 25.979, + "eval_steps_per_second": 3.249, + "eval_wer": 1.0369781093981456, + "step": 29000 + }, + { + "epoch": 5.26, + "eval_loss": 0.17702044546604156, + "eval_runtime": 582.0629, + "eval_samples_per_second": 25.923, + "eval_steps_per_second": 3.242, + "eval_wer": 1.0473778216687089, + "step": 29100 + }, + { + "epoch": 5.28, + "eval_loss": 0.17327551543712616, + "eval_runtime": 581.4254, + "eval_samples_per_second": 25.952, + "eval_steps_per_second": 3.245, + "eval_wer": 1.0331864206336143, + "step": 29200 + }, + { + "epoch": 5.3, + "eval_loss": 0.17459562420845032, + "eval_runtime": 581.5283, + "eval_samples_per_second": 25.947, + "eval_steps_per_second": 3.245, + "eval_wer": 1.0158312149863145, + "step": 29300 + }, + { + "epoch": 5.32, + "eval_loss": 0.1762886941432953, + "eval_runtime": 581.9585, + "eval_samples_per_second": 25.928, + "eval_steps_per_second": 3.242, + "eval_wer": 1.0341130069554934, + "step": 29400 + }, + { + "epoch": 5.34, + "learning_rate": 0.00019447949526813876, + "loss": 0.1246, + "step": 29500 + }, + { + "epoch": 5.34, + "eval_loss": 0.17754170298576355, + "eval_runtime": 581.4218, + "eval_samples_per_second": 25.952, + "eval_steps_per_second": 3.245, + "eval_wer": 1.034753083033107, + "step": 29500 + }, + { + "epoch": 5.35, + "eval_loss": 0.17297494411468506, + "eval_runtime": 608.3786, + "eval_samples_per_second": 24.802, + "eval_steps_per_second": 3.102, + "eval_wer": 1.0491761306486713, + "step": 29600 + }, + { + "epoch": 5.37, + "eval_loss": 0.17302390933036804, + "eval_runtime": 582.277, + "eval_samples_per_second": 25.914, + "eval_steps_per_second": 3.241, + "eval_wer": 1.0502734039245807, + "step": 29700 + }, + { + "epoch": 5.39, + "eval_loss": 0.17274653911590576, + "eval_runtime": 601.2418, + "eval_samples_per_second": 25.096, + "eval_steps_per_second": 3.139, + "eval_wer": 1.0436958602317685, + "step": 29800 + }, + { + "epoch": 5.41, + "eval_loss": 0.17440034449100494, + "eval_runtime": 582.4042, + "eval_samples_per_second": 25.908, + "eval_steps_per_second": 3.24, + "eval_wer": 1.0539065976603694, + "step": 29900 + }, + { + "epoch": 5.43, + "learning_rate": 0.00019266318854646927, + "loss": 0.127, + "step": 30000 + }, + { + "epoch": 5.43, + "eval_loss": 0.17481261491775513, + "eval_runtime": 585.1655, + "eval_samples_per_second": 25.786, + "eval_steps_per_second": 3.225, + "eval_wer": 1.046311028206019, + "step": 30000 + }, + { + "epoch": 5.44, + "eval_loss": 0.17456230521202087, + "eval_runtime": 668.4648, + "eval_samples_per_second": 22.573, + "eval_steps_per_second": 2.823, + "eval_wer": 1.0554793560225062, + "step": 30100 + }, + { + "epoch": 5.46, + "eval_loss": 0.18095143139362335, + "eval_runtime": 581.559, + "eval_samples_per_second": 25.946, + "eval_steps_per_second": 3.245, + "eval_wer": 1.0557963460799913, + "step": 30200 + }, + { + "epoch": 5.48, + "eval_loss": 0.1773470938205719, + "eval_runtime": 582.2966, + "eval_samples_per_second": 25.913, + "eval_steps_per_second": 3.241, + "eval_wer": 1.0406722627603737, + "step": 30300 + }, + { + "epoch": 5.5, + "eval_loss": 0.1722005307674408, + "eval_runtime": 580.9789, + "eval_samples_per_second": 25.972, + "eval_steps_per_second": 3.248, + "eval_wer": 1.0488530446285425, + "step": 30400 + }, + { + "epoch": 5.52, + "learning_rate": 0.00019084324193156997, + "loss": 0.1276, + "step": 30500 + }, + { + "epoch": 5.52, + "eval_loss": 0.1720392405986786, + "eval_runtime": 582.1568, + "eval_samples_per_second": 25.919, + "eval_steps_per_second": 3.241, + "eval_wer": 1.0520168492407478, + "step": 30500 + }, + { + "epoch": 5.54, + "eval_loss": 0.1776796579360962, + "eval_runtime": 582.2358, + "eval_samples_per_second": 25.916, + "eval_steps_per_second": 3.241, + "eval_wer": 1.0346616435934481, + "step": 30600 + }, + { + "epoch": 5.55, + "eval_loss": 0.16850876808166504, + "eval_runtime": 584.0539, + "eval_samples_per_second": 25.835, + "eval_steps_per_second": 3.231, + "eval_wer": 1.03467993148138, + "step": 30700 + }, + { + "epoch": 5.57, + "eval_loss": 0.16591408848762512, + "eval_runtime": 583.1779, + "eval_samples_per_second": 25.874, + "eval_steps_per_second": 3.236, + "eval_wer": 1.0338082088232963, + "step": 30800 + }, + { + "epoch": 5.59, + "eval_loss": 0.17562197148799896, + "eval_runtime": 585.3902, + "eval_samples_per_second": 25.776, + "eval_steps_per_second": 3.223, + "eval_wer": 1.0228232841389149, + "step": 30900 + }, + { + "epoch": 5.61, + "learning_rate": 0.0001890232953166707, + "loss": 0.1246, + "step": 31000 + }, + { + "epoch": 5.61, + "eval_loss": 0.1716947704553604, + "eval_runtime": 580.9184, + "eval_samples_per_second": 25.974, + "eval_steps_per_second": 3.248, + "eval_wer": 1.040855141639692, + "step": 31000 + }, + { + "epoch": 5.63, + "eval_loss": 0.17640528082847595, + "eval_runtime": 581.1871, + "eval_samples_per_second": 25.962, + "eval_steps_per_second": 3.247, + "eval_wer": 1.0201654444261565, + "step": 31100 + }, + { + "epoch": 5.64, + "eval_loss": 0.16931375861167908, + "eval_runtime": 582.1998, + "eval_samples_per_second": 25.917, + "eval_steps_per_second": 3.241, + "eval_wer": 1.0314368793548032, + "step": 31200 + }, + { + "epoch": 5.66, + "eval_loss": 0.17311854660511017, + "eval_runtime": 581.8005, + "eval_samples_per_second": 25.935, + "eval_steps_per_second": 3.243, + "eval_wer": 1.0319184604036746, + "step": 31300 + }, + { + "epoch": 5.68, + "eval_loss": 0.16878977417945862, + "eval_runtime": 580.1048, + "eval_samples_per_second": 26.011, + "eval_steps_per_second": 3.253, + "eval_wer": 1.0380388068981914, + "step": 31400 + }, + { + "epoch": 5.7, + "learning_rate": 0.00018720334870177139, + "loss": 0.1271, + "step": 31500 + }, + { + "epoch": 5.7, + "eval_loss": 0.16712072491645813, + "eval_runtime": 580.9082, + "eval_samples_per_second": 25.975, + "eval_steps_per_second": 3.248, + "eval_wer": 1.0349908255762208, + "step": 31500 + }, + { + "epoch": 5.72, + "eval_loss": 0.1675543487071991, + "eval_runtime": 581.5005, + "eval_samples_per_second": 25.948, + "eval_steps_per_second": 3.245, + "eval_wer": 1.043025304340935, + "step": 31600 + }, + { + "epoch": 5.73, + "eval_loss": 0.16557875275611877, + "eval_runtime": 592.5273, + "eval_samples_per_second": 25.465, + "eval_steps_per_second": 3.185, + "eval_wer": 1.0440738099156928, + "step": 31700 + }, + { + "epoch": 5.75, + "eval_loss": 0.16642601788043976, + "eval_runtime": 582.1063, + "eval_samples_per_second": 25.921, + "eval_steps_per_second": 3.242, + "eval_wer": 1.0403126009643813, + "step": 31800 + }, + { + "epoch": 5.77, + "eval_loss": 0.16907727718353271, + "eval_runtime": 581.4123, + "eval_samples_per_second": 25.952, + "eval_steps_per_second": 3.246, + "eval_wer": 1.015185042946057, + "step": 31900 + }, + { + "epoch": 5.79, + "learning_rate": 0.0001853834020868721, + "loss": 0.1259, + "step": 32000 + }, + { + "epoch": 5.79, + "eval_loss": 0.17020300030708313, + "eval_runtime": 581.9961, + "eval_samples_per_second": 25.926, + "eval_steps_per_second": 3.242, + "eval_wer": 1.0017556372414549, + "step": 32000 + }, + { + "epoch": 5.81, + "eval_loss": 0.16643249988555908, + "eval_runtime": 580.5409, + "eval_samples_per_second": 25.991, + "eval_steps_per_second": 3.25, + "eval_wer": 1.024554537529794, + "step": 32100 + }, + { + "epoch": 5.82, + "eval_loss": 0.17374736070632935, + "eval_runtime": 581.8721, + "eval_samples_per_second": 25.932, + "eval_steps_per_second": 3.243, + "eval_wer": 1.0339545119267508, + "step": 32200 + }, + { + "epoch": 5.84, + "eval_loss": 0.17424912750720978, + "eval_runtime": 581.9636, + "eval_samples_per_second": 25.928, + "eval_steps_per_second": 3.242, + "eval_wer": 1.0448906689099808, + "step": 32300 + }, + { + "epoch": 5.86, + "eval_loss": 0.170697420835495, + "eval_runtime": 581.919, + "eval_samples_per_second": 25.93, + "eval_steps_per_second": 3.243, + "eval_wer": 1.0279012210213176, + "step": 32400 + }, + { + "epoch": 5.88, + "learning_rate": 0.0001835634554719728, + "loss": 0.1273, + "step": 32500 + }, + { + "epoch": 5.88, + "eval_loss": 0.16966979205608368, + "eval_runtime": 573.0944, + "eval_samples_per_second": 26.329, + "eval_steps_per_second": 3.293, + "eval_wer": 1.0470852154617996, + "step": 32500 + }, + { + "epoch": 5.9, + "eval_loss": 0.16675007343292236, + "eval_runtime": 583.4412, + "eval_samples_per_second": 25.862, + "eval_steps_per_second": 3.234, + "eval_wer": 1.0322171625732277, + "step": 32600 + }, + { + "epoch": 5.92, + "eval_loss": 0.17055776715278625, + "eval_runtime": 582.1651, + "eval_samples_per_second": 25.919, + "eval_steps_per_second": 3.241, + "eval_wer": 1.037782776467146, + "step": 32700 + }, + { + "epoch": 5.93, + "eval_loss": 0.17042866349220276, + "eval_runtime": 582.8815, + "eval_samples_per_second": 25.887, + "eval_steps_per_second": 3.237, + "eval_wer": 1.0350274013520846, + "step": 32800 + }, + { + "epoch": 5.95, + "eval_loss": 0.17252954840660095, + "eval_runtime": 583.3586, + "eval_samples_per_second": 25.866, + "eval_steps_per_second": 3.235, + "eval_wer": 1.0244021384636954, + "step": 32900 + }, + { + "epoch": 5.97, + "learning_rate": 0.00018174350885707353, + "loss": 0.123, + "step": 33000 + }, + { + "epoch": 5.97, + "eval_loss": 0.16781975328922272, + "eval_runtime": 581.176, + "eval_samples_per_second": 25.963, + "eval_steps_per_second": 3.247, + "eval_wer": 1.044683406180087, + "step": 33000 + }, + { + "epoch": 5.99, + "eval_loss": 0.1680649071931839, + "eval_runtime": 583.9517, + "eval_samples_per_second": 25.839, + "eval_steps_per_second": 3.231, + "eval_wer": 1.0438177794846473, + "step": 33100 + }, + { + "epoch": 6.01, + "eval_loss": 0.16894467175006866, + "eval_runtime": 582.6025, + "eval_samples_per_second": 25.899, + "eval_steps_per_second": 3.239, + "eval_wer": 1.0297117219265681, + "step": 33200 + }, + { + "epoch": 6.02, + "eval_loss": 0.1690208464860916, + "eval_runtime": 582.3983, + "eval_samples_per_second": 25.908, + "eval_steps_per_second": 3.24, + "eval_wer": 1.0333388196997129, + "step": 33300 + }, + { + "epoch": 6.04, + "eval_loss": 0.173419788479805, + "eval_runtime": 582.2669, + "eval_samples_per_second": 25.914, + "eval_steps_per_second": 3.241, + "eval_wer": 1.0296324744121967, + "step": 33400 + }, + { + "epoch": 6.06, + "learning_rate": 0.00017992356224217422, + "loss": 0.1163, + "step": 33500 + }, + { + "epoch": 6.06, + "eval_loss": 0.1748138964176178, + "eval_runtime": 582.5758, + "eval_samples_per_second": 25.9, + "eval_steps_per_second": 3.239, + "eval_wer": 1.03073584365075, + "step": 33500 + }, + { + "epoch": 6.08, + "eval_loss": 0.17153716087341309, + "eval_runtime": 588.9678, + "eval_samples_per_second": 25.619, + "eval_steps_per_second": 3.204, + "eval_wer": 1.0122528849143213, + "step": 33600 + }, + { + "epoch": 6.1, + "eval_loss": 0.16684116423130035, + "eval_runtime": 581.9585, + "eval_samples_per_second": 25.928, + "eval_steps_per_second": 3.242, + "eval_wer": 1.011655480575215, + "step": 33700 + }, + { + "epoch": 6.11, + "eval_loss": 0.1689983457326889, + "eval_runtime": 580.6755, + "eval_samples_per_second": 25.985, + "eval_steps_per_second": 3.25, + "eval_wer": 1.0229634912797254, + "step": 33800 + }, + { + "epoch": 6.13, + "eval_loss": 0.16927799582481384, + "eval_runtime": 581.3775, + "eval_samples_per_second": 25.954, + "eval_steps_per_second": 3.246, + "eval_wer": 1.0165688264662314, + "step": 33900 + }, + { + "epoch": 6.15, + "learning_rate": 0.00017810361562727492, + "loss": 0.1101, + "step": 34000 + }, + { + "epoch": 6.15, + "eval_loss": 0.17283213138580322, + "eval_runtime": 581.7575, + "eval_samples_per_second": 25.937, + "eval_steps_per_second": 3.244, + "eval_wer": 1.0161664929317313, + "step": 34000 + }, + { + "epoch": 6.17, + "eval_loss": 0.16832078993320465, + "eval_runtime": 593.7449, + "eval_samples_per_second": 25.413, + "eval_steps_per_second": 3.178, + "eval_wer": 1.0107167023280481, + "step": 34100 + }, + { + "epoch": 6.19, + "eval_loss": 0.17034588754177094, + "eval_runtime": 581.571, + "eval_samples_per_second": 25.945, + "eval_steps_per_second": 3.245, + "eval_wer": 0.9813646421974727, + "step": 34200 + }, + { + "epoch": 6.2, + "eval_loss": 0.16915497183799744, + "eval_runtime": 584.1319, + "eval_samples_per_second": 25.831, + "eval_steps_per_second": 3.23, + "eval_wer": 1.0007437074425607, + "step": 34300 + }, + { + "epoch": 6.22, + "eval_loss": 0.16902200877666473, + "eval_runtime": 579.9055, + "eval_samples_per_second": 26.02, + "eval_steps_per_second": 3.254, + "eval_wer": 0.9999695201867803, + "step": 34400 + }, + { + "epoch": 6.24, + "learning_rate": 0.00017629094879883522, + "loss": 0.1118, + "step": 34500 + }, + { + "epoch": 6.24, + "eval_loss": 0.1733812838792801, + "eval_runtime": 641.6204, + "eval_samples_per_second": 23.517, + "eval_steps_per_second": 2.941, + "eval_wer": 0.9971958571837872, + "step": 34500 + }, + { + "epoch": 6.26, + "eval_loss": 0.17394082248210907, + "eval_runtime": 583.4185, + "eval_samples_per_second": 25.863, + "eval_steps_per_second": 3.234, + "eval_wer": 1.0096438129027145, + "step": 34600 + }, + { + "epoch": 6.28, + "eval_loss": 0.17487762868404388, + "eval_runtime": 586.9087, + "eval_samples_per_second": 25.709, + "eval_steps_per_second": 3.215, + "eval_wer": 1.0046695073852587, + "step": 34700 + }, + { + "epoch": 6.3, + "eval_loss": 0.17093946039676666, + "eval_runtime": 647.3178, + "eval_samples_per_second": 23.31, + "eval_steps_per_second": 2.915, + "eval_wer": 1.0111068439372604, + "step": 34800 + }, + { + "epoch": 6.31, + "eval_loss": 0.17170192301273346, + "eval_runtime": 816.7662, + "eval_samples_per_second": 18.474, + "eval_steps_per_second": 2.31, + "eval_wer": 1.0179038422852544, + "step": 34900 + }, + { + "epoch": 6.33, + "learning_rate": 0.00017447100218393594, + "loss": 0.1153, + "step": 35000 + }, + { + "epoch": 6.33, + "eval_loss": 0.16898946464061737, + "eval_runtime": 581.8044, + "eval_samples_per_second": 25.935, + "eval_steps_per_second": 3.243, + "eval_wer": 1.0155142249288296, + "step": 35000 + }, + { + "epoch": 6.35, + "eval_loss": 0.17097432911396027, + "eval_runtime": 580.1808, + "eval_samples_per_second": 26.007, + "eval_steps_per_second": 3.252, + "eval_wer": 1.0143803758770567, + "step": 35100 + }, + { + "epoch": 6.37, + "eval_loss": 0.1719246357679367, + "eval_runtime": 580.9111, + "eval_samples_per_second": 25.975, + "eval_steps_per_second": 3.248, + "eval_wer": 1.0030418853593266, + "step": 35200 + }, + { + "epoch": 6.39, + "eval_loss": 0.1690385490655899, + "eval_runtime": 650.929, + "eval_samples_per_second": 23.181, + "eval_steps_per_second": 2.899, + "eval_wer": 1.02722456916784, + "step": 35300 + }, + { + "epoch": 6.4, + "eval_loss": 0.16729648411273956, + "eval_runtime": 581.1582, + "eval_samples_per_second": 25.964, + "eval_steps_per_second": 3.247, + "eval_wer": 1.0103387526441239, + "step": 35400 + }, + { + "epoch": 6.42, + "learning_rate": 0.00017265105556903663, + "loss": 0.1106, + "step": 35500 + }, + { + "epoch": 6.42, + "eval_loss": 0.1710328310728073, + "eval_runtime": 601.8486, + "eval_samples_per_second": 25.071, + "eval_steps_per_second": 3.135, + "eval_wer": 1.0222136878745207, + "step": 35500 + }, + { + "epoch": 6.44, + "eval_loss": 0.17468269169330597, + "eval_runtime": 590.7957, + "eval_samples_per_second": 25.54, + "eval_steps_per_second": 3.194, + "eval_wer": 1.0172881500582165, + "step": 35600 + }, + { + "epoch": 6.46, + "eval_loss": 0.17207881808280945, + "eval_runtime": 632.0801, + "eval_samples_per_second": 23.872, + "eval_steps_per_second": 2.985, + "eval_wer": 0.9932578653158013, + "step": 35700 + }, + { + "epoch": 6.48, + "eval_loss": 0.1670292764902115, + "eval_runtime": 582.7073, + "eval_samples_per_second": 25.895, + "eval_steps_per_second": 3.238, + "eval_wer": 1.018354943520906, + "step": 35800 + }, + { + "epoch": 6.49, + "eval_loss": 0.17143051326274872, + "eval_runtime": 594.2992, + "eval_samples_per_second": 25.39, + "eval_steps_per_second": 3.175, + "eval_wer": 1.0122224051011015, + "step": 35900 + }, + { + "epoch": 6.51, + "learning_rate": 0.00017083110895413733, + "loss": 0.1116, + "step": 36000 + }, + { + "epoch": 6.51, + "eval_loss": 0.17166104912757874, + "eval_runtime": 581.3301, + "eval_samples_per_second": 25.956, + "eval_steps_per_second": 3.246, + "eval_wer": 1.0034929865949782, + "step": 36000 + }, + { + "epoch": 6.53, + "eval_loss": 0.16851219534873962, + "eval_runtime": 794.8894, + "eval_samples_per_second": 18.983, + "eval_steps_per_second": 2.374, + "eval_wer": 1.009893747371116, + "step": 36100 + }, + { + "epoch": 6.55, + "eval_loss": 0.16873739659786224, + "eval_runtime": 642.5817, + "eval_samples_per_second": 23.482, + "eval_steps_per_second": 2.937, + "eval_wer": 1.0288217113805527, + "step": 36200 + }, + { + "epoch": 6.57, + "eval_loss": 0.16639259457588196, + "eval_runtime": 582.0547, + "eval_samples_per_second": 25.924, + "eval_steps_per_second": 3.242, + "eval_wer": 1.0313881116536519, + "step": 36300 + }, + { + "epoch": 6.58, + "eval_loss": 0.16646970808506012, + "eval_runtime": 581.4585, + "eval_samples_per_second": 25.95, + "eval_steps_per_second": 3.245, + "eval_wer": 1.0263589424724004, + "step": 36400 + }, + { + "epoch": 6.6, + "learning_rate": 0.00016901116233923805, + "loss": 0.1128, + "step": 36500 + }, + { + "epoch": 6.6, + "eval_loss": 0.16809915006160736, + "eval_runtime": 841.9975, + "eval_samples_per_second": 17.92, + "eval_steps_per_second": 2.241, + "eval_wer": 1.041995086654109, + "step": 36500 + }, + { + "epoch": 6.62, + "eval_loss": 0.1682288646697998, + "eval_runtime": 581.315, + "eval_samples_per_second": 25.957, + "eval_steps_per_second": 3.246, + "eval_wer": 1.0408856214529116, + "step": 36600 + }, + { + "epoch": 6.64, + "eval_loss": 0.17166656255722046, + "eval_runtime": 596.6613, + "eval_samples_per_second": 25.289, + "eval_steps_per_second": 3.163, + "eval_wer": 1.0270538822138098, + "step": 36700 + }, + { + "epoch": 6.66, + "eval_loss": 0.17169848084449768, + "eval_runtime": 580.5042, + "eval_samples_per_second": 25.993, + "eval_steps_per_second": 3.251, + "eval_wer": 1.0165993062794512, + "step": 36800 + }, + { + "epoch": 6.68, + "eval_loss": 0.1754983514547348, + "eval_runtime": 667.9005, + "eval_samples_per_second": 22.592, + "eval_steps_per_second": 2.825, + "eval_wer": 1.0174527410496028, + "step": 36900 + }, + { + "epoch": 6.69, + "learning_rate": 0.00016719121572433872, + "loss": 0.1134, + "step": 37000 + }, + { + "epoch": 6.69, + "eval_loss": 0.16234032809734344, + "eval_runtime": 661.7885, + "eval_samples_per_second": 22.8, + "eval_steps_per_second": 2.851, + "eval_wer": 1.0185012466243606, + "step": 37000 + }, + { + "epoch": 6.71, + "eval_loss": 0.16741453111171722, + "eval_runtime": 591.6954, + "eval_samples_per_second": 25.501, + "eval_steps_per_second": 3.189, + "eval_wer": 1.0301811110501515, + "step": 37100 + }, + { + "epoch": 6.73, + "eval_loss": 0.16326996684074402, + "eval_runtime": 606.6342, + "eval_samples_per_second": 24.873, + "eval_steps_per_second": 3.111, + "eval_wer": 1.0324670970416294, + "step": 37200 + }, + { + "epoch": 6.75, + "eval_loss": 0.1627754420042038, + "eval_runtime": 925.563, + "eval_samples_per_second": 16.303, + "eval_steps_per_second": 2.039, + "eval_wer": 1.0228171881762709, + "step": 37300 + }, + { + "epoch": 6.77, + "eval_loss": 0.16362273693084717, + "eval_runtime": 699.1407, + "eval_samples_per_second": 21.582, + "eval_steps_per_second": 2.699, + "eval_wer": 1.024261931322885, + "step": 37400 + }, + { + "epoch": 6.78, + "learning_rate": 0.00016537126910943944, + "loss": 0.1102, + "step": 37500 + }, + { + "epoch": 6.78, + "eval_loss": 0.16669456660747528, + "eval_runtime": 583.9747, + "eval_samples_per_second": 25.838, + "eval_steps_per_second": 3.231, + "eval_wer": 1.0282304030040903, + "step": 37500 + }, + { + "epoch": 6.8, + "eval_loss": 0.16227515041828156, + "eval_runtime": 588.9317, + "eval_samples_per_second": 25.621, + "eval_steps_per_second": 3.204, + "eval_wer": 1.0212078540382705, + "step": 37600 + }, + { + "epoch": 6.82, + "eval_loss": 0.1639271229505539, + "eval_runtime": 594.657, + "eval_samples_per_second": 25.374, + "eval_steps_per_second": 3.173, + "eval_wer": 1.0139536584919808, + "step": 37700 + }, + { + "epoch": 6.84, + "eval_loss": 0.15872186422348022, + "eval_runtime": 632.8508, + "eval_samples_per_second": 23.843, + "eval_steps_per_second": 2.982, + "eval_wer": 1.0258285937223777, + "step": 37800 + }, + { + "epoch": 6.86, + "eval_loss": 0.16100141406059265, + "eval_runtime": 983.2839, + "eval_samples_per_second": 15.346, + "eval_steps_per_second": 1.919, + "eval_wer": 1.0087050346555477, + "step": 37900 + }, + { + "epoch": 6.87, + "learning_rate": 0.00016355132249454014, + "loss": 0.1113, + "step": 38000 + }, + { + "epoch": 6.87, + "eval_loss": 0.1646973341703415, + "eval_runtime": 599.5992, + "eval_samples_per_second": 25.165, + "eval_steps_per_second": 3.147, + "eval_wer": 1.0199277018830428, + "step": 38000 + }, + { + "epoch": 6.89, + "eval_loss": 0.16088496148586273, + "eval_runtime": 1148.6193, + "eval_samples_per_second": 13.137, + "eval_steps_per_second": 1.643, + "eval_wer": 1.005364447126668, + "step": 38100 + }, + { + "epoch": 6.91, + "eval_loss": 0.16020412743091583, + "eval_runtime": 638.6985, + "eval_samples_per_second": 23.625, + "eval_steps_per_second": 2.954, + "eval_wer": 1.0145205830178672, + "step": 38200 + }, + { + "epoch": 6.93, + "eval_loss": 0.16017159819602966, + "eval_runtime": 590.1313, + "eval_samples_per_second": 25.569, + "eval_steps_per_second": 3.198, + "eval_wer": 1.014435239540852, + "step": 38300 + }, + { + "epoch": 6.95, + "eval_loss": 0.16017083823680878, + "eval_runtime": 583.7731, + "eval_samples_per_second": 25.847, + "eval_steps_per_second": 3.232, + "eval_wer": 1.0374840742975926, + "step": 38400 + }, + { + "epoch": 6.96, + "learning_rate": 0.00016173137587964084, + "loss": 0.1071, + "step": 38500 + }, + { + "epoch": 6.96, + "eval_loss": 0.15924811363220215, + "eval_runtime": 644.5353, + "eval_samples_per_second": 23.411, + "eval_steps_per_second": 2.928, + "eval_wer": 1.0259261291246806, + "step": 38500 + }, + { + "epoch": 6.98, + "eval_loss": 0.16121791303157806, + "eval_runtime": 583.6652, + "eval_samples_per_second": 25.852, + "eval_steps_per_second": 3.233, + "eval_wer": 1.0235608956188316, + "step": 38600 + }, + { + "epoch": 7.0, + "eval_loss": 0.16208681464195251, + "eval_runtime": 586.5854, + "eval_samples_per_second": 25.723, + "eval_steps_per_second": 3.217, + "eval_wer": 1.0276695744408477, + "step": 38700 + }, + { + "epoch": 7.02, + "eval_loss": 0.1668541133403778, + "eval_runtime": 583.1032, + "eval_samples_per_second": 25.877, + "eval_steps_per_second": 3.236, + "eval_wer": 1.0367281749297441, + "step": 38800 + }, + { + "epoch": 7.04, + "eval_loss": 0.17419211566448212, + "eval_runtime": 647.5268, + "eval_samples_per_second": 23.303, + "eval_steps_per_second": 2.914, + "eval_wer": 1.0484324232061106, + "step": 38900 + }, + { + "epoch": 7.05, + "learning_rate": 0.00015991142926474156, + "loss": 0.1062, + "step": 39000 + }, + { + "epoch": 7.05, + "eval_loss": 0.17524433135986328, + "eval_runtime": 582.9109, + "eval_samples_per_second": 25.886, + "eval_steps_per_second": 3.237, + "eval_wer": 1.0301567271995757, + "step": 39000 + }, + { + "epoch": 7.07, + "eval_loss": 0.16763833165168762, + "eval_runtime": 832.1716, + "eval_samples_per_second": 18.132, + "eval_steps_per_second": 2.268, + "eval_wer": 1.024444810202203, + "step": 39100 + }, + { + "epoch": 7.09, + "eval_loss": 0.17226064205169678, + "eval_runtime": 584.5325, + "eval_samples_per_second": 25.814, + "eval_steps_per_second": 3.228, + "eval_wer": 1.0300104240961212, + "step": 39200 + }, + { + "epoch": 7.11, + "eval_loss": 0.1727043092250824, + "eval_runtime": 732.8624, + "eval_samples_per_second": 20.589, + "eval_steps_per_second": 2.575, + "eval_wer": 1.0293886359064393, + "step": 39300 + }, + { + "epoch": 7.13, + "eval_loss": 0.17107614874839783, + "eval_runtime": 583.7282, + "eval_samples_per_second": 25.849, + "eval_steps_per_second": 3.233, + "eval_wer": 1.025475027889029, + "step": 39400 + }, + { + "epoch": 7.15, + "learning_rate": 0.00015809512254307204, + "loss": 0.1021, + "step": 39500 + }, + { + "epoch": 7.15, + "eval_loss": 0.16992105543613434, + "eval_runtime": 585.4315, + "eval_samples_per_second": 25.774, + "eval_steps_per_second": 3.223, + "eval_wer": 1.0471156952750194, + "step": 39500 + }, + { + "epoch": 7.16, + "eval_loss": 0.1682046800851822, + "eval_runtime": 583.7765, + "eval_samples_per_second": 25.847, + "eval_steps_per_second": 3.232, + "eval_wer": 1.0425742031052834, + "step": 39600 + }, + { + "epoch": 7.18, + "eval_loss": 0.17128342390060425, + "eval_runtime": 681.9553, + "eval_samples_per_second": 22.126, + "eval_steps_per_second": 2.767, + "eval_wer": 1.0233353450010059, + "step": 39700 + }, + { + "epoch": 7.2, + "eval_loss": 0.16821503639221191, + "eval_runtime": 662.0353, + "eval_samples_per_second": 22.792, + "eval_steps_per_second": 2.85, + "eval_wer": 1.0259139371993928, + "step": 39800 + }, + { + "epoch": 7.22, + "eval_loss": 0.17101679742336273, + "eval_runtime": 602.057, + "eval_samples_per_second": 25.062, + "eval_steps_per_second": 3.134, + "eval_wer": 1.0161725888943753, + "step": 39900 + }, + { + "epoch": 7.24, + "learning_rate": 0.00015627881582140255, + "loss": 0.103, + "step": 40000 + }, + { + "epoch": 7.24, + "eval_loss": 0.17253848910331726, + "eval_runtime": 585.651, + "eval_samples_per_second": 25.764, + "eval_steps_per_second": 3.222, + "eval_wer": 1.0282730747425979, + "step": 40000 + }, + { + "epoch": 7.25, + "eval_loss": 0.1728762835264206, + "eval_runtime": 997.1851, + "eval_samples_per_second": 15.132, + "eval_steps_per_second": 1.892, + "eval_wer": 1.0263650384350445, + "step": 40100 + }, + { + "epoch": 7.27, + "eval_loss": 0.16648218035697937, + "eval_runtime": 648.7615, + "eval_samples_per_second": 23.258, + "eval_steps_per_second": 2.909, + "eval_wer": 1.045085739714587, + "step": 40200 + }, + { + "epoch": 7.29, + "eval_loss": 0.16705408692359924, + "eval_runtime": 587.011, + "eval_samples_per_second": 25.705, + "eval_steps_per_second": 3.215, + "eval_wer": 1.0386179233493658, + "step": 40300 + }, + { + "epoch": 7.31, + "eval_loss": 0.1670595407485962, + "eval_runtime": 581.7984, + "eval_samples_per_second": 25.935, + "eval_steps_per_second": 3.243, + "eval_wer": 1.0316014703461898, + "step": 40400 + }, + { + "epoch": 7.33, + "learning_rate": 0.00015445886920650325, + "loss": 0.0981, + "step": 40500 + }, + { + "epoch": 7.33, + "eval_loss": 0.17082154750823975, + "eval_runtime": 644.8212, + "eval_samples_per_second": 23.4, + "eval_steps_per_second": 2.926, + "eval_wer": 1.0256761946562791, + "step": 40500 + }, + { + "epoch": 7.34, + "eval_loss": 0.16420403122901917, + "eval_runtime": 584.3525, + "eval_samples_per_second": 25.822, + "eval_steps_per_second": 3.229, + "eval_wer": 1.0152033308339887, + "step": 40600 + }, + { + "epoch": 7.36, + "eval_loss": 0.1707213968038559, + "eval_runtime": 598.9814, + "eval_samples_per_second": 25.191, + "eval_steps_per_second": 3.15, + "eval_wer": 1.0110215004602452, + "step": 40700 + }, + { + "epoch": 7.38, + "eval_loss": 0.1675441563129425, + "eval_runtime": 586.7024, + "eval_samples_per_second": 25.718, + "eval_steps_per_second": 3.216, + "eval_wer": 1.0185561102881562, + "step": 40800 + }, + { + "epoch": 7.4, + "eval_loss": 0.17023596167564392, + "eval_runtime": 713.0578, + "eval_samples_per_second": 21.161, + "eval_steps_per_second": 2.646, + "eval_wer": 1.012277268764897, + "step": 40900 + }, + { + "epoch": 7.42, + "learning_rate": 0.00015263892259160397, + "loss": 0.1005, + "step": 41000 + }, + { + "epoch": 7.42, + "eval_loss": 0.16991430521011353, + "eval_runtime": 583.1849, + "eval_samples_per_second": 25.873, + "eval_steps_per_second": 3.236, + "eval_wer": 1.0159287503886176, + "step": 41000 + }, + { + "epoch": 7.43, + "eval_loss": 0.1702755093574524, + "eval_runtime": 586.1073, + "eval_samples_per_second": 25.744, + "eval_steps_per_second": 3.22, + "eval_wer": 1.0219271776302554, + "step": 41100 + }, + { + "epoch": 7.45, + "eval_loss": 0.17067919671535492, + "eval_runtime": 588.7524, + "eval_samples_per_second": 25.629, + "eval_steps_per_second": 3.205, + "eval_wer": 1.019385161207732, + "step": 41200 + }, + { + "epoch": 7.47, + "eval_loss": 0.16438345611095428, + "eval_runtime": 813.104, + "eval_samples_per_second": 18.557, + "eval_steps_per_second": 2.321, + "eval_wer": 1.0016215260632884, + "step": 41300 + }, + { + "epoch": 7.49, + "eval_loss": 0.17156347632408142, + "eval_runtime": 608.2034, + "eval_samples_per_second": 24.809, + "eval_steps_per_second": 3.103, + "eval_wer": 0.9941478758618167, + "step": 41400 + }, + { + "epoch": 7.51, + "learning_rate": 0.00015081897597670466, + "loss": 0.1021, + "step": 41500 + }, + { + "epoch": 7.51, + "eval_loss": 0.16701160371303558, + "eval_runtime": 580.9378, + "eval_samples_per_second": 25.974, + "eval_steps_per_second": 3.248, + "eval_wer": 1.0159470382765494, + "step": 41500 + }, + { + "epoch": 7.53, + "eval_loss": 0.16667711734771729, + "eval_runtime": 580.8947, + "eval_samples_per_second": 25.975, + "eval_steps_per_second": 3.248, + "eval_wer": 1.003291819827728, + "step": 41600 + }, + { + "epoch": 7.54, + "eval_loss": 0.1667308658361435, + "eval_runtime": 738.8402, + "eval_samples_per_second": 20.423, + "eval_steps_per_second": 2.554, + "eval_wer": 1.0175624683771938, + "step": 41700 + }, + { + "epoch": 7.56, + "eval_loss": 0.16792383790016174, + "eval_runtime": 721.671, + "eval_samples_per_second": 20.908, + "eval_steps_per_second": 2.615, + "eval_wer": 1.0193790652450883, + "step": 41800 + }, + { + "epoch": 7.58, + "eval_loss": 0.1631632000207901, + "eval_runtime": 591.7115, + "eval_samples_per_second": 25.501, + "eval_steps_per_second": 3.189, + "eval_wer": 1.0418426875880105, + "step": 41900 + }, + { + "epoch": 7.6, + "learning_rate": 0.0001489990293618054, + "loss": 0.0963, + "step": 42000 + }, + { + "epoch": 7.6, + "eval_loss": 0.17123085260391235, + "eval_runtime": 592.0783, + "eval_samples_per_second": 25.485, + "eval_steps_per_second": 3.187, + "eval_wer": 1.0152399066098523, + "step": 42000 + }, + { + "epoch": 7.62, + "eval_loss": 0.16319897770881653, + "eval_runtime": 838.4842, + "eval_samples_per_second": 17.996, + "eval_steps_per_second": 2.25, + "eval_wer": 1.0364477606481228, + "step": 42100 + }, + { + "epoch": 7.63, + "eval_loss": 0.17024168372154236, + "eval_runtime": 1184.0841, + "eval_samples_per_second": 12.743, + "eval_steps_per_second": 1.594, + "eval_wer": 1.0228598599147785, + "step": 42200 + }, + { + "epoch": 7.65, + "eval_loss": 0.1655167192220688, + "eval_runtime": 581.3081, + "eval_samples_per_second": 25.957, + "eval_steps_per_second": 3.246, + "eval_wer": 1.0178733624720349, + "step": 42300 + }, + { + "epoch": 7.67, + "eval_loss": 0.16978418827056885, + "eval_runtime": 580.4103, + "eval_samples_per_second": 25.997, + "eval_steps_per_second": 3.251, + "eval_wer": 1.0329425821278566, + "step": 42400 + }, + { + "epoch": 7.69, + "learning_rate": 0.00014717908274690608, + "loss": 0.1014, + "step": 42500 + }, + { + "epoch": 7.69, + "eval_loss": 0.1691199243068695, + "eval_runtime": 715.0503, + "eval_samples_per_second": 21.102, + "eval_steps_per_second": 2.639, + "eval_wer": 1.0398432118407979, + "step": 42500 + }, + { + "epoch": 7.71, + "eval_loss": 0.1637689173221588, + "eval_runtime": 790.6965, + "eval_samples_per_second": 19.083, + "eval_steps_per_second": 2.387, + "eval_wer": 1.0486945495998001, + "step": 42600 + }, + { + "epoch": 7.72, + "eval_loss": 0.16167329251766205, + "eval_runtime": 591.7835, + "eval_samples_per_second": 25.497, + "eval_steps_per_second": 3.189, + "eval_wer": 1.0210066872710204, + "step": 42700 + }, + { + "epoch": 7.74, + "eval_loss": 0.1647609919309616, + "eval_runtime": 595.5162, + "eval_samples_per_second": 25.338, + "eval_steps_per_second": 3.169, + "eval_wer": 1.0123504203166243, + "step": 42800 + }, + { + "epoch": 7.76, + "eval_loss": 0.16076742112636566, + "eval_runtime": 849.0674, + "eval_samples_per_second": 17.771, + "eval_steps_per_second": 2.222, + "eval_wer": 1.0202142121273081, + "step": 42900 + }, + { + "epoch": 7.78, + "learning_rate": 0.00014535913613200678, + "loss": 0.1008, + "step": 43000 + }, + { + "epoch": 7.78, + "eval_loss": 0.1611439436674118, + "eval_runtime": 692.2883, + "eval_samples_per_second": 21.796, + "eval_steps_per_second": 2.726, + "eval_wer": 1.0353261035216377, + "step": 43000 + }, + { + "epoch": 7.8, + "eval_loss": 0.16334283351898193, + "eval_runtime": 587.0659, + "eval_samples_per_second": 25.702, + "eval_steps_per_second": 3.214, + "eval_wer": 1.0319123644410306, + "step": 43100 + }, + { + "epoch": 7.81, + "eval_loss": 0.16403447091579437, + "eval_runtime": 603.3209, + "eval_samples_per_second": 25.01, + "eval_steps_per_second": 3.128, + "eval_wer": 1.0031577086495613, + "step": 43200 + }, + { + "epoch": 7.83, + "eval_loss": 0.15894734859466553, + "eval_runtime": 900.4737, + "eval_samples_per_second": 16.757, + "eval_steps_per_second": 2.096, + "eval_wer": 0.9984821053016587, + "step": 43300 + }, + { + "epoch": 7.85, + "eval_loss": 0.16296441853046417, + "eval_runtime": 734.1091, + "eval_samples_per_second": 20.554, + "eval_steps_per_second": 2.57, + "eval_wer": 0.9975372310918479, + "step": 43400 + }, + { + "epoch": 7.87, + "learning_rate": 0.00014353918951710747, + "loss": 0.0988, + "step": 43500 + }, + { + "epoch": 7.87, + "eval_loss": 0.16040995717048645, + "eval_runtime": 597.3861, + "eval_samples_per_second": 25.258, + "eval_steps_per_second": 3.159, + "eval_wer": 1.0053156794255165, + "step": 43500 + }, + { + "epoch": 7.89, + "eval_loss": 0.16874484717845917, + "eval_runtime": 595.203, + "eval_samples_per_second": 25.351, + "eval_steps_per_second": 3.17, + "eval_wer": 1.0063458971123425, + "step": 43600 + }, + { + "epoch": 7.91, + "eval_loss": 0.1619204580783844, + "eval_runtime": 833.6968, + "eval_samples_per_second": 18.099, + "eval_steps_per_second": 2.263, + "eval_wer": 1.0096377169400705, + "step": 43700 + }, + { + "epoch": 7.92, + "eval_loss": 0.15647700428962708, + "eval_runtime": 714.5224, + "eval_samples_per_second": 21.118, + "eval_steps_per_second": 2.641, + "eval_wer": 0.99010015666624, + "step": 43800 + }, + { + "epoch": 7.94, + "eval_loss": 0.1618899703025818, + "eval_runtime": 600.3451, + "eval_samples_per_second": 25.134, + "eval_steps_per_second": 3.143, + "eval_wer": 0.9742140780161299, + "step": 43900 + }, + { + "epoch": 7.96, + "learning_rate": 0.00014172288279543798, + "loss": 0.102, + "step": 44000 + }, + { + "epoch": 7.96, + "eval_loss": 0.15979322791099548, + "eval_runtime": 581.3117, + "eval_samples_per_second": 25.957, + "eval_steps_per_second": 3.246, + "eval_wer": 0.9592789695384747, + "step": 44000 + }, + { + "epoch": 7.98, + "eval_loss": 0.16352316737174988, + "eval_runtime": 701.4326, + "eval_samples_per_second": 21.512, + "eval_steps_per_second": 2.69, + "eval_wer": 0.9717817889211975, + "step": 44100 + }, + { + "epoch": 8.0, + "eval_loss": 0.16242262721061707, + "eval_runtime": 673.5202, + "eval_samples_per_second": 22.403, + "eval_steps_per_second": 2.802, + "eval_wer": 0.9902769395829142, + "step": 44200 + }, + { + "epoch": 8.01, + "eval_loss": 0.16053874790668488, + "eval_runtime": 581.9167, + "eval_samples_per_second": 25.93, + "eval_steps_per_second": 3.243, + "eval_wer": 0.9882043122839743, + "step": 44300 + }, + { + "epoch": 8.03, + "eval_loss": 0.1657256782054901, + "eval_runtime": 580.7431, + "eval_samples_per_second": 25.982, + "eval_steps_per_second": 3.249, + "eval_wer": 1.0128137134775639, + "step": 44400 + }, + { + "epoch": 8.05, + "learning_rate": 0.0001399065760737685, + "loss": 0.0961, + "step": 44500 + }, + { + "epoch": 8.05, + "eval_loss": 0.1650768518447876, + "eval_runtime": 757.4307, + "eval_samples_per_second": 19.921, + "eval_steps_per_second": 2.491, + "eval_wer": 1.0154959370408978, + "step": 44500 + }, + { + "epoch": 8.07, + "eval_loss": 0.16800330579280853, + "eval_runtime": 697.2243, + "eval_samples_per_second": 21.642, + "eval_steps_per_second": 2.706, + "eval_wer": 1.0193546813945125, + "step": 44600 + }, + { + "epoch": 8.09, + "eval_loss": 0.16936592757701874, + "eval_runtime": 580.6067, + "eval_samples_per_second": 25.988, + "eval_steps_per_second": 3.25, + "eval_wer": 1.0111678035636997, + "step": 44700 + }, + { + "epoch": 8.1, + "eval_loss": 0.16645368933677673, + "eval_runtime": 583.2116, + "eval_samples_per_second": 25.872, + "eval_steps_per_second": 3.236, + "eval_wer": 1.0072785793968655, + "step": 44800 + }, + { + "epoch": 8.12, + "eval_loss": 0.1612410545349121, + "eval_runtime": 590.9695, + "eval_samples_per_second": 25.533, + "eval_steps_per_second": 3.193, + "eval_wer": 1.020006949397414, + "step": 44900 + }, + { + "epoch": 8.14, + "learning_rate": 0.0001380866294588692, + "loss": 0.0894, + "step": 45000 + }, + { + "epoch": 8.14, + "eval_loss": 0.1652226448059082, + "eval_runtime": 627.3595, + "eval_samples_per_second": 24.052, + "eval_steps_per_second": 3.008, + "eval_wer": 1.0336740976451297, + "step": 45000 + }, + { + "epoch": 8.16, + "eval_loss": 0.1626013070344925, + "eval_runtime": 583.3577, + "eval_samples_per_second": 25.866, + "eval_steps_per_second": 3.235, + "eval_wer": 1.0086257871411763, + "step": 45100 + }, + { + "epoch": 8.18, + "eval_loss": 0.16394564509391785, + "eval_runtime": 708.5073, + "eval_samples_per_second": 21.297, + "eval_steps_per_second": 2.663, + "eval_wer": 1.0083270849716233, + "step": 45200 + }, + { + "epoch": 8.19, + "eval_loss": 0.16342629492282867, + "eval_runtime": 710.8612, + "eval_samples_per_second": 21.226, + "eval_steps_per_second": 2.655, + "eval_wer": 1.0223356071273995, + "step": 45300 + }, + { + "epoch": 8.21, + "eval_loss": 0.16308727860450745, + "eval_runtime": 586.3602, + "eval_samples_per_second": 25.733, + "eval_steps_per_second": 3.218, + "eval_wer": 1.0339240321135312, + "step": 45400 + }, + { + "epoch": 8.23, + "learning_rate": 0.00013626668284396988, + "loss": 0.0887, + "step": 45500 + }, + { + "epoch": 8.23, + "eval_loss": 0.163980633020401, + "eval_runtime": 632.8729, + "eval_samples_per_second": 23.842, + "eval_steps_per_second": 2.982, + "eval_wer": 1.0311076973720306, + "step": 45500 + }, + { + "epoch": 8.25, + "eval_loss": 0.16611836850643158, + "eval_runtime": 595.5038, + "eval_samples_per_second": 25.338, + "eval_steps_per_second": 3.169, + "eval_wer": 1.0264442859494156, + "step": 45600 + }, + { + "epoch": 8.27, + "eval_loss": 0.16504013538360596, + "eval_runtime": 651.568, + "eval_samples_per_second": 23.158, + "eval_steps_per_second": 2.896, + "eval_wer": 1.0315466066823942, + "step": 45700 + }, + { + "epoch": 8.29, + "eval_loss": 0.16236093640327454, + "eval_runtime": 656.1816, + "eval_samples_per_second": 22.995, + "eval_steps_per_second": 2.876, + "eval_wer": 1.039008064958578, + "step": 45800 + }, + { + "epoch": 8.3, + "eval_loss": 0.16241197288036346, + "eval_runtime": 630.0031, + "eval_samples_per_second": 23.951, + "eval_steps_per_second": 2.995, + "eval_wer": 1.0350334973147284, + "step": 45900 + }, + { + "epoch": 8.32, + "learning_rate": 0.0001344467362290706, + "loss": 0.0884, + "step": 46000 + }, + { + "epoch": 8.32, + "eval_loss": 0.1615293174982071, + "eval_runtime": 586.0849, + "eval_samples_per_second": 25.745, + "eval_steps_per_second": 3.22, + "eval_wer": 1.03177215730022, + "step": 46000 + }, + { + "epoch": 8.34, + "eval_loss": 0.16276471316814423, + "eval_runtime": 757.1338, + "eval_samples_per_second": 19.929, + "eval_steps_per_second": 2.492, + "eval_wer": 1.0410136366684346, + "step": 46100 + }, + { + "epoch": 8.36, + "eval_loss": 0.16269972920417786, + "eval_runtime": 823.1858, + "eval_samples_per_second": 18.33, + "eval_steps_per_second": 2.292, + "eval_wer": 1.0429460568265638, + "step": 46200 + }, + { + "epoch": 8.38, + "eval_loss": 0.1644161343574524, + "eval_runtime": 582.4378, + "eval_samples_per_second": 25.907, + "eval_steps_per_second": 3.24, + "eval_wer": 1.0320159958059778, + "step": 46300 + }, + { + "epoch": 8.39, + "eval_loss": 0.16325706243515015, + "eval_runtime": 583.1236, + "eval_samples_per_second": 25.876, + "eval_steps_per_second": 3.236, + "eval_wer": 1.017660003779497, + "step": 46400 + }, + { + "epoch": 8.41, + "learning_rate": 0.0001326267896141713, + "loss": 0.0893, + "step": 46500 + }, + { + "epoch": 8.41, + "eval_loss": 0.1654362827539444, + "eval_runtime": 833.0769, + "eval_samples_per_second": 18.112, + "eval_steps_per_second": 2.265, + "eval_wer": 1.0189279640094366, + "step": 46500 + }, + { + "epoch": 8.43, + "eval_loss": 0.1598113626241684, + "eval_runtime": 789.1667, + "eval_samples_per_second": 19.12, + "eval_steps_per_second": 2.391, + "eval_wer": 1.0154044976012386, + "step": 46600 + }, + { + "epoch": 8.45, + "eval_loss": 0.16180771589279175, + "eval_runtime": 594.7754, + "eval_samples_per_second": 25.369, + "eval_steps_per_second": 3.173, + "eval_wer": 1.024962967026938, + "step": 46700 + }, + { + "epoch": 8.47, + "eval_loss": 0.16394685208797455, + "eval_runtime": 602.2498, + "eval_samples_per_second": 25.054, + "eval_steps_per_second": 3.133, + "eval_wer": 1.0402150655620783, + "step": 46800 + }, + { + "epoch": 8.48, + "eval_loss": 0.16158275306224823, + "eval_runtime": 670.3939, + "eval_samples_per_second": 22.508, + "eval_steps_per_second": 2.815, + "eval_wer": 1.0336009460934024, + "step": 46900 + }, + { + "epoch": 8.5, + "learning_rate": 0.00013080684299927203, + "loss": 0.0869, + "step": 47000 + }, + { + "epoch": 8.5, + "eval_loss": 0.16125723719596863, + "eval_runtime": 671.1005, + "eval_samples_per_second": 22.484, + "eval_steps_per_second": 2.812, + "eval_wer": 1.029620282486909, + "step": 47000 + }, + { + "epoch": 8.52, + "eval_loss": 0.16476690769195557, + "eval_runtime": 593.5391, + "eval_samples_per_second": 25.422, + "eval_steps_per_second": 3.179, + "eval_wer": 1.056759508177734, + "step": 47100 + }, + { + "epoch": 8.54, + "eval_loss": 0.1624673455953598, + "eval_runtime": 581.8717, + "eval_samples_per_second": 25.932, + "eval_steps_per_second": 3.243, + "eval_wer": 1.0255786592539762, + "step": 47200 + }, + { + "epoch": 8.56, + "eval_loss": 0.1608557254076004, + "eval_runtime": 761.7175, + "eval_samples_per_second": 19.809, + "eval_steps_per_second": 2.477, + "eval_wer": 1.0390202568838658, + "step": 47300 + }, + { + "epoch": 8.57, + "eval_loss": 0.16064698994159698, + "eval_runtime": 722.0512, + "eval_samples_per_second": 20.897, + "eval_steps_per_second": 2.613, + "eval_wer": 1.0449516285364204, + "step": 47400 + }, + { + "epoch": 8.59, + "learning_rate": 0.0001289905362776025, + "loss": 0.0894, + "step": 47500 + }, + { + "epoch": 8.59, + "eval_loss": 0.16054730117321014, + "eval_runtime": 580.1173, + "eval_samples_per_second": 26.01, + "eval_steps_per_second": 3.253, + "eval_wer": 1.0445492950019202, + "step": 47500 + }, + { + "epoch": 8.61, + "eval_loss": 0.1660243272781372, + "eval_runtime": 580.8578, + "eval_samples_per_second": 25.977, + "eval_steps_per_second": 3.249, + "eval_wer": 1.0402150655620783, + "step": 47600 + }, + { + "epoch": 8.63, + "eval_loss": 0.16181260347366333, + "eval_runtime": 815.8627, + "eval_samples_per_second": 18.495, + "eval_steps_per_second": 2.313, + "eval_wer": 1.044366416122602, + "step": 47700 + }, + { + "epoch": 8.65, + "eval_loss": 0.16689060628414154, + "eval_runtime": 695.8821, + "eval_samples_per_second": 21.683, + "eval_steps_per_second": 2.712, + "eval_wer": 1.033320531811781, + "step": 47800 + }, + { + "epoch": 8.66, + "eval_loss": 0.16267940402030945, + "eval_runtime": 581.4066, + "eval_samples_per_second": 25.953, + "eval_steps_per_second": 3.246, + "eval_wer": 1.0363624171711077, + "step": 47900 + }, + { + "epoch": 8.68, + "learning_rate": 0.00012717058966270323, + "loss": 0.0885, + "step": 48000 + }, + { + "epoch": 8.68, + "eval_loss": 0.1616200953722, + "eval_runtime": 580.4014, + "eval_samples_per_second": 25.998, + "eval_steps_per_second": 3.251, + "eval_wer": 1.0333510116250009, + "step": 48000 + }, + { + "epoch": 8.7, + "eval_loss": 0.16262862086296082, + "eval_runtime": 591.4018, + "eval_samples_per_second": 25.514, + "eval_steps_per_second": 3.191, + "eval_wer": 1.0563632706058776, + "step": 48100 + }, + { + "epoch": 8.72, + "eval_loss": 0.16235637664794922, + "eval_runtime": 582.9904, + "eval_samples_per_second": 25.882, + "eval_steps_per_second": 3.237, + "eval_wer": 1.0396054692976842, + "step": 48200 + }, + { + "epoch": 8.74, + "eval_loss": 0.1622648388147354, + "eval_runtime": 580.0532, + "eval_samples_per_second": 26.013, + "eval_steps_per_second": 3.253, + "eval_wer": 1.0395871814097524, + "step": 48300 + }, + { + "epoch": 8.76, + "eval_loss": 0.16115820407867432, + "eval_runtime": 593.5347, + "eval_samples_per_second": 25.422, + "eval_steps_per_second": 3.179, + "eval_wer": 1.0111860914516315, + "step": 48400 + }, + { + "epoch": 8.77, + "learning_rate": 0.00012535064304780393, + "loss": 0.0888, + "step": 48500 + }, + { + "epoch": 8.77, + "eval_loss": 0.16379259526729584, + "eval_runtime": 598.4046, + "eval_samples_per_second": 25.215, + "eval_steps_per_second": 3.153, + "eval_wer": 1.029211852989765, + "step": 48500 + }, + { + "epoch": 8.79, + "eval_loss": 0.16386225819587708, + "eval_runtime": 707.2069, + "eval_samples_per_second": 21.336, + "eval_steps_per_second": 2.668, + "eval_wer": 0.9988173832470755, + "step": 48600 + }, + { + "epoch": 8.81, + "eval_loss": 0.1618259996175766, + "eval_runtime": 581.5329, + "eval_samples_per_second": 25.947, + "eval_steps_per_second": 3.245, + "eval_wer": 1.0127161780752607, + "step": 48700 + }, + { + "epoch": 8.83, + "eval_loss": 0.1584457904100418, + "eval_runtime": 592.4893, + "eval_samples_per_second": 25.467, + "eval_steps_per_second": 3.185, + "eval_wer": 1.004230598074895, + "step": 48800 + }, + { + "epoch": 8.85, + "eval_loss": 0.16147887706756592, + "eval_runtime": 892.6436, + "eval_samples_per_second": 16.904, + "eval_steps_per_second": 2.114, + "eval_wer": 1.0040903909340844, + "step": 48900 + }, + { + "epoch": 8.86, + "learning_rate": 0.00012353069643290462, + "loss": 0.0887, + "step": 49000 + }, + { + "epoch": 8.86, + "eval_loss": 0.16373465955257416, + "eval_runtime": 597.5877, + "eval_samples_per_second": 25.25, + "eval_steps_per_second": 3.158, + "eval_wer": 1.0268770992971354, + "step": 49000 + }, + { + "epoch": 8.88, + "eval_loss": 0.16268499195575714, + "eval_runtime": 582.3813, + "eval_samples_per_second": 25.909, + "eval_steps_per_second": 3.24, + "eval_wer": 0.9988783428735148, + "step": 49100 + }, + { + "epoch": 8.9, + "eval_loss": 0.1583053022623062, + "eval_runtime": 597.6851, + "eval_samples_per_second": 25.246, + "eval_steps_per_second": 3.157, + "eval_wer": 1.0103631364946997, + "step": 49200 + }, + { + "epoch": 8.92, + "eval_loss": 0.1600298136472702, + "eval_runtime": 661.9601, + "eval_samples_per_second": 22.794, + "eval_steps_per_second": 2.851, + "eval_wer": 1.021360253104369, + "step": 49300 + }, + { + "epoch": 8.94, + "eval_loss": 0.15990710258483887, + "eval_runtime": 728.4467, + "eval_samples_per_second": 20.714, + "eval_steps_per_second": 2.59, + "eval_wer": 1.0126247386356015, + "step": 49400 + }, + { + "epoch": 8.95, + "learning_rate": 0.00012171074981800533, + "loss": 0.0893, + "step": 49500 + }, + { + "epoch": 8.95, + "eval_loss": 0.15952347218990326, + "eval_runtime": 582.1344, + "eval_samples_per_second": 25.92, + "eval_steps_per_second": 3.242, + "eval_wer": 1.0515779399303842, + "step": 49500 + }, + { + "epoch": 8.97, + "eval_loss": 0.16249197721481323, + "eval_runtime": 582.3785, + "eval_samples_per_second": 25.909, + "eval_steps_per_second": 3.24, + "eval_wer": 1.0463536999445266, + "step": 49600 + }, + { + "epoch": 8.99, + "eval_loss": 0.15948396921157837, + "eval_runtime": 788.7938, + "eval_samples_per_second": 19.129, + "eval_steps_per_second": 2.392, + "eval_wer": 1.0360941948147742, + "step": 49700 + }, + { + "epoch": 9.01, + "eval_loss": 0.16136983036994934, + "eval_runtime": 672.0772, + "eval_samples_per_second": 22.451, + "eval_steps_per_second": 2.808, + "eval_wer": 1.0468962406198374, + "step": 49800 + }, + { + "epoch": 9.03, + "eval_loss": 0.16116857528686523, + "eval_runtime": 580.6233, + "eval_samples_per_second": 25.988, + "eval_steps_per_second": 3.25, + "eval_wer": 1.0303944697426894, + "step": 49900 + }, + { + "epoch": 9.04, + "learning_rate": 0.00011989080320310603, + "loss": 0.0834, + "step": 50000 + }, + { + "epoch": 9.04, + "eval_loss": 0.16431789100170135, + "eval_runtime": 582.7513, + "eval_samples_per_second": 25.893, + "eval_steps_per_second": 3.238, + "eval_wer": 1.033533890504319, + "step": 50000 + }, + { + "epoch": 9.06, + "eval_loss": 0.16401399672031403, + "eval_runtime": 885.9925, + "eval_samples_per_second": 17.031, + "eval_steps_per_second": 2.13, + "eval_wer": 1.017531988563974, + "step": 50100 + }, + { + "epoch": 9.08, + "eval_loss": 0.16546601057052612, + "eval_runtime": 648.7007, + "eval_samples_per_second": 23.26, + "eval_steps_per_second": 2.909, + "eval_wer": 1.0263833263229762, + "step": 50200 + }, + { + "epoch": 9.1, + "eval_loss": 0.16776497662067413, + "eval_runtime": 581.0662, + "eval_samples_per_second": 25.968, + "eval_steps_per_second": 3.247, + "eval_wer": 1.0243046030613925, + "step": 50300 + }, + { + "epoch": 9.12, + "eval_loss": 0.16594190895557404, + "eval_runtime": 585.0092, + "eval_samples_per_second": 25.793, + "eval_steps_per_second": 3.226, + "eval_wer": 1.0145205830178672, + "step": 50400 + }, + { + "epoch": 9.14, + "learning_rate": 0.00011807085658820674, + "loss": 0.079, + "step": 50500 + }, + { + "epoch": 9.14, + "eval_loss": 0.16435874998569489, + "eval_runtime": 814.5284, + "eval_samples_per_second": 18.525, + "eval_steps_per_second": 2.317, + "eval_wer": 1.0315587986076822, + "step": 50500 + }, + { + "epoch": 9.15, + "eval_loss": 0.1629723608493805, + "eval_runtime": 758.0979, + "eval_samples_per_second": 19.904, + "eval_steps_per_second": 2.489, + "eval_wer": 1.0326377839956598, + "step": 50600 + }, + { + "epoch": 9.17, + "eval_loss": 0.16343791782855988, + "eval_runtime": 581.3896, + "eval_samples_per_second": 25.953, + "eval_steps_per_second": 3.246, + "eval_wer": 1.015367921825375, + "step": 50700 + }, + { + "epoch": 9.19, + "eval_loss": 0.169687420129776, + "eval_runtime": 582.3186, + "eval_samples_per_second": 25.912, + "eval_steps_per_second": 3.24, + "eval_wer": 1.009491413836616, + "step": 50800 + }, + { + "epoch": 9.21, + "eval_loss": 0.1677592247724533, + "eval_runtime": 702.7189, + "eval_samples_per_second": 21.472, + "eval_steps_per_second": 2.685, + "eval_wer": 1.0050291691812512, + "step": 50900 + }, + { + "epoch": 9.23, + "learning_rate": 0.00011625090997330743, + "loss": 0.078, + "step": 51000 + }, + { + "epoch": 9.23, + "eval_loss": 0.16258232295513153, + "eval_runtime": 585.8429, + "eval_samples_per_second": 25.756, + "eval_steps_per_second": 3.221, + "eval_wer": 1.0159409423139054, + "step": 51000 + }, + { + "epoch": 9.24, + "eval_loss": 0.1665642261505127, + "eval_runtime": 584.7636, + "eval_samples_per_second": 25.804, + "eval_steps_per_second": 3.227, + "eval_wer": 1.0237559664234377, + "step": 51100 + }, + { + "epoch": 9.26, + "eval_loss": 0.1644172966480255, + "eval_runtime": 581.2024, + "eval_samples_per_second": 25.962, + "eval_steps_per_second": 3.247, + "eval_wer": 1.0244082344263394, + "step": 51200 + }, + { + "epoch": 9.28, + "eval_loss": 0.16548845171928406, + "eval_runtime": 773.778, + "eval_samples_per_second": 19.5, + "eval_steps_per_second": 2.439, + "eval_wer": 1.0345092445273496, + "step": 51300 + }, + { + "epoch": 9.3, + "eval_loss": 0.16148586571216583, + "eval_runtime": 753.2674, + "eval_samples_per_second": 20.031, + "eval_steps_per_second": 2.505, + "eval_wer": 1.0236767189090665, + "step": 51400 + }, + { + "epoch": 9.32, + "learning_rate": 0.00011443460325163794, + "loss": 0.0776, + "step": 51500 + }, + { + "epoch": 9.32, + "eval_loss": 0.1664086878299713, + "eval_runtime": 600.4636, + "eval_samples_per_second": 25.129, + "eval_steps_per_second": 3.143, + "eval_wer": 1.0179952817249136, + "step": 51500 + }, + { + "epoch": 9.33, + "eval_loss": 0.16034889221191406, + "eval_runtime": 598.9514, + "eval_samples_per_second": 25.192, + "eval_steps_per_second": 3.151, + "eval_wer": 1.0207933285784825, + "step": 51600 + }, + { + "epoch": 9.35, + "eval_loss": 0.1594148576259613, + "eval_runtime": 1099.0175, + "eval_samples_per_second": 13.73, + "eval_steps_per_second": 1.717, + "eval_wer": 1.0229695872423694, + "step": 51700 + }, + { + "epoch": 9.37, + "eval_loss": 0.16220493614673615, + "eval_runtime": 635.6696, + "eval_samples_per_second": 23.737, + "eval_steps_per_second": 2.969, + "eval_wer": 1.0201410605755807, + "step": 51800 + }, + { + "epoch": 9.39, + "eval_loss": 0.15961703658103943, + "eval_runtime": 580.4546, + "eval_samples_per_second": 25.995, + "eval_steps_per_second": 3.251, + "eval_wer": 1.003907512054766, + "step": 51900 + }, + { + "epoch": 9.41, + "learning_rate": 0.00011261465663673865, + "loss": 0.0782, + "step": 52000 + }, + { + "epoch": 9.41, + "eval_loss": 0.1644771248102188, + "eval_runtime": 580.2702, + "eval_samples_per_second": 26.003, + "eval_steps_per_second": 3.252, + "eval_wer": 1.0203605152307627, + "step": 52000 + }, + { + "epoch": 9.42, + "eval_loss": 0.16403250396251678, + "eval_runtime": 586.7485, + "eval_samples_per_second": 25.716, + "eval_steps_per_second": 3.216, + "eval_wer": 1.0318209250013717, + "step": 52100 + }, + { + "epoch": 9.44, + "eval_loss": 0.16205865144729614, + "eval_runtime": 580.5387, + "eval_samples_per_second": 25.991, + "eval_steps_per_second": 3.25, + "eval_wer": 1.0290167821851588, + "step": 52200 + }, + { + "epoch": 9.46, + "eval_loss": 0.16380777955055237, + "eval_runtime": 594.1221, + "eval_samples_per_second": 25.397, + "eval_steps_per_second": 3.176, + "eval_wer": 1.031766061337576, + "step": 52300 + }, + { + "epoch": 9.48, + "eval_loss": 0.16133266687393188, + "eval_runtime": 585.3086, + "eval_samples_per_second": 25.78, + "eval_steps_per_second": 3.224, + "eval_wer": 1.0216528593112781, + "step": 52400 + }, + { + "epoch": 9.5, + "learning_rate": 0.00011079471002183935, + "loss": 0.0782, + "step": 52500 + }, + { + "epoch": 9.5, + "eval_loss": 0.16088727116584778, + "eval_runtime": 626.7548, + "eval_samples_per_second": 24.075, + "eval_steps_per_second": 3.011, + "eval_wer": 1.0260541443402036, + "step": 52500 + }, + { + "epoch": 9.52, + "eval_loss": 0.16250905394554138, + "eval_runtime": 792.3097, + "eval_samples_per_second": 19.044, + "eval_steps_per_second": 2.382, + "eval_wer": 1.010113202026298, + "step": 52600 + }, + { + "epoch": 9.53, + "eval_loss": 0.1612967550754547, + "eval_runtime": 579.6946, + "eval_samples_per_second": 26.029, + "eval_steps_per_second": 3.255, + "eval_wer": 1.0057545887358803, + "step": 52700 + }, + { + "epoch": 9.55, + "eval_loss": 0.15985870361328125, + "eval_runtime": 581.2133, + "eval_samples_per_second": 25.961, + "eval_steps_per_second": 3.247, + "eval_wer": 1.006803094310638, + "step": 52800 + }, + { + "epoch": 9.57, + "eval_loss": 0.159987673163414, + "eval_runtime": 593.2496, + "eval_samples_per_second": 25.434, + "eval_steps_per_second": 3.181, + "eval_wer": 1.011033692385533, + "step": 52900 + }, + { + "epoch": 9.59, + "learning_rate": 0.00010897476340694006, + "loss": 0.0797, + "step": 53000 + }, + { + "epoch": 9.59, + "eval_loss": 0.15943679213523865, + "eval_runtime": 669.0711, + "eval_samples_per_second": 22.552, + "eval_steps_per_second": 2.82, + "eval_wer": 1.0170625994403906, + "step": 53000 + }, + { + "epoch": 9.61, + "eval_loss": 0.1583079844713211, + "eval_runtime": 605.5808, + "eval_samples_per_second": 24.917, + "eval_steps_per_second": 3.116, + "eval_wer": 1.012368708204556, + "step": 53100 + }, + { + "epoch": 9.62, + "eval_loss": 0.16463600099086761, + "eval_runtime": 612.4932, + "eval_samples_per_second": 24.635, + "eval_steps_per_second": 3.081, + "eval_wer": 1.0093329188078735, + "step": 53200 + }, + { + "epoch": 9.64, + "eval_loss": 0.15795104205608368, + "eval_runtime": 780.4208, + "eval_samples_per_second": 19.334, + "eval_steps_per_second": 2.418, + "eval_wer": 1.0200922928744294, + "step": 53300 + }, + { + "epoch": 9.66, + "eval_loss": 0.15989932417869568, + "eval_runtime": 794.8985, + "eval_samples_per_second": 18.982, + "eval_steps_per_second": 2.374, + "eval_wer": 1.0206775052882475, + "step": 53400 + }, + { + "epoch": 9.68, + "learning_rate": 0.00010715481679204077, + "loss": 0.0783, + "step": 53500 + }, + { + "epoch": 9.68, + "eval_loss": 0.15769976377487183, + "eval_runtime": 591.2607, + "eval_samples_per_second": 25.52, + "eval_steps_per_second": 3.191, + "eval_wer": 1.0226404052595965, + "step": 53500 + }, + { + "epoch": 9.7, + "eval_loss": 0.15931198000907898, + "eval_runtime": 580.3684, + "eval_samples_per_second": 25.999, + "eval_steps_per_second": 3.251, + "eval_wer": 1.0160262857909206, + "step": 53600 + }, + { + "epoch": 9.71, + "eval_loss": 0.15701308846473694, + "eval_runtime": 631.6476, + "eval_samples_per_second": 23.888, + "eval_steps_per_second": 2.987, + "eval_wer": 1.01732472583408, + "step": 53700 + }, + { + "epoch": 9.73, + "eval_loss": 0.16138727962970734, + "eval_runtime": 823.2091, + "eval_samples_per_second": 18.329, + "eval_steps_per_second": 2.292, + "eval_wer": 1.0299372725443938, + "step": 53800 + }, + { + "epoch": 9.75, + "eval_loss": 0.16104823350906372, + "eval_runtime": 592.3865, + "eval_samples_per_second": 25.472, + "eval_steps_per_second": 3.185, + "eval_wer": 1.0184098071847016, + "step": 53900 + }, + { + "epoch": 9.77, + "learning_rate": 0.00010533487017714146, + "loss": 0.0779, + "step": 54000 + }, + { + "epoch": 9.77, + "eval_loss": 0.16055870056152344, + "eval_runtime": 578.7328, + "eval_samples_per_second": 26.072, + "eval_steps_per_second": 3.261, + "eval_wer": 1.0173003419835043, + "step": 54000 + }, + { + "epoch": 9.79, + "eval_loss": 0.15772290527820587, + "eval_runtime": 762.4369, + "eval_samples_per_second": 19.79, + "eval_steps_per_second": 2.475, + "eval_wer": 1.0031699005748493, + "step": 54100 + }, + { + "epoch": 9.8, + "eval_loss": 0.1589614897966385, + "eval_runtime": 769.937, + "eval_samples_per_second": 19.598, + "eval_steps_per_second": 2.451, + "eval_wer": 1.007016453003176, + "step": 54200 + }, + { + "epoch": 9.82, + "eval_loss": 0.15804855525493622, + "eval_runtime": 581.4557, + "eval_samples_per_second": 25.95, + "eval_steps_per_second": 3.245, + "eval_wer": 1.0256883865815671, + "step": 54300 + }, + { + "epoch": 9.84, + "eval_loss": 0.15920314192771912, + "eval_runtime": 579.5344, + "eval_samples_per_second": 26.036, + "eval_steps_per_second": 3.256, + "eval_wer": 1.0107837579171315, + "step": 54400 + }, + { + "epoch": 9.86, + "learning_rate": 0.00010351856345547196, + "loss": 0.0778, + "step": 54500 + }, + { + "epoch": 9.86, + "eval_loss": 0.1616947501897812, + "eval_runtime": 784.3278, + "eval_samples_per_second": 19.238, + "eval_steps_per_second": 2.406, + "eval_wer": 0.9907463287064977, + "step": 54500 + }, + { + "epoch": 9.88, + "eval_loss": 0.16045895218849182, + "eval_runtime": 696.7226, + "eval_samples_per_second": 21.657, + "eval_steps_per_second": 2.708, + "eval_wer": 1.0188548124577093, + "step": 54600 + }, + { + "epoch": 9.89, + "eval_loss": 0.16049787402153015, + "eval_runtime": 585.856, + "eval_samples_per_second": 25.755, + "eval_steps_per_second": 3.221, + "eval_wer": 1.0176843876300725, + "step": 54700 + }, + { + "epoch": 9.91, + "eval_loss": 0.15361995995044708, + "eval_runtime": 592.9048, + "eval_samples_per_second": 25.449, + "eval_steps_per_second": 3.183, + "eval_wer": 1.0274927915241736, + "step": 54800 + }, + { + "epoch": 9.93, + "eval_loss": 0.16578349471092224, + "eval_runtime": 796.0097, + "eval_samples_per_second": 18.956, + "eval_steps_per_second": 2.371, + "eval_wer": 1.028169443377651, + "step": 54900 + }, + { + "epoch": 9.95, + "learning_rate": 0.00010169861684057267, + "loss": 0.0777, + "step": 55000 + }, + { + "epoch": 9.95, + "eval_loss": 0.15434084832668304, + "eval_runtime": 657.9027, + "eval_samples_per_second": 22.935, + "eval_steps_per_second": 2.868, + "eval_wer": 1.038489908133843, + "step": 55000 + }, + { + "epoch": 9.97, + "eval_loss": 0.15585801005363464, + "eval_runtime": 593.5105, + "eval_samples_per_second": 25.423, + "eval_steps_per_second": 3.179, + "eval_wer": 1.0375328419987442, + "step": 55100 + }, + { + "epoch": 9.99, + "eval_loss": 0.1590491086244583, + "eval_runtime": 599.7954, + "eval_samples_per_second": 25.157, + "eval_steps_per_second": 3.146, + "eval_wer": 1.0215431319836872, + "step": 55200 + }, + { + "epoch": 10.0, + "eval_loss": 0.16239939630031586, + "eval_runtime": 676.8287, + "eval_samples_per_second": 22.294, + "eval_steps_per_second": 2.788, + "eval_wer": 1.0241765878458697, + "step": 55300 + }, + { + "epoch": 10.02, + "eval_loss": 0.16353543102741241, + "eval_runtime": 778.4878, + "eval_samples_per_second": 19.382, + "eval_steps_per_second": 2.424, + "eval_wer": 1.024353370762544, + "step": 55400 + }, + { + "epoch": 10.04, + "learning_rate": 9.987867022567338e-05, + "loss": 0.0712, + "step": 55500 + }, + { + "epoch": 10.04, + "eval_loss": 0.1628965139389038, + "eval_runtime": 581.6719, + "eval_samples_per_second": 25.941, + "eval_steps_per_second": 3.244, + "eval_wer": 1.029803161366227, + "step": 55500 + }, + { + "epoch": 10.06, + "eval_loss": 0.16010913252830505, + "eval_runtime": 580.2062, + "eval_samples_per_second": 26.006, + "eval_steps_per_second": 3.252, + "eval_wer": 1.0298824088805985, + "step": 55600 + }, + { + "epoch": 10.08, + "eval_loss": 0.16253387928009033, + "eval_runtime": 810.8172, + "eval_samples_per_second": 18.61, + "eval_steps_per_second": 2.327, + "eval_wer": 1.011667672500503, + "step": 55700 + }, + { + "epoch": 10.09, + "eval_loss": 0.16501325368881226, + "eval_runtime": 598.9657, + "eval_samples_per_second": 25.192, + "eval_steps_per_second": 3.15, + "eval_wer": 1.0232804813372103, + "step": 55800 + }, + { + "epoch": 10.11, + "eval_loss": 0.16311536729335785, + "eval_runtime": 580.9085, + "eval_samples_per_second": 25.975, + "eval_steps_per_second": 3.248, + "eval_wer": 1.0061020586065847, + "step": 55900 + }, + { + "epoch": 10.13, + "learning_rate": 9.805872361077407e-05, + "loss": 0.0667, + "step": 56000 + }, + { + "epoch": 10.13, + "eval_loss": 0.1636841744184494, + "eval_runtime": 600.3431, + "eval_samples_per_second": 25.134, + "eval_steps_per_second": 3.143, + "eval_wer": 1.0226343092969525, + "step": 56000 + }, + { + "epoch": 10.15, + "eval_loss": 0.1607149839401245, + "eval_runtime": 1230.1922, + "eval_samples_per_second": 12.266, + "eval_steps_per_second": 1.534, + "eval_wer": 1.004212310186963, + "step": 56100 + }, + { + "epoch": 10.17, + "eval_loss": 0.1599477082490921, + "eval_runtime": 596.4073, + "eval_samples_per_second": 25.3, + "eval_steps_per_second": 3.164, + "eval_wer": 1.0117225361642983, + "step": 56200 + }, + { + "epoch": 10.18, + "eval_loss": 0.16232724487781525, + "eval_runtime": 580.397, + "eval_samples_per_second": 25.998, + "eval_steps_per_second": 3.251, + "eval_wer": 1.0245972092683016, + "step": 56300 + }, + { + "epoch": 10.2, + "eval_loss": 0.16392558813095093, + "eval_runtime": 580.3269, + "eval_samples_per_second": 26.001, + "eval_steps_per_second": 3.252, + "eval_wer": 1.0294252116823028, + "step": 56400 + }, + { + "epoch": 10.22, + "learning_rate": 9.624241688910458e-05, + "loss": 0.0695, + "step": 56500 + }, + { + "epoch": 10.22, + "eval_loss": 0.16502028703689575, + "eval_runtime": 859.9983, + "eval_samples_per_second": 17.545, + "eval_steps_per_second": 2.194, + "eval_wer": 1.0231890418975513, + "step": 56500 + }, + { + "epoch": 10.24, + "eval_loss": 0.162032812833786, + "eval_runtime": 629.7937, + "eval_samples_per_second": 23.959, + "eval_steps_per_second": 2.996, + "eval_wer": 1.02889486293228, + "step": 56600 + }, + { + "epoch": 10.26, + "eval_loss": 0.16672161221504211, + "eval_runtime": 591.7678, + "eval_samples_per_second": 25.498, + "eval_steps_per_second": 3.189, + "eval_wer": 1.0208664801302099, + "step": 56700 + }, + { + "epoch": 10.27, + "eval_loss": 0.15804210305213928, + "eval_runtime": 580.1264, + "eval_samples_per_second": 26.01, + "eval_steps_per_second": 3.253, + "eval_wer": 1.0163493718110495, + "step": 56800 + }, + { + "epoch": 10.29, + "eval_loss": 0.16456495225429535, + "eval_runtime": 784.7617, + "eval_samples_per_second": 19.227, + "eval_steps_per_second": 2.405, + "eval_wer": 1.0293459641679317, + "step": 56900 + }, + { + "epoch": 10.31, + "learning_rate": 9.442247027420528e-05, + "loss": 0.0686, + "step": 57000 + }, + { + "epoch": 10.31, + "eval_loss": 0.16356460750102997, + "eval_runtime": 816.4454, + "eval_samples_per_second": 18.481, + "eval_steps_per_second": 2.311, + "eval_wer": 1.0105764951872376, + "step": 57000 + }, + { + "epoch": 10.33, + "eval_loss": 0.1585777848958969, + "eval_runtime": 581.6554, + "eval_samples_per_second": 25.941, + "eval_steps_per_second": 3.244, + "eval_wer": 1.0043829971409934, + "step": 57100 + }, + { + "epoch": 10.35, + "eval_loss": 0.15822261571884155, + "eval_runtime": 586.4769, + "eval_samples_per_second": 25.728, + "eval_steps_per_second": 3.218, + "eval_wer": 1.0212810055899977, + "step": 57200 + }, + { + "epoch": 10.37, + "eval_loss": 0.1626518964767456, + "eval_runtime": 652.945, + "eval_samples_per_second": 23.109, + "eval_steps_per_second": 2.89, + "eval_wer": 1.0151179873569736, + "step": 57300 + }, + { + "epoch": 10.38, + "eval_loss": 0.1618737131357193, + "eval_runtime": 643.6148, + "eval_samples_per_second": 23.444, + "eval_steps_per_second": 2.932, + "eval_wer": 1.0248044719981957, + "step": 57400 + }, + { + "epoch": 10.4, + "learning_rate": 9.260252365930599e-05, + "loss": 0.0686, + "step": 57500 + }, + { + "epoch": 10.4, + "eval_loss": 0.15961088240146637, + "eval_runtime": 581.127, + "eval_samples_per_second": 25.965, + "eval_steps_per_second": 3.247, + "eval_wer": 1.0097535402303055, + "step": 57500 + }, + { + "epoch": 10.42, + "eval_loss": 0.16058142483234406, + "eval_runtime": 581.0057, + "eval_samples_per_second": 25.97, + "eval_steps_per_second": 3.248, + "eval_wer": 1.0031394207616295, + "step": 57600 + }, + { + "epoch": 10.44, + "eval_loss": 0.16196614503860474, + "eval_runtime": 661.9802, + "eval_samples_per_second": 22.794, + "eval_steps_per_second": 2.851, + "eval_wer": 1.0045780679455996, + "step": 57700 + }, + { + "epoch": 10.46, + "eval_loss": 0.15916328132152557, + "eval_runtime": 581.8543, + "eval_samples_per_second": 25.933, + "eval_steps_per_second": 3.243, + "eval_wer": 1.001773925129387, + "step": 57800 + }, + { + "epoch": 10.47, + "eval_loss": 0.1592239886522293, + "eval_runtime": 585.3649, + "eval_samples_per_second": 25.777, + "eval_steps_per_second": 3.224, + "eval_wer": 1.0058399322128955, + "step": 57900 + }, + { + "epoch": 10.49, + "learning_rate": 9.07825770444067e-05, + "loss": 0.0669, + "step": 58000 + }, + { + "epoch": 10.49, + "eval_loss": 0.16053098440170288, + "eval_runtime": 580.0983, + "eval_samples_per_second": 26.011, + "eval_steps_per_second": 3.253, + "eval_wer": 0.9961168717958097, + "step": 58000 + }, + { + "epoch": 10.51, + "eval_loss": 0.163193017244339, + "eval_runtime": 597.491, + "eval_samples_per_second": 25.254, + "eval_steps_per_second": 3.158, + "eval_wer": 1.0101924495406691, + "step": 58100 + }, + { + "epoch": 10.53, + "eval_loss": 0.15927906334400177, + "eval_runtime": 692.2659, + "eval_samples_per_second": 21.797, + "eval_steps_per_second": 2.726, + "eval_wer": 1.0060654828307212, + "step": 58200 + }, + { + "epoch": 10.55, + "eval_loss": 0.1585976928472519, + "eval_runtime": 598.5348, + "eval_samples_per_second": 25.21, + "eval_steps_per_second": 3.153, + "eval_wer": 1.0091134641526918, + "step": 58300 + }, + { + "epoch": 10.56, + "eval_loss": 0.1602911651134491, + "eval_runtime": 596.6358, + "eval_samples_per_second": 25.29, + "eval_steps_per_second": 3.163, + "eval_wer": 1.0084916759630096, + "step": 58400 + }, + { + "epoch": 10.58, + "learning_rate": 8.896263042950739e-05, + "loss": 0.068, + "step": 58500 + }, + { + "epoch": 10.58, + "eval_loss": 0.15785259008407593, + "eval_runtime": 930.7715, + "eval_samples_per_second": 16.211, + "eval_steps_per_second": 2.027, + "eval_wer": 1.0030784611351902, + "step": 58500 + }, + { + "epoch": 10.6, + "eval_loss": 0.1590667963027954, + "eval_runtime": 735.2125, + "eval_samples_per_second": 20.523, + "eval_steps_per_second": 2.567, + "eval_wer": 1.0020909151868718, + "step": 58600 + }, + { + "epoch": 10.62, + "eval_loss": 0.15900607407093048, + "eval_runtime": 583.5509, + "eval_samples_per_second": 25.857, + "eval_steps_per_second": 3.234, + "eval_wer": 1.0162823162219663, + "step": 58700 + }, + { + "epoch": 10.64, + "eval_loss": 0.15844112634658813, + "eval_runtime": 580.7859, + "eval_samples_per_second": 25.98, + "eval_steps_per_second": 3.249, + "eval_wer": 1.0044866285059406, + "step": 58800 + }, + { + "epoch": 10.65, + "eval_loss": 0.1593514233827591, + "eval_runtime": 844.9985, + "eval_samples_per_second": 17.857, + "eval_steps_per_second": 2.233, + "eval_wer": 1.0158129270983827, + "step": 58900 + }, + { + "epoch": 10.67, + "learning_rate": 8.71426838146081e-05, + "loss": 0.0693, + "step": 59000 + }, + { + "epoch": 10.67, + "eval_loss": 0.15675154328346252, + "eval_runtime": 736.1944, + "eval_samples_per_second": 20.496, + "eval_steps_per_second": 2.563, + "eval_wer": 1.0052364319111453, + "step": 59000 + }, + { + "epoch": 10.69, + "eval_loss": 0.15810607373714447, + "eval_runtime": 580.7163, + "eval_samples_per_second": 25.983, + "eval_steps_per_second": 3.249, + "eval_wer": 0.9955011795687716, + "step": 59100 + }, + { + "epoch": 10.71, + "eval_loss": 0.16217058897018433, + "eval_runtime": 599.9088, + "eval_samples_per_second": 25.152, + "eval_steps_per_second": 3.145, + "eval_wer": 0.9916851069536646, + "step": 59200 + }, + { + "epoch": 10.73, + "eval_loss": 0.15796062350273132, + "eval_runtime": 618.486, + "eval_samples_per_second": 24.397, + "eval_steps_per_second": 3.051, + "eval_wer": 1.0017861170546747, + "step": 59300 + }, + { + "epoch": 10.75, + "eval_loss": 0.1600871980190277, + "eval_runtime": 610.0596, + "eval_samples_per_second": 24.734, + "eval_steps_per_second": 3.093, + "eval_wer": 1.0076931048566535, + "step": 59400 + }, + { + "epoch": 10.76, + "learning_rate": 8.53227371997088e-05, + "loss": 0.0699, + "step": 59500 + }, + { + "epoch": 10.76, + "eval_loss": 0.16046388447284698, + "eval_runtime": 593.6048, + "eval_samples_per_second": 25.419, + "eval_steps_per_second": 3.179, + "eval_wer": 0.9996708180172272, + "step": 59500 + }, + { + "epoch": 10.78, + "eval_loss": 0.15849190950393677, + "eval_runtime": 592.6817, + "eval_samples_per_second": 25.459, + "eval_steps_per_second": 3.184, + "eval_wer": 1.0008717226580834, + "step": 59600 + }, + { + "epoch": 10.8, + "eval_loss": 0.1540997177362442, + "eval_runtime": 789.9508, + "eval_samples_per_second": 19.101, + "eval_steps_per_second": 2.389, + "eval_wer": 1.0058094523996757, + "step": 59700 + }, + { + "epoch": 10.82, + "eval_loss": 0.15827548503875732, + "eval_runtime": 753.7133, + "eval_samples_per_second": 20.02, + "eval_steps_per_second": 2.504, + "eval_wer": 1.0026273598995386, + "step": 59800 + }, + { + "epoch": 10.84, + "eval_loss": 0.1591554433107376, + "eval_runtime": 609.7911, + "eval_samples_per_second": 24.745, + "eval_steps_per_second": 3.095, + "eval_wer": 0.9991648531177801, + "step": 59900 + }, + { + "epoch": 10.85, + "learning_rate": 8.35027905848095e-05, + "loss": 0.0671, + "step": 60000 + }, + { + "epoch": 10.85, + "eval_loss": 0.15896911919116974, + "eval_runtime": 595.2504, + "eval_samples_per_second": 25.349, + "eval_steps_per_second": 3.17, + "eval_wer": 1.0003596617959924, + "step": 60000 + }, + { + "epoch": 10.87, + "eval_loss": 0.15851779282093048, + "eval_runtime": 608.3387, + "eval_samples_per_second": 24.804, + "eval_steps_per_second": 3.102, + "eval_wer": 1.0060106191669258, + "step": 60100 + }, + { + "epoch": 10.89, + "eval_loss": 0.15786558389663696, + "eval_runtime": 582.1448, + "eval_samples_per_second": 25.92, + "eval_steps_per_second": 3.241, + "eval_wer": 1.0063337051870547, + "step": 60200 + }, + { + "epoch": 10.91, + "eval_loss": 0.1582275778055191, + "eval_runtime": 580.089, + "eval_samples_per_second": 26.012, + "eval_steps_per_second": 3.253, + "eval_wer": 0.9948793913790897, + "step": 60300 + }, + { + "epoch": 10.93, + "eval_loss": 0.15619191527366638, + "eval_runtime": 591.1367, + "eval_samples_per_second": 25.525, + "eval_steps_per_second": 3.192, + "eval_wer": 1.0003962375718563, + "step": 60400 + }, + { + "epoch": 10.94, + "learning_rate": 8.168284396991022e-05, + "loss": 0.0661, + "step": 60500 + }, + { + "epoch": 10.94, + "eval_loss": 0.15603141486644745, + "eval_runtime": 709.5495, + "eval_samples_per_second": 21.266, + "eval_steps_per_second": 2.659, + "eval_wer": 0.9949952146693245, + "step": 60500 + }, + { + "epoch": 10.96, + "eval_loss": 0.1564040631055832, + "eval_runtime": 794.2132, + "eval_samples_per_second": 18.999, + "eval_steps_per_second": 2.376, + "eval_wer": 0.9989819742384619, + "step": 60600 + }, + { + "epoch": 10.98, + "eval_loss": 0.15524810552597046, + "eval_runtime": 598.5085, + "eval_samples_per_second": 25.211, + "eval_steps_per_second": 3.153, + "eval_wer": 0.9981834031321056, + "step": 60700 + }, + { + "epoch": 11.0, + "eval_loss": 0.15955734252929688, + "eval_runtime": 587.4842, + "eval_samples_per_second": 25.684, + "eval_steps_per_second": 3.212, + "eval_wer": 1.0018287887931823, + "step": 60800 + }, + { + "epoch": 11.02, + "eval_loss": 0.16182269155979156, + "eval_runtime": 1030.4887, + "eval_samples_per_second": 14.643, + "eval_steps_per_second": 1.831, + "eval_wer": 0.9904720103875203, + "step": 60900 + }, + { + "epoch": 11.03, + "learning_rate": 7.987017714147051e-05, + "loss": 0.0634, + "step": 61000 + }, + { + "epoch": 11.03, + "eval_loss": 0.16515201330184937, + "eval_runtime": 607.7817, + "eval_samples_per_second": 24.826, + "eval_steps_per_second": 3.105, + "eval_wer": 0.9889663076144669, + "step": 61000 + }, + { + "epoch": 11.05, + "eval_loss": 0.16492097079753876, + "eval_runtime": 598.9216, + "eval_samples_per_second": 25.194, + "eval_steps_per_second": 3.151, + "eval_wer": 0.988643221594338, + "step": 61100 + }, + { + "epoch": 11.07, + "eval_loss": 0.16676683723926544, + "eval_runtime": 595.7546, + "eval_samples_per_second": 25.328, + "eval_steps_per_second": 3.167, + "eval_wer": 0.9870338874563377, + "step": 61200 + }, + { + "epoch": 11.09, + "eval_loss": 0.16629168391227722, + "eval_runtime": 654.8399, + "eval_samples_per_second": 23.042, + "eval_steps_per_second": 2.882, + "eval_wer": 0.9921179203013843, + "step": 61300 + }, + { + "epoch": 11.11, + "eval_loss": 0.1650213599205017, + "eval_runtime": 773.1318, + "eval_samples_per_second": 19.517, + "eval_steps_per_second": 2.441, + "eval_wer": 0.9918923696835585, + "step": 61400 + }, + { + "epoch": 11.13, + "learning_rate": 7.805023052657121e-05, + "loss": 0.0587, + "step": 61500 + }, + { + "epoch": 11.13, + "eval_loss": 0.16744260489940643, + "eval_runtime": 596.1745, + "eval_samples_per_second": 25.31, + "eval_steps_per_second": 3.165, + "eval_wer": 0.9830715117377761, + "step": 61500 + }, + { + "epoch": 11.14, + "eval_loss": 0.16329726576805115, + "eval_runtime": 590.0495, + "eval_samples_per_second": 25.572, + "eval_steps_per_second": 3.198, + "eval_wer": 0.9792981108611767, + "step": 61600 + }, + { + "epoch": 11.16, + "eval_loss": 0.1665409654378891, + "eval_runtime": 872.8813, + "eval_samples_per_second": 17.286, + "eval_steps_per_second": 2.162, + "eval_wer": 0.9781093981456082, + "step": 61700 + }, + { + "epoch": 11.18, + "eval_loss": 0.16423752903938293, + "eval_runtime": 772.8941, + "eval_samples_per_second": 19.523, + "eval_steps_per_second": 2.441, + "eval_wer": 0.982053485976238, + "step": 61800 + }, + { + "epoch": 11.2, + "eval_loss": 0.16376256942749023, + "eval_runtime": 580.3017, + "eval_samples_per_second": 26.002, + "eval_steps_per_second": 3.252, + "eval_wer": 0.9796577726571691, + "step": 61900 + }, + { + "epoch": 11.22, + "learning_rate": 7.623028391167192e-05, + "loss": 0.0581, + "step": 62000 + }, + { + "epoch": 11.22, + "eval_loss": 0.1627783179283142, + "eval_runtime": 581.6544, + "eval_samples_per_second": 25.942, + "eval_steps_per_second": 3.244, + "eval_wer": 0.9726778954298568, + "step": 62000 + }, + { + "epoch": 11.23, + "eval_loss": 0.16605274379253387, + "eval_runtime": 737.7411, + "eval_samples_per_second": 20.453, + "eval_steps_per_second": 2.558, + "eval_wer": 0.9796394847692373, + "step": 62100 + }, + { + "epoch": 11.25, + "eval_loss": 0.164078027009964, + "eval_runtime": 696.1898, + "eval_samples_per_second": 21.674, + "eval_steps_per_second": 2.71, + "eval_wer": 0.9829617844101851, + "step": 62200 + }, + { + "epoch": 11.27, + "eval_loss": 0.1601402908563614, + "eval_runtime": 593.4458, + "eval_samples_per_second": 25.426, + "eval_steps_per_second": 3.18, + "eval_wer": 0.9866620337350572, + "step": 62300 + }, + { + "epoch": 11.29, + "eval_loss": 0.16263510286808014, + "eval_runtime": 599.2385, + "eval_samples_per_second": 25.18, + "eval_steps_per_second": 3.149, + "eval_wer": 0.9756832050133197, + "step": 62400 + }, + { + "epoch": 11.31, + "learning_rate": 7.441033729677263e-05, + "loss": 0.0584, + "step": 62500 + }, + { + "epoch": 11.31, + "eval_loss": 0.16319765150547028, + "eval_runtime": 819.3596, + "eval_samples_per_second": 18.416, + "eval_steps_per_second": 2.303, + "eval_wer": 1.0013654956322429, + "step": 62500 + }, + { + "epoch": 11.32, + "eval_loss": 0.16259542107582092, + "eval_runtime": 772.2475, + "eval_samples_per_second": 19.539, + "eval_steps_per_second": 2.444, + "eval_wer": 1.005169376322062, + "step": 62600 + }, + { + "epoch": 11.34, + "eval_loss": 0.1586335301399231, + "eval_runtime": 596.9725, + "eval_samples_per_second": 25.276, + "eval_steps_per_second": 3.161, + "eval_wer": 1.0098388837073207, + "step": 62700 + }, + { + "epoch": 11.36, + "eval_loss": 0.15968169271945953, + "eval_runtime": 581.6566, + "eval_samples_per_second": 25.941, + "eval_steps_per_second": 3.244, + "eval_wer": 1.015063123693178, + "step": 62800 + }, + { + "epoch": 11.38, + "eval_loss": 0.162418931722641, + "eval_runtime": 736.848, + "eval_samples_per_second": 20.478, + "eval_steps_per_second": 2.561, + "eval_wer": 1.0054254067531074, + "step": 62900 + }, + { + "epoch": 11.4, + "learning_rate": 7.259039068187334e-05, + "loss": 0.0589, + "step": 63000 + }, + { + "epoch": 11.4, + "eval_loss": 0.16180075705051422, + "eval_runtime": 774.1276, + "eval_samples_per_second": 19.492, + "eval_steps_per_second": 2.438, + "eval_wer": 1.0017800210920307, + "step": 63000 + }, + { + "epoch": 11.41, + "eval_loss": 0.16354435682296753, + "eval_runtime": 594.6962, + "eval_samples_per_second": 25.373, + "eval_steps_per_second": 3.173, + "eval_wer": 1.0031699005748493, + "step": 63100 + }, + { + "epoch": 11.43, + "eval_loss": 0.16535265743732452, + "eval_runtime": 592.2376, + "eval_samples_per_second": 25.478, + "eval_steps_per_second": 3.186, + "eval_wer": 1.0141974969977383, + "step": 63200 + }, + { + "epoch": 11.45, + "eval_loss": 0.16461621224880219, + "eval_runtime": 716.9918, + "eval_samples_per_second": 21.045, + "eval_steps_per_second": 2.632, + "eval_wer": 1.00310894094841, + "step": 63300 + }, + { + "epoch": 11.47, + "eval_loss": 0.16176651418209076, + "eval_runtime": 647.4, + "eval_samples_per_second": 23.307, + "eval_steps_per_second": 2.915, + "eval_wer": 1.011753015977518, + "step": 63400 + }, + { + "epoch": 11.49, + "learning_rate": 7.077044406697403e-05, + "loss": 0.0579, + "step": 63500 + }, + { + "epoch": 11.49, + "eval_loss": 0.16339966654777527, + "eval_runtime": 586.1423, + "eval_samples_per_second": 25.743, + "eval_steps_per_second": 3.219, + "eval_wer": 1.021756490676225, + "step": 63500 + }, + { + "epoch": 11.51, + "eval_loss": 0.16159561276435852, + "eval_runtime": 580.4665, + "eval_samples_per_second": 25.995, + "eval_steps_per_second": 3.251, + "eval_wer": 1.0179221301731862, + "step": 63600 + }, + { + "epoch": 11.52, + "eval_loss": 0.16033950448036194, + "eval_runtime": 1050.4902, + "eval_samples_per_second": 14.364, + "eval_steps_per_second": 1.796, + "eval_wer": 1.0035539462214176, + "step": 63700 + }, + { + "epoch": 11.54, + "eval_loss": 0.16100841760635376, + "eval_runtime": 798.7889, + "eval_samples_per_second": 18.89, + "eval_steps_per_second": 2.362, + "eval_wer": 1.0150143559920264, + "step": 63800 + }, + { + "epoch": 11.56, + "eval_loss": 0.16050441563129425, + "eval_runtime": 586.8618, + "eval_samples_per_second": 25.711, + "eval_steps_per_second": 3.215, + "eval_wer": 1.0285047213230678, + "step": 63900 + }, + { + "epoch": 11.58, + "learning_rate": 6.895049745207474e-05, + "loss": 0.0572, + "step": 64000 + }, + { + "epoch": 11.58, + "eval_loss": 0.16212163865566254, + "eval_runtime": 581.4798, + "eval_samples_per_second": 25.949, + "eval_steps_per_second": 3.245, + "eval_wer": 1.0261333918545748, + "step": 64000 + }, + { + "epoch": 11.6, + "eval_loss": 0.16254810988903046, + "eval_runtime": 605.5049, + "eval_samples_per_second": 24.92, + "eval_steps_per_second": 3.116, + "eval_wer": 1.0251580378315441, + "step": 64100 + }, + { + "epoch": 11.61, + "eval_loss": 0.1677384078502655, + "eval_runtime": 890.1937, + "eval_samples_per_second": 16.95, + "eval_steps_per_second": 2.12, + "eval_wer": 1.0256761946562791, + "step": 64200 + }, + { + "epoch": 11.63, + "eval_loss": 0.16564221680164337, + "eval_runtime": 584.838, + "eval_samples_per_second": 25.8, + "eval_steps_per_second": 3.227, + "eval_wer": 1.024341178837256, + "step": 64300 + }, + { + "epoch": 11.65, + "eval_loss": 0.1668614149093628, + "eval_runtime": 599.9212, + "eval_samples_per_second": 25.152, + "eval_steps_per_second": 3.145, + "eval_wer": 1.02702340240059, + "step": 64400 + }, + { + "epoch": 11.67, + "learning_rate": 6.713419073040524e-05, + "loss": 0.0592, + "step": 64500 + }, + { + "epoch": 11.67, + "eval_loss": 0.16048605740070343, + "eval_runtime": 1005.1834, + "eval_samples_per_second": 15.011, + "eval_steps_per_second": 1.877, + "eval_wer": 1.0305163889955682, + "step": 64500 + }, + { + "epoch": 11.69, + "eval_loss": 0.16325299441814423, + "eval_runtime": 666.8824, + "eval_samples_per_second": 22.626, + "eval_steps_per_second": 2.83, + "eval_wer": 1.0277244381046433, + "step": 64600 + }, + { + "epoch": 11.7, + "eval_loss": 0.16055461764335632, + "eval_runtime": 580.9411, + "eval_samples_per_second": 25.973, + "eval_steps_per_second": 3.248, + "eval_wer": 1.0175563724145498, + "step": 64700 + }, + { + "epoch": 11.72, + "eval_loss": 0.1617630422115326, + "eval_runtime": 581.6126, + "eval_samples_per_second": 25.943, + "eval_steps_per_second": 3.244, + "eval_wer": 1.0248776235499228, + "step": 64800 + }, + { + "epoch": 11.74, + "eval_loss": 0.16090288758277893, + "eval_runtime": 1362.575, + "eval_samples_per_second": 11.074, + "eval_steps_per_second": 1.385, + "eval_wer": 1.01133849051773, + "step": 64900 + }, + { + "epoch": 11.76, + "learning_rate": 6.531424411550595e-05, + "loss": 0.0595, + "step": 65000 + }, + { + "epoch": 11.76, + "eval_loss": 0.16091392934322357, + "eval_runtime": 585.1401, + "eval_samples_per_second": 25.787, + "eval_steps_per_second": 3.225, + "eval_wer": 1.0254079722999458, + "step": 65000 + }, + { + "epoch": 11.78, + "eval_loss": 0.16618193686008453, + "eval_runtime": 582.6728, + "eval_samples_per_second": 25.896, + "eval_steps_per_second": 3.239, + "eval_wer": 1.0274927915241736, + "step": 65100 + }, + { + "epoch": 11.79, + "eval_loss": 0.16519132256507874, + "eval_runtime": 581.4475, + "eval_samples_per_second": 25.951, + "eval_steps_per_second": 3.245, + "eval_wer": 1.0163676596989815, + "step": 65200 + }, + { + "epoch": 11.81, + "eval_loss": 0.16376902163028717, + "eval_runtime": 743.8564, + "eval_samples_per_second": 20.285, + "eval_steps_per_second": 2.537, + "eval_wer": 1.026614972903446, + "step": 65300 + }, + { + "epoch": 11.83, + "eval_loss": 0.1588725447654724, + "eval_runtime": 656.9651, + "eval_samples_per_second": 22.968, + "eval_steps_per_second": 2.872, + "eval_wer": 1.0273952561218704, + "step": 65400 + }, + { + "epoch": 11.85, + "learning_rate": 6.349429750060664e-05, + "loss": 0.0588, + "step": 65500 + }, + { + "epoch": 11.85, + "eval_loss": 0.16070173680782318, + "eval_runtime": 596.2298, + "eval_samples_per_second": 25.307, + "eval_steps_per_second": 3.165, + "eval_wer": 1.0135635168827686, + "step": 65500 + }, + { + "epoch": 11.87, + "eval_loss": 0.15919756889343262, + "eval_runtime": 582.5632, + "eval_samples_per_second": 25.901, + "eval_steps_per_second": 3.239, + "eval_wer": 1.0135818047707004, + "step": 65600 + }, + { + "epoch": 11.88, + "eval_loss": 0.15812398493289948, + "eval_runtime": 885.713, + "eval_samples_per_second": 17.036, + "eval_steps_per_second": 2.13, + "eval_wer": 1.018281791969179, + "step": 65700 + }, + { + "epoch": 11.9, + "eval_loss": 0.15873989462852478, + "eval_runtime": 753.9732, + "eval_samples_per_second": 20.013, + "eval_steps_per_second": 2.503, + "eval_wer": 1.0132891985637913, + "step": 65800 + }, + { + "epoch": 11.92, + "eval_loss": 0.15961608290672302, + "eval_runtime": 581.7374, + "eval_samples_per_second": 25.938, + "eval_steps_per_second": 3.244, + "eval_wer": 1.0169894478886634, + "step": 65900 + }, + { + "epoch": 11.94, + "learning_rate": 6.167435088570735e-05, + "loss": 0.0558, + "step": 66000 + }, + { + "epoch": 11.94, + "eval_loss": 0.15900225937366486, + "eval_runtime": 581.5784, + "eval_samples_per_second": 25.945, + "eval_steps_per_second": 3.245, + "eval_wer": 1.016099437342648, + "step": 66000 + }, + { + "epoch": 11.96, + "eval_loss": 0.15970025956630707, + "eval_runtime": 777.4608, + "eval_samples_per_second": 19.408, + "eval_steps_per_second": 2.427, + "eval_wer": 1.0193485854318685, + "step": 66100 + }, + { + "epoch": 11.98, + "eval_loss": 0.15903662145137787, + "eval_runtime": 626.8518, + "eval_samples_per_second": 24.071, + "eval_steps_per_second": 3.01, + "eval_wer": 1.019287625805429, + "step": 66200 + }, + { + "epoch": 11.99, + "eval_loss": 0.16078583896160126, + "eval_runtime": 597.6499, + "eval_samples_per_second": 25.247, + "eval_steps_per_second": 3.157, + "eval_wer": 1.0242131636217333, + "step": 66300 + }, + { + "epoch": 12.01, + "eval_loss": 0.16416209936141968, + "eval_runtime": 583.6843, + "eval_samples_per_second": 25.851, + "eval_steps_per_second": 3.233, + "eval_wer": 1.0231036984205362, + "step": 66400 + }, + { + "epoch": 12.03, + "learning_rate": 5.985440427080805e-05, + "loss": 0.0555, + "step": 66500 + }, + { + "epoch": 12.03, + "eval_loss": 0.16788017749786377, + "eval_runtime": 707.5448, + "eval_samples_per_second": 21.326, + "eval_steps_per_second": 2.667, + "eval_wer": 1.0167882811214133, + "step": 66500 + }, + { + "epoch": 12.05, + "eval_loss": 0.16742467880249023, + "eval_runtime": 622.7757, + "eval_samples_per_second": 24.229, + "eval_steps_per_second": 3.03, + "eval_wer": 1.0083331809342673, + "step": 66600 + }, + { + "epoch": 12.07, + "eval_loss": 0.16581884026527405, + "eval_runtime": 602.3727, + "eval_samples_per_second": 25.049, + "eval_steps_per_second": 3.133, + "eval_wer": 1.006912821638229, + "step": 66700 + }, + { + "epoch": 12.08, + "eval_loss": 0.16606904566287994, + "eval_runtime": 608.0454, + "eval_samples_per_second": 24.816, + "eval_steps_per_second": 3.103, + "eval_wer": 1.0133867339660942, + "step": 66800 + }, + { + "epoch": 12.1, + "eval_loss": 0.16823889315128326, + "eval_runtime": 947.3259, + "eval_samples_per_second": 15.928, + "eval_steps_per_second": 1.992, + "eval_wer": 1.0274318318977342, + "step": 66900 + }, + { + "epoch": 12.12, + "learning_rate": 5.8034457655908755e-05, + "loss": 0.0508, + "step": 67000 + }, + { + "epoch": 12.12, + "eval_loss": 0.1702161282300949, + "eval_runtime": 601.9908, + "eval_samples_per_second": 25.065, + "eval_steps_per_second": 3.135, + "eval_wer": 1.0219271776302554, + "step": 67000 + }, + { + "epoch": 12.14, + "eval_loss": 0.16944070160388947, + "eval_runtime": 582.5035, + "eval_samples_per_second": 25.904, + "eval_steps_per_second": 3.239, + "eval_wer": 1.021860122041172, + "step": 67100 + }, + { + "epoch": 12.16, + "eval_loss": 0.16666612029075623, + "eval_runtime": 581.5026, + "eval_samples_per_second": 25.948, + "eval_steps_per_second": 3.245, + "eval_wer": 1.023640143133203, + "step": 67200 + }, + { + "epoch": 12.17, + "eval_loss": 0.16717979311943054, + "eval_runtime": 586.3236, + "eval_samples_per_second": 25.735, + "eval_steps_per_second": 3.218, + "eval_wer": 1.0253226288229307, + "step": 67300 + }, + { + "epoch": 12.19, + "eval_loss": 0.16397833824157715, + "eval_runtime": 754.9429, + "eval_samples_per_second": 19.987, + "eval_steps_per_second": 2.5, + "eval_wer": 1.021457788506672, + "step": 67400 + }, + { + "epoch": 12.21, + "learning_rate": 5.621451104100946e-05, + "loss": 0.0513, + "step": 67500 + }, + { + "epoch": 12.21, + "eval_loss": 0.16485707461833954, + "eval_runtime": 604.5571, + "eval_samples_per_second": 24.959, + "eval_steps_per_second": 3.121, + "eval_wer": 1.024237547472309, + "step": 67500 + }, + { + "epoch": 12.23, + "eval_loss": 0.16873668134212494, + "eval_runtime": 594.5739, + "eval_samples_per_second": 25.378, + "eval_steps_per_second": 3.174, + "eval_wer": 1.026224831294234, + "step": 67600 + }, + { + "epoch": 12.25, + "eval_loss": 0.16546061635017395, + "eval_runtime": 1060.8443, + "eval_samples_per_second": 14.224, + "eval_steps_per_second": 1.779, + "eval_wer": 1.0231036984205362, + "step": 67700 + }, + { + "epoch": 12.26, + "eval_loss": 0.1691717505455017, + "eval_runtime": 598.0013, + "eval_samples_per_second": 25.232, + "eval_steps_per_second": 3.156, + "eval_wer": 1.0176112360783454, + "step": 67800 + }, + { + "epoch": 12.28, + "eval_loss": 0.16749083995819092, + "eval_runtime": 584.068, + "eval_samples_per_second": 25.834, + "eval_steps_per_second": 3.231, + "eval_wer": 1.0201654444261565, + "step": 67900 + }, + { + "epoch": 12.3, + "learning_rate": 5.439456442611016e-05, + "loss": 0.0519, + "step": 68000 + }, + { + "epoch": 12.3, + "eval_loss": 0.16435594856739044, + "eval_runtime": 581.2292, + "eval_samples_per_second": 25.961, + "eval_steps_per_second": 3.247, + "eval_wer": 1.0240973403314984, + "step": 68000 + }, + { + "epoch": 12.32, + "eval_loss": 0.16505275666713715, + "eval_runtime": 865.456, + "eval_samples_per_second": 17.435, + "eval_steps_per_second": 2.18, + "eval_wer": 1.029717817889212, + "step": 68100 + }, + { + "epoch": 12.34, + "eval_loss": 0.16610455513000488, + "eval_runtime": 617.3975, + "eval_samples_per_second": 24.44, + "eval_steps_per_second": 3.056, + "eval_wer": 1.0287363679035375, + "step": 68200 + }, + { + "epoch": 12.36, + "eval_loss": 0.16653628647327423, + "eval_runtime": 579.7196, + "eval_samples_per_second": 26.028, + "eval_steps_per_second": 3.255, + "eval_wer": 1.0256761946562791, + "step": 68300 + }, + { + "epoch": 12.37, + "eval_loss": 0.16854335367679596, + "eval_runtime": 582.7632, + "eval_samples_per_second": 25.892, + "eval_steps_per_second": 3.238, + "eval_wer": 1.0232743853745665, + "step": 68400 + }, + { + "epoch": 12.39, + "learning_rate": 5.258189759767046e-05, + "loss": 0.0522, + "step": 68500 + }, + { + "epoch": 12.39, + "eval_loss": 0.1635940819978714, + "eval_runtime": 1242.3531, + "eval_samples_per_second": 12.146, + "eval_steps_per_second": 1.519, + "eval_wer": 1.017733155331224, + "step": 68500 + }, + { + "epoch": 12.41, + "eval_loss": 0.17086556553840637, + "eval_runtime": 604.527, + "eval_samples_per_second": 24.96, + "eval_steps_per_second": 3.121, + "eval_wer": 1.0199947574721262, + "step": 68600 + }, + { + "epoch": 12.43, + "eval_loss": 0.16842861473560333, + "eval_runtime": 594.3258, + "eval_samples_per_second": 25.388, + "eval_steps_per_second": 3.175, + "eval_wer": 1.0164347152880646, + "step": 68700 + }, + { + "epoch": 12.45, + "eval_loss": 0.16664543747901917, + "eval_runtime": 582.5029, + "eval_samples_per_second": 25.904, + "eval_steps_per_second": 3.239, + "eval_wer": 1.0118810311930408, + "step": 68800 + }, + { + "epoch": 12.46, + "eval_loss": 0.16832029819488525, + "eval_runtime": 794.8021, + "eval_samples_per_second": 18.985, + "eval_steps_per_second": 2.374, + "eval_wer": 1.0136427643971397, + "step": 68900 + }, + { + "epoch": 12.48, + "learning_rate": 5.076195098277117e-05, + "loss": 0.05, + "step": 69000 + }, + { + "epoch": 12.48, + "eval_loss": 0.16963930428028107, + "eval_runtime": 582.3733, + "eval_samples_per_second": 25.909, + "eval_steps_per_second": 3.24, + "eval_wer": 1.012703986149973, + "step": 69000 + }, + { + "epoch": 12.5, + "eval_loss": 0.17076294124126434, + "eval_runtime": 586.0869, + "eval_samples_per_second": 25.745, + "eval_steps_per_second": 3.22, + "eval_wer": 1.01836103948355, + "step": 69100 + }, + { + "epoch": 12.52, + "eval_loss": 0.1653919816017151, + "eval_runtime": 580.9443, + "eval_samples_per_second": 25.973, + "eval_steps_per_second": 3.248, + "eval_wer": 1.0282486908920223, + "step": 69200 + }, + { + "epoch": 12.54, + "eval_loss": 0.17003265023231506, + "eval_runtime": 864.4381, + "eval_samples_per_second": 17.455, + "eval_steps_per_second": 2.183, + "eval_wer": 1.0234633602165286, + "step": 69300 + }, + { + "epoch": 12.55, + "eval_loss": 0.1688261330127716, + "eval_runtime": 728.1606, + "eval_samples_per_second": 20.722, + "eval_steps_per_second": 2.591, + "eval_wer": 1.0257188663947867, + "step": 69400 + }, + { + "epoch": 12.57, + "learning_rate": 4.894200436787187e-05, + "loss": 0.0513, + "step": 69500 + }, + { + "epoch": 12.57, + "eval_loss": 0.16455566883087158, + "eval_runtime": 591.0272, + "eval_samples_per_second": 25.53, + "eval_steps_per_second": 3.193, + "eval_wer": 1.0273525843833629, + "step": 69500 + }, + { + "epoch": 12.59, + "eval_loss": 0.16600140929222107, + "eval_runtime": 581.0392, + "eval_samples_per_second": 25.969, + "eval_steps_per_second": 3.248, + "eval_wer": 1.0246520729320971, + "step": 69600 + }, + { + "epoch": 12.61, + "eval_loss": 0.16570237278938293, + "eval_runtime": 845.5309, + "eval_samples_per_second": 17.846, + "eval_steps_per_second": 2.232, + "eval_wer": 1.0187511810927623, + "step": 69700 + }, + { + "epoch": 12.63, + "eval_loss": 0.1653689593076706, + "eval_runtime": 623.5969, + "eval_samples_per_second": 24.197, + "eval_steps_per_second": 3.026, + "eval_wer": 1.008668458879684, + "step": 69800 + }, + { + "epoch": 12.64, + "eval_loss": 0.1681143045425415, + "eval_runtime": 585.1239, + "eval_samples_per_second": 25.788, + "eval_steps_per_second": 3.225, + "eval_wer": 1.0145876386069506, + "step": 69900 + }, + { + "epoch": 12.66, + "learning_rate": 4.712205775297258e-05, + "loss": 0.0512, + "step": 70000 + }, + { + "epoch": 12.66, + "eval_loss": 0.16601833701133728, + "eval_runtime": 581.0502, + "eval_samples_per_second": 25.968, + "eval_steps_per_second": 3.248, + "eval_wer": 1.018458574885853, + "step": 70000 + }, + { + "epoch": 12.68, + "eval_loss": 0.16897162795066833, + "eval_runtime": 678.6995, + "eval_samples_per_second": 22.232, + "eval_steps_per_second": 2.78, + "eval_wer": 1.0214212127308084, + "step": 70100 + }, + { + "epoch": 12.7, + "eval_loss": 0.16828937828540802, + "eval_runtime": 648.0173, + "eval_samples_per_second": 23.285, + "eval_steps_per_second": 2.912, + "eval_wer": 1.015995805977701, + "step": 70200 + }, + { + "epoch": 12.72, + "eval_loss": 0.16954827308654785, + "eval_runtime": 587.6953, + "eval_samples_per_second": 25.675, + "eval_steps_per_second": 3.211, + "eval_wer": 1.019811878592808, + "step": 70300 + }, + { + "epoch": 12.74, + "eval_loss": 0.1666439175605774, + "eval_runtime": 588.0923, + "eval_samples_per_second": 25.658, + "eval_steps_per_second": 3.209, + "eval_wer": 1.0192693379174973, + "step": 70400 + }, + { + "epoch": 12.75, + "learning_rate": 4.530575103130307e-05, + "loss": 0.0484, + "step": 70500 + }, + { + "epoch": 12.75, + "eval_loss": 0.16543133556842804, + "eval_runtime": 812.0461, + "eval_samples_per_second": 18.581, + "eval_steps_per_second": 2.324, + "eval_wer": 1.0141609212218747, + "step": 70500 + }, + { + "epoch": 12.77, + "eval_loss": 0.15983402729034424, + "eval_runtime": 628.158, + "eval_samples_per_second": 24.021, + "eval_steps_per_second": 3.004, + "eval_wer": 1.015374017788019, + "step": 70600 + }, + { + "epoch": 12.79, + "eval_loss": 0.1623169183731079, + "eval_runtime": 586.556, + "eval_samples_per_second": 25.725, + "eval_steps_per_second": 3.217, + "eval_wer": 1.013923178678761, + "step": 70700 + }, + { + "epoch": 12.81, + "eval_loss": 0.16623294353485107, + "eval_runtime": 590.6252, + "eval_samples_per_second": 25.548, + "eval_steps_per_second": 3.195, + "eval_wer": 1.0180013776875576, + "step": 70800 + }, + { + "epoch": 12.83, + "eval_loss": 0.16593489050865173, + "eval_runtime": 853.4994, + "eval_samples_per_second": 17.679, + "eval_steps_per_second": 2.211, + "eval_wer": 1.0231646580469755, + "step": 70900 + }, + { + "epoch": 12.84, + "learning_rate": 4.348580441640378e-05, + "loss": 0.0501, + "step": 71000 + }, + { + "epoch": 12.84, + "eval_loss": 0.16620078682899475, + "eval_runtime": 581.8553, + "eval_samples_per_second": 25.933, + "eval_steps_per_second": 3.243, + "eval_wer": 1.0202446919405277, + "step": 71000 + }, + { + "epoch": 12.86, + "eval_loss": 0.16386279463768005, + "eval_runtime": 588.8821, + "eval_samples_per_second": 25.623, + "eval_steps_per_second": 3.204, + "eval_wer": 1.0161299171558678, + "step": 71100 + }, + { + "epoch": 12.88, + "eval_loss": 0.1666136533021927, + "eval_runtime": 585.387, + "eval_samples_per_second": 25.776, + "eval_steps_per_second": 3.224, + "eval_wer": 1.0151423712075491, + "step": 71200 + }, + { + "epoch": 12.9, + "eval_loss": 0.16440027952194214, + "eval_runtime": 707.9711, + "eval_samples_per_second": 21.313, + "eval_steps_per_second": 2.665, + "eval_wer": 1.0128624811787152, + "step": 71300 + }, + { + "epoch": 12.92, + "eval_loss": 0.16417254507541656, + "eval_runtime": 706.7784, + "eval_samples_per_second": 21.349, + "eval_steps_per_second": 2.67, + "eval_wer": 1.0170625994403906, + "step": 71400 + }, + { + "epoch": 12.93, + "learning_rate": 4.1665857801504485e-05, + "loss": 0.0482, + "step": 71500 + }, + { + "epoch": 12.93, + "eval_loss": 0.16351790726184845, + "eval_runtime": 590.5254, + "eval_samples_per_second": 25.552, + "eval_steps_per_second": 3.195, + "eval_wer": 1.0162396444834587, + "step": 71500 + }, + { + "epoch": 12.95, + "eval_loss": 0.1636749505996704, + "eval_runtime": 601.6692, + "eval_samples_per_second": 25.079, + "eval_steps_per_second": 3.136, + "eval_wer": 1.0186170699145956, + "step": 71600 + }, + { + "epoch": 12.97, + "eval_loss": 0.16393718123435974, + "eval_runtime": 684.7308, + "eval_samples_per_second": 22.036, + "eval_steps_per_second": 2.756, + "eval_wer": 1.014221880848314, + "step": 71700 + }, + { + "epoch": 12.99, + "eval_loss": 0.1642550379037857, + "eval_runtime": 792.2739, + "eval_samples_per_second": 19.045, + "eval_steps_per_second": 2.382, + "eval_wer": 1.0122345970263895, + "step": 71800 + }, + { + "epoch": 13.01, + "eval_loss": 0.16787484288215637, + "eval_runtime": 581.9813, + "eval_samples_per_second": 25.927, + "eval_steps_per_second": 3.242, + "eval_wer": 1.0156117603311328, + "step": 71900 + }, + { + "epoch": 13.02, + "learning_rate": 3.984955107983499e-05, + "loss": 0.0483, + "step": 72000 + }, + { + "epoch": 13.02, + "eval_loss": 0.17167212069034576, + "eval_runtime": 581.162, + "eval_samples_per_second": 25.964, + "eval_steps_per_second": 3.247, + "eval_wer": 1.0223721829032633, + "step": 72000 + }, + { + "epoch": 13.04, + "eval_loss": 0.17421314120292664, + "eval_runtime": 1273.8126, + "eval_samples_per_second": 11.846, + "eval_steps_per_second": 1.481, + "eval_wer": 1.02290862761593, + "step": 72100 + }, + { + "epoch": 13.06, + "eval_loss": 0.1717776656150818, + "eval_runtime": 638.8652, + "eval_samples_per_second": 23.618, + "eval_steps_per_second": 2.954, + "eval_wer": 1.0236950067969983, + "step": 72200 + }, + { + "epoch": 13.08, + "eval_loss": 0.17424285411834717, + "eval_runtime": 596.8233, + "eval_samples_per_second": 25.282, + "eval_steps_per_second": 3.162, + "eval_wer": 1.0265723011649384, + "step": 72300 + }, + { + "epoch": 13.1, + "eval_loss": 0.1735859364271164, + "eval_runtime": 584.6288, + "eval_samples_per_second": 25.81, + "eval_steps_per_second": 3.228, + "eval_wer": 1.0257310583200747, + "step": 72400 + }, + { + "epoch": 13.12, + "learning_rate": 3.80296044649357e-05, + "loss": 0.0443, + "step": 72500 + }, + { + "epoch": 13.12, + "eval_loss": 0.17412111163139343, + "eval_runtime": 583.8537, + "eval_samples_per_second": 25.844, + "eval_steps_per_second": 3.232, + "eval_wer": 1.027541559225325, + "step": 72500 + }, + { + "epoch": 13.13, + "eval_loss": 0.17448225617408752, + "eval_runtime": 582.1865, + "eval_samples_per_second": 25.918, + "eval_steps_per_second": 3.241, + "eval_wer": 1.0325280566680688, + "step": 72600 + }, + { + "epoch": 13.15, + "eval_loss": 0.17374877631664276, + "eval_runtime": 591.7623, + "eval_samples_per_second": 25.498, + "eval_steps_per_second": 3.189, + "eval_wer": 1.0295593228604696, + "step": 72700 + }, + { + "epoch": 13.17, + "eval_loss": 0.17223623394966125, + "eval_runtime": 580.7728, + "eval_samples_per_second": 25.981, + "eval_steps_per_second": 3.249, + "eval_wer": 1.0302847424150985, + "step": 72800 + }, + { + "epoch": 13.19, + "eval_loss": 0.17018476128578186, + "eval_runtime": 754.3079, + "eval_samples_per_second": 20.004, + "eval_steps_per_second": 2.502, + "eval_wer": 1.0304615253317728, + "step": 72900 + }, + { + "epoch": 13.21, + "learning_rate": 3.620965785003639e-05, + "loss": 0.0424, + "step": 73000 + }, + { + "epoch": 13.21, + "eval_loss": 0.17333687841892242, + "eval_runtime": 620.495, + "eval_samples_per_second": 24.318, + "eval_steps_per_second": 3.041, + "eval_wer": 1.0240546685929908, + "step": 73000 + }, + { + "epoch": 13.22, + "eval_loss": 0.1748303323984146, + "eval_runtime": 581.8368, + "eval_samples_per_second": 25.933, + "eval_steps_per_second": 3.243, + "eval_wer": 1.0243046030613925, + "step": 73100 + }, + { + "epoch": 13.24, + "eval_loss": 0.175998255610466, + "eval_runtime": 582.7142, + "eval_samples_per_second": 25.894, + "eval_steps_per_second": 3.238, + "eval_wer": 1.0230732186073164, + "step": 73200 + }, + { + "epoch": 13.26, + "eval_loss": 0.17454344034194946, + "eval_runtime": 991.8052, + "eval_samples_per_second": 15.214, + "eval_steps_per_second": 1.903, + "eval_wer": 1.0241339161073622, + "step": 73300 + }, + { + "epoch": 13.28, + "eval_loss": 0.17719770967960358, + "eval_runtime": 699.1737, + "eval_samples_per_second": 21.581, + "eval_steps_per_second": 2.699, + "eval_wer": 1.0217077229750735, + "step": 73400 + }, + { + "epoch": 13.3, + "learning_rate": 3.4389711235137095e-05, + "loss": 0.0424, + "step": 73500 + }, + { + "epoch": 13.3, + "eval_loss": 0.17551423609256744, + "eval_runtime": 581.4162, + "eval_samples_per_second": 25.952, + "eval_steps_per_second": 3.246, + "eval_wer": 1.0205677779606566, + "step": 73500 + }, + { + "epoch": 13.31, + "eval_loss": 0.17427977919578552, + "eval_runtime": 583.119, + "eval_samples_per_second": 25.876, + "eval_steps_per_second": 3.236, + "eval_wer": 1.0241948757338015, + "step": 73600 + }, + { + "epoch": 13.33, + "eval_loss": 0.1737585812807083, + "eval_runtime": 648.7553, + "eval_samples_per_second": 23.258, + "eval_steps_per_second": 2.909, + "eval_wer": 1.02083600031699, + "step": 73700 + }, + { + "epoch": 13.35, + "eval_loss": 0.17359158396720886, + "eval_runtime": 582.3603, + "eval_samples_per_second": 25.91, + "eval_steps_per_second": 3.24, + "eval_wer": 1.0248715275872788, + "step": 73800 + }, + { + "epoch": 13.37, + "eval_loss": 0.17472000420093536, + "eval_runtime": 582.9221, + "eval_samples_per_second": 25.885, + "eval_steps_per_second": 3.237, + "eval_wer": 1.0270599781764538, + "step": 73900 + }, + { + "epoch": 13.39, + "learning_rate": 3.2569764620237805e-05, + "loss": 0.0437, + "step": 74000 + }, + { + "epoch": 13.39, + "eval_loss": 0.17074641585350037, + "eval_runtime": 580.5198, + "eval_samples_per_second": 25.992, + "eval_steps_per_second": 3.251, + "eval_wer": 1.0240729564809228, + "step": 74000 + }, + { + "epoch": 13.4, + "eval_loss": 0.17314904928207397, + "eval_runtime": 1076.3581, + "eval_samples_per_second": 14.019, + "eval_steps_per_second": 1.753, + "eval_wer": 1.0268588114092037, + "step": 74100 + }, + { + "epoch": 13.42, + "eval_loss": 0.17427843809127808, + "eval_runtime": 629.3424, + "eval_samples_per_second": 23.976, + "eval_steps_per_second": 2.998, + "eval_wer": 1.0290228781478028, + "step": 74200 + }, + { + "epoch": 13.44, + "eval_loss": 0.17391642928123474, + "eval_runtime": 588.8228, + "eval_samples_per_second": 25.626, + "eval_steps_per_second": 3.205, + "eval_wer": 1.0265783971275824, + "step": 74300 + }, + { + "epoch": 13.46, + "eval_loss": 0.17630253732204437, + "eval_runtime": 596.5515, + "eval_samples_per_second": 25.294, + "eval_steps_per_second": 3.163, + "eval_wer": 1.024566729455082, + "step": 74400 + }, + { + "epoch": 13.48, + "learning_rate": 3.074981800533851e-05, + "loss": 0.0443, + "step": 74500 + }, + { + "epoch": 13.48, + "eval_loss": 0.1723669320344925, + "eval_runtime": 696.4206, + "eval_samples_per_second": 21.667, + "eval_steps_per_second": 2.71, + "eval_wer": 1.020933535719293, + "step": 74500 + }, + { + "epoch": 13.49, + "eval_loss": 0.17442239820957184, + "eval_runtime": 634.1169, + "eval_samples_per_second": 23.795, + "eval_steps_per_second": 2.976, + "eval_wer": 1.0244204263516272, + "step": 74600 + }, + { + "epoch": 13.51, + "eval_loss": 0.171742781996727, + "eval_runtime": 588.0795, + "eval_samples_per_second": 25.658, + "eval_steps_per_second": 3.209, + "eval_wer": 1.0231646580469755, + "step": 74700 + }, + { + "epoch": 13.53, + "eval_loss": 0.17540408670902252, + "eval_runtime": 584.6829, + "eval_samples_per_second": 25.807, + "eval_steps_per_second": 3.227, + "eval_wer": 1.0217016270124297, + "step": 74800 + }, + { + "epoch": 13.55, + "eval_loss": 0.17214533686637878, + "eval_runtime": 720.7618, + "eval_samples_per_second": 20.935, + "eval_steps_per_second": 2.618, + "eval_wer": 1.023414592515377, + "step": 74900 + }, + { + "epoch": 13.57, + "learning_rate": 2.8929871390439213e-05, + "loss": 0.0435, + "step": 75000 + }, + { + "epoch": 13.57, + "eval_loss": 0.17512725293636322, + "eval_runtime": 739.201, + "eval_samples_per_second": 20.413, + "eval_steps_per_second": 2.553, + "eval_wer": 1.0196960553025731, + "step": 75000 + }, + { + "epoch": 13.59, + "eval_loss": 0.1726856231689453, + "eval_runtime": 583.0039, + "eval_samples_per_second": 25.881, + "eval_steps_per_second": 3.237, + "eval_wer": 1.0285230092109996, + "step": 75100 + }, + { + "epoch": 13.6, + "eval_loss": 0.1715420037508011, + "eval_runtime": 601.6364, + "eval_samples_per_second": 25.08, + "eval_steps_per_second": 3.136, + "eval_wer": 1.0220612888084222, + "step": 75200 + }, + { + "epoch": 13.62, + "eval_loss": 0.17459963262081146, + "eval_runtime": 650.5666, + "eval_samples_per_second": 23.194, + "eval_steps_per_second": 2.901, + "eval_wer": 1.0247130325585365, + "step": 75300 + }, + { + "epoch": 13.64, + "eval_loss": 0.1712324321269989, + "eval_runtime": 710.0998, + "eval_samples_per_second": 21.249, + "eval_steps_per_second": 2.657, + "eval_wer": 1.0230610266820286, + "step": 75400 + }, + { + "epoch": 13.66, + "learning_rate": 2.7109924775539916e-05, + "loss": 0.0436, + "step": 75500 + }, + { + "epoch": 13.66, + "eval_loss": 0.1718807965517044, + "eval_runtime": 593.922, + "eval_samples_per_second": 25.406, + "eval_steps_per_second": 3.177, + "eval_wer": 1.0228110922136269, + "step": 75500 + }, + { + "epoch": 13.68, + "eval_loss": 0.1727399230003357, + "eval_runtime": 583.5966, + "eval_samples_per_second": 25.855, + "eval_steps_per_second": 3.233, + "eval_wer": 1.0196777674146413, + "step": 75600 + }, + { + "epoch": 13.69, + "eval_loss": 0.17502325773239136, + "eval_runtime": 764.0324, + "eval_samples_per_second": 19.749, + "eval_steps_per_second": 2.47, + "eval_wer": 1.0252494772712033, + "step": 75700 + }, + { + "epoch": 13.71, + "eval_loss": 0.17015357315540314, + "eval_runtime": 668.0971, + "eval_samples_per_second": 22.585, + "eval_steps_per_second": 2.824, + "eval_wer": 1.0240729564809228, + "step": 75800 + }, + { + "epoch": 13.73, + "eval_loss": 0.17203068733215332, + "eval_runtime": 590.9321, + "eval_samples_per_second": 25.534, + "eval_steps_per_second": 3.193, + "eval_wer": 1.0249873508775138, + "step": 75900 + }, + { + "epoch": 13.75, + "learning_rate": 2.528997816064062e-05, + "loss": 0.0433, + "step": 76000 + }, + { + "epoch": 13.75, + "eval_loss": 0.17436811327934265, + "eval_runtime": 583.8521, + "eval_samples_per_second": 25.844, + "eval_steps_per_second": 3.232, + "eval_wer": 1.0209823034204446, + "step": 76000 + }, + { + "epoch": 13.77, + "eval_loss": 0.17346572875976562, + "eval_runtime": 751.961, + "eval_samples_per_second": 20.066, + "eval_steps_per_second": 2.509, + "eval_wer": 1.0211164145986114, + "step": 76100 + }, + { + "epoch": 13.78, + "eval_loss": 0.17268899083137512, + "eval_runtime": 698.8382, + "eval_samples_per_second": 21.592, + "eval_steps_per_second": 2.7, + "eval_wer": 1.020537298147437, + "step": 76200 + }, + { + "epoch": 13.8, + "eval_loss": 0.17062433063983917, + "eval_runtime": 597.277, + "eval_samples_per_second": 25.263, + "eval_steps_per_second": 3.159, + "eval_wer": 1.0218174503026645, + "step": 76300 + }, + { + "epoch": 13.82, + "eval_loss": 0.17094029486179352, + "eval_runtime": 582.5296, + "eval_samples_per_second": 25.903, + "eval_steps_per_second": 3.239, + "eval_wer": 1.0237681583487257, + "step": 76400 + }, + { + "epoch": 13.84, + "learning_rate": 2.347003154574132e-05, + "loss": 0.0431, + "step": 76500 + }, + { + "epoch": 13.84, + "eval_loss": 0.17047877609729767, + "eval_runtime": 1185.1824, + "eval_samples_per_second": 12.731, + "eval_steps_per_second": 1.592, + "eval_wer": 1.0196716714519973, + "step": 76500 + }, + { + "epoch": 13.86, + "eval_loss": 0.1734394133090973, + "eval_runtime": 607.5712, + "eval_samples_per_second": 24.835, + "eval_steps_per_second": 3.106, + "eval_wer": 1.0222929353888919, + "step": 76600 + }, + { + "epoch": 13.87, + "eval_loss": 0.1695163995027542, + "eval_runtime": 597.2652, + "eval_samples_per_second": 25.263, + "eval_steps_per_second": 3.159, + "eval_wer": 1.024969062989582, + "step": 76700 + }, + { + "epoch": 13.89, + "eval_loss": 0.17340916395187378, + "eval_runtime": 583.1636, + "eval_samples_per_second": 25.874, + "eval_steps_per_second": 3.236, + "eval_wer": 1.0231524661216875, + "step": 76800 + }, + { + "epoch": 13.91, + "eval_loss": 0.17240017652511597, + "eval_runtime": 675.155, + "eval_samples_per_second": 22.349, + "eval_steps_per_second": 2.795, + "eval_wer": 1.0219454655181872, + "step": 76900 + }, + { + "epoch": 13.93, + "learning_rate": 2.1653724824071823e-05, + "loss": 0.041, + "step": 77000 + }, + { + "epoch": 13.93, + "eval_loss": 0.17061379551887512, + "eval_runtime": 661.5346, + "eval_samples_per_second": 22.809, + "eval_steps_per_second": 2.852, + "eval_wer": 1.0236035673573392, + "step": 77000 + }, + { + "epoch": 13.95, + "eval_loss": 0.1688837707042694, + "eval_runtime": 591.3973, + "eval_samples_per_second": 25.514, + "eval_steps_per_second": 3.191, + "eval_wer": 1.0220430009204904, + "step": 77100 + }, + { + "epoch": 13.97, + "eval_loss": 0.17377950251102448, + "eval_runtime": 578.3142, + "eval_samples_per_second": 26.091, + "eval_steps_per_second": 3.263, + "eval_wer": 1.0229939710929452, + "step": 77200 + }, + { + "epoch": 13.98, + "eval_loss": 0.17272156476974487, + "eval_runtime": 885.5429, + "eval_samples_per_second": 17.039, + "eval_steps_per_second": 2.131, + "eval_wer": 1.0253653005614383, + "step": 77300 + }, + { + "epoch": 14.0, + "eval_loss": 0.17211805284023285, + "eval_runtime": 766.7304, + "eval_samples_per_second": 19.68, + "eval_steps_per_second": 2.461, + "eval_wer": 1.026109008003999, + "step": 77400 + }, + { + "epoch": 14.02, + "learning_rate": 1.983377820917253e-05, + "loss": 0.041, + "step": 77500 + }, + { + "epoch": 14.02, + "eval_loss": 0.1759880930185318, + "eval_runtime": 597.2455, + "eval_samples_per_second": 25.264, + "eval_steps_per_second": 3.16, + "eval_wer": 1.0261394878172188, + "step": 77500 + }, + { + "epoch": 14.04, + "eval_loss": 0.17724254727363586, + "eval_runtime": 582.654, + "eval_samples_per_second": 25.897, + "eval_steps_per_second": 3.239, + "eval_wer": 1.020226404052596, + "step": 77600 + }, + { + "epoch": 14.06, + "eval_loss": 0.1781727820634842, + "eval_runtime": 692.1827, + "eval_samples_per_second": 21.799, + "eval_steps_per_second": 2.726, + "eval_wer": 1.02020202020202, + "step": 77700 + }, + { + "epoch": 14.07, + "eval_loss": 0.17770732939243317, + "eval_runtime": 745.6874, + "eval_samples_per_second": 20.235, + "eval_steps_per_second": 2.531, + "eval_wer": 1.0221527282480813, + "step": 77800 + }, + { + "epoch": 14.09, + "eval_loss": 0.17872411012649536, + "eval_runtime": 597.5444, + "eval_samples_per_second": 25.252, + "eval_steps_per_second": 3.158, + "eval_wer": 1.0202812677163915, + "step": 77900 + }, + { + "epoch": 14.11, + "learning_rate": 1.8013831594273232e-05, + "loss": 0.0383, + "step": 78000 + }, + { + "epoch": 14.11, + "eval_loss": 0.17896606028079987, + "eval_runtime": 582.3356, + "eval_samples_per_second": 25.911, + "eval_steps_per_second": 3.24, + "eval_wer": 1.023634047170559, + "step": 78000 + }, + { + "epoch": 14.13, + "eval_loss": 0.18120603263378143, + "eval_runtime": 1029.6119, + "eval_samples_per_second": 14.655, + "eval_steps_per_second": 1.833, + "eval_wer": 1.0244691940527788, + "step": 78100 + }, + { + "epoch": 14.15, + "eval_loss": 0.17780369520187378, + "eval_runtime": 616.7541, + "eval_samples_per_second": 24.465, + "eval_steps_per_second": 3.06, + "eval_wer": 1.0223721829032633, + "step": 78200 + }, + { + "epoch": 14.16, + "eval_loss": 0.17714247107505798, + "eval_runtime": 582.3156, + "eval_samples_per_second": 25.912, + "eval_steps_per_second": 3.241, + "eval_wer": 1.0230610266820286, + "step": 78300 + }, + { + "epoch": 14.18, + "eval_loss": 0.17816708981990814, + "eval_runtime": 594.1683, + "eval_samples_per_second": 25.395, + "eval_steps_per_second": 3.176, + "eval_wer": 1.0241765878458697, + "step": 78400 + }, + { + "epoch": 14.2, + "learning_rate": 1.6193884979373938e-05, + "loss": 0.0391, + "step": 78500 + }, + { + "epoch": 14.2, + "eval_loss": 0.17851784825325012, + "eval_runtime": 671.7395, + "eval_samples_per_second": 22.463, + "eval_steps_per_second": 2.809, + "eval_wer": 1.026206543406302, + "step": 78500 + }, + { + "epoch": 14.22, + "eval_loss": 0.17911860346794128, + "eval_runtime": 683.1816, + "eval_samples_per_second": 22.086, + "eval_steps_per_second": 2.762, + "eval_wer": 1.0261211999292867, + "step": 78600 + }, + { + "epoch": 14.24, + "eval_loss": 0.1769927740097046, + "eval_runtime": 582.2029, + "eval_samples_per_second": 25.917, + "eval_steps_per_second": 3.241, + "eval_wer": 1.0253592045987943, + "step": 78700 + }, + { + "epoch": 14.25, + "eval_loss": 0.1810205727815628, + "eval_runtime": 581.863, + "eval_samples_per_second": 25.932, + "eval_steps_per_second": 3.243, + "eval_wer": 1.025706674469499, + "step": 78800 + }, + { + "epoch": 14.27, + "eval_loss": 0.17939230799674988, + "eval_runtime": 1170.3051, + "eval_samples_per_second": 12.893, + "eval_steps_per_second": 1.612, + "eval_wer": 1.0240668605182788, + "step": 78900 + }, + { + "epoch": 14.29, + "learning_rate": 1.437393836447464e-05, + "loss": 0.0387, + "step": 79000 + }, + { + "epoch": 14.29, + "eval_loss": 0.1773802638053894, + "eval_runtime": 591.6412, + "eval_samples_per_second": 25.504, + "eval_steps_per_second": 3.189, + "eval_wer": 1.0255542754034004, + "step": 79000 + }, + { + "epoch": 14.31, + "eval_loss": 0.17738394439220428, + "eval_runtime": 592.5471, + "eval_samples_per_second": 25.465, + "eval_steps_per_second": 3.185, + "eval_wer": 1.0236462390958467, + "step": 79100 + }, + { + "epoch": 14.33, + "eval_loss": 0.17587357759475708, + "eval_runtime": 591.8296, + "eval_samples_per_second": 25.496, + "eval_steps_per_second": 3.188, + "eval_wer": 1.0221710161360131, + "step": 79200 + }, + { + "epoch": 14.35, + "eval_loss": 0.178709477186203, + "eval_runtime": 645.1624, + "eval_samples_per_second": 23.388, + "eval_steps_per_second": 2.925, + "eval_wer": 1.023749870460794, + "step": 79300 + }, + { + "epoch": 14.36, + "eval_loss": 0.17875047028064728, + "eval_runtime": 650.6934, + "eval_samples_per_second": 23.189, + "eval_steps_per_second": 2.9, + "eval_wer": 1.0226525971848845, + "step": 79400 + }, + { + "epoch": 14.38, + "learning_rate": 1.2553991749575345e-05, + "loss": 0.0372, + "step": 79500 + }, + { + "epoch": 14.38, + "eval_loss": 0.1789141446352005, + "eval_runtime": 582.3073, + "eval_samples_per_second": 25.912, + "eval_steps_per_second": 3.241, + "eval_wer": 1.0232073297854831, + "step": 79500 + }, + { + "epoch": 14.4, + "eval_loss": 0.17705988883972168, + "eval_runtime": 581.24, + "eval_samples_per_second": 25.96, + "eval_steps_per_second": 3.247, + "eval_wer": 1.0254201642252336, + "step": 79600 + }, + { + "epoch": 14.42, + "eval_loss": 0.17766208946704865, + "eval_runtime": 833.161, + "eval_samples_per_second": 18.111, + "eval_steps_per_second": 2.265, + "eval_wer": 1.0243655626878319, + "step": 79700 + }, + { + "epoch": 14.44, + "eval_loss": 0.17914512753486633, + "eval_runtime": 650.6571, + "eval_samples_per_second": 23.19, + "eval_steps_per_second": 2.9, + "eval_wer": 1.0224575263802784, + "step": 79800 + }, + { + "epoch": 14.45, + "eval_loss": 0.17859181761741638, + "eval_runtime": 584.4617, + "eval_samples_per_second": 25.817, + "eval_steps_per_second": 3.229, + "eval_wer": 1.0236584310211347, + "step": 79900 + }, + { + "epoch": 14.47, + "learning_rate": 1.0734045134676047e-05, + "loss": 0.0385, + "step": 80000 + }, + { + "epoch": 14.47, + "eval_loss": 0.17818927764892578, + "eval_runtime": 582.4141, + "eval_samples_per_second": 25.908, + "eval_steps_per_second": 3.24, + "eval_wer": 1.0243106990240365, + "step": 80000 + }, + { + "epoch": 14.49, + "eval_loss": 0.17697465419769287, + "eval_runtime": 823.197, + "eval_samples_per_second": 18.33, + "eval_steps_per_second": 2.292, + "eval_wer": 1.0235608956188316, + "step": 80100 + }, + { + "epoch": 14.51, + "eval_loss": 0.17824648320674896, + "eval_runtime": 744.1916, + "eval_samples_per_second": 20.276, + "eval_steps_per_second": 2.536, + "eval_wer": 1.024048572630347, + "step": 80200 + }, + { + "epoch": 14.53, + "eval_loss": 0.17638903856277466, + "eval_runtime": 648.9894, + "eval_samples_per_second": 23.25, + "eval_steps_per_second": 2.908, + "eval_wer": 1.0242924111361045, + "step": 80300 + }, + { + "epoch": 14.54, + "eval_loss": 0.17475561797618866, + "eval_runtime": 598.8711, + "eval_samples_per_second": 25.196, + "eval_steps_per_second": 3.151, + "eval_wer": 1.0247922800729077, + "step": 80400 + }, + { + "epoch": 14.56, + "learning_rate": 8.914098519776751e-06, + "loss": 0.039, + "step": 80500 + }, + { + "epoch": 14.56, + "eval_loss": 0.17579643428325653, + "eval_runtime": 581.6292, + "eval_samples_per_second": 25.943, + "eval_steps_per_second": 3.244, + "eval_wer": 1.0231768499722633, + "step": 80500 + }, + { + "epoch": 14.58, + "eval_loss": 0.17633995413780212, + "eval_runtime": 582.92, + "eval_samples_per_second": 25.885, + "eval_steps_per_second": 3.237, + "eval_wer": 1.024554537529794, + "step": 80600 + }, + { + "epoch": 14.6, + "eval_loss": 0.17696543037891388, + "eval_runtime": 601.3023, + "eval_samples_per_second": 25.094, + "eval_steps_per_second": 3.138, + "eval_wer": 1.0219637534061192, + "step": 80700 + }, + { + "epoch": 14.62, + "eval_loss": 0.1788012832403183, + "eval_runtime": 593.5049, + "eval_samples_per_second": 25.424, + "eval_steps_per_second": 3.179, + "eval_wer": 1.0225123900440738, + "step": 80800 + }, + { + "epoch": 14.63, + "eval_loss": 0.178111732006073, + "eval_runtime": 660.5078, + "eval_samples_per_second": 22.845, + "eval_steps_per_second": 2.857, + "eval_wer": 1.0229817791676572, + "step": 80900 + }, + { + "epoch": 14.65, + "learning_rate": 7.0941519048774565e-06, + "loss": 0.039, + "step": 81000 + }, + { + "epoch": 14.65, + "eval_loss": 0.1779184192419052, + "eval_runtime": 664.0205, + "eval_samples_per_second": 22.724, + "eval_steps_per_second": 2.842, + "eval_wer": 1.0229634912797254, + "step": 81000 + }, + { + "epoch": 14.67, + "eval_loss": 0.17550311982631683, + "eval_runtime": 596.9003, + "eval_samples_per_second": 25.279, + "eval_steps_per_second": 3.161, + "eval_wer": 1.0212261419262023, + "step": 81100 + }, + { + "epoch": 14.69, + "eval_loss": 0.17648081481456757, + "eval_runtime": 601.4761, + "eval_samples_per_second": 25.087, + "eval_steps_per_second": 3.137, + "eval_wer": 1.0226221173716648, + "step": 81200 + }, + { + "epoch": 14.71, + "eval_loss": 0.17868663370609283, + "eval_runtime": 993.2238, + "eval_samples_per_second": 15.192, + "eval_steps_per_second": 1.9, + "eval_wer": 1.0241095322567864, + "step": 81300 + }, + { + "epoch": 14.72, + "eval_loss": 0.17815029621124268, + "eval_runtime": 781.2891, + "eval_samples_per_second": 19.313, + "eval_steps_per_second": 2.415, + "eval_wer": 1.0249507751016502, + "step": 81400 + }, + { + "epoch": 14.74, + "learning_rate": 5.274205289978161e-06, + "loss": 0.0368, + "step": 81500 + }, + { + "epoch": 14.74, + "eval_loss": 0.1779765784740448, + "eval_runtime": 580.5095, + "eval_samples_per_second": 25.993, + "eval_steps_per_second": 3.251, + "eval_wer": 1.0248471437367033, + "step": 81500 + }, + { + "epoch": 14.76, + "eval_loss": 0.17816530168056488, + "eval_runtime": 580.9073, + "eval_samples_per_second": 25.975, + "eval_steps_per_second": 3.248, + "eval_wer": 1.0242009716964455, + "step": 81600 + }, + { + "epoch": 14.78, + "eval_loss": 0.17820771038532257, + "eval_runtime": 616.5224, + "eval_samples_per_second": 24.474, + "eval_steps_per_second": 3.061, + "eval_wer": 1.0241948757338015, + "step": 81700 + }, + { + "epoch": 14.8, + "eval_loss": 0.17921525239944458, + "eval_runtime": 743.3365, + "eval_samples_per_second": 20.299, + "eval_steps_per_second": 2.539, + "eval_wer": 1.0240607645556348, + "step": 81800 + }, + { + "epoch": 14.82, + "eval_loss": 0.17964446544647217, + "eval_runtime": 601.8651, + "eval_samples_per_second": 25.07, + "eval_steps_per_second": 3.135, + "eval_wer": 1.0237864462366575, + "step": 81900 + }, + { + "epoch": 14.83, + "learning_rate": 3.454258675078864e-06, + "loss": 0.0378, + "step": 82000 + }, + { + "epoch": 14.83, + "eval_loss": 0.179461270570755, + "eval_runtime": 589.9434, + "eval_samples_per_second": 25.577, + "eval_steps_per_second": 3.199, + "eval_wer": 1.0235852794694074, + "step": 82000 + }, + { + "epoch": 14.85, + "eval_loss": 0.17961536347866058, + "eval_runtime": 789.7316, + "eval_samples_per_second": 19.106, + "eval_steps_per_second": 2.389, + "eval_wer": 1.0238595977883846, + "step": 82100 + }, + { + "epoch": 14.87, + "eval_loss": 0.17919617891311646, + "eval_runtime": 675.851, + "eval_samples_per_second": 22.326, + "eval_steps_per_second": 2.792, + "eval_wer": 1.023627951207915, + "step": 82200 + }, + { + "epoch": 14.89, + "eval_loss": 0.17886628210544586, + "eval_runtime": 587.1989, + "eval_samples_per_second": 25.697, + "eval_steps_per_second": 3.214, + "eval_wer": 1.0239205574148242, + "step": 82300 + }, + { + "epoch": 14.91, + "eval_loss": 0.17884646356105804, + "eval_runtime": 588.7054, + "eval_samples_per_second": 25.631, + "eval_steps_per_second": 3.205, + "eval_wer": 1.0237559664234377, + "step": 82400 + }, + { + "epoch": 14.92, + "learning_rate": 1.6379519534093665e-06, + "loss": 0.0386, + "step": 82500 + }, + { + "epoch": 14.92, + "eval_loss": 0.1787010282278061, + "eval_runtime": 856.6484, + "eval_samples_per_second": 17.614, + "eval_steps_per_second": 2.203, + "eval_wer": 1.023926653377468, + "step": 82500 + }, + { + "epoch": 14.94, + "eval_loss": 0.178622305393219, + "eval_runtime": 701.0154, + "eval_samples_per_second": 21.524, + "eval_steps_per_second": 2.692, + "eval_wer": 1.0236096633199832, + "step": 82600 + }, + { + "epoch": 14.96, + "eval_loss": 0.17859022319316864, + "eval_runtime": 596.8373, + "eval_samples_per_second": 25.282, + "eval_steps_per_second": 3.162, + "eval_wer": 1.023749870460794, + "step": 82700 + }, + { + "epoch": 14.98, + "eval_loss": 0.17872443795204163, + "eval_runtime": 582.8487, + "eval_samples_per_second": 25.888, + "eval_steps_per_second": 3.238, + "eval_wer": 1.0239449412654, + "step": 82800 + }, + { + "epoch": 15.0, + "eval_loss": 0.17875000834465027, + "eval_runtime": 977.9873, + "eval_samples_per_second": 15.429, + "eval_steps_per_second": 1.929, + "eval_wer": 1.0237925421993015, + "step": 82900 + }, + { + "epoch": 15.0, + "step": 82920, + "total_flos": 4.324450877447923e+20, + "train_loss": 0.14314281111228197, + "train_runtime": 767473.646, + "train_samples_per_second": 3.457, + "train_steps_per_second": 0.108 + } + ], + "max_steps": 82920, + "num_train_epochs": 15, + "total_flos": 4.324450877447923e+20, + "trial_name": null, + "trial_params": null +}