diff --git "a/trainer_state.json" "b/trainer_state.json" new file mode 100644--- /dev/null +++ "b/trainer_state.json" @@ -0,0 +1,8866 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 15.0, + "global_step": 86730, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.02, + "eval_loss": Infinity, + "eval_runtime": 555.4159, + "eval_samples_per_second": 20.293, + "eval_steps_per_second": 2.537, + "eval_wer": 1.0, + "step": 100 + }, + { + "epoch": 0.03, + "eval_loss": Infinity, + "eval_runtime": 545.0664, + "eval_samples_per_second": 20.678, + "eval_steps_per_second": 2.585, + "eval_wer": 1.0, + "step": 200 + }, + { + "epoch": 0.05, + "eval_loss": Infinity, + "eval_runtime": 543.6935, + "eval_samples_per_second": 20.73, + "eval_steps_per_second": 2.592, + "eval_wer": 0.999978988065221, + "step": 300 + }, + { + "epoch": 0.07, + "eval_loss": Infinity, + "eval_runtime": 546.0816, + "eval_samples_per_second": 20.64, + "eval_steps_per_second": 2.58, + "eval_wer": 0.7648344259539418, + "step": 400 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002982, + "loss": 3.8863, + "step": 500 + }, + { + "epoch": 0.09, + "eval_loss": Infinity, + "eval_runtime": 544.2871, + "eval_samples_per_second": 20.708, + "eval_steps_per_second": 2.589, + "eval_wer": 0.6947386115313499, + "step": 500 + }, + { + "epoch": 0.1, + "eval_loss": Infinity, + "eval_runtime": 544.7171, + "eval_samples_per_second": 20.691, + "eval_steps_per_second": 2.587, + "eval_wer": 0.6413262733232477, + "step": 600 + }, + { + "epoch": 0.12, + "eval_loss": Infinity, + "eval_runtime": 545.5744, + "eval_samples_per_second": 20.659, + "eval_steps_per_second": 2.583, + "eval_wer": 0.5953521600268953, + "step": 700 + }, + { + "epoch": 0.14, + "eval_loss": Infinity, + "eval_runtime": 545.5238, + "eval_samples_per_second": 20.661, + "eval_steps_per_second": 2.583, + "eval_wer": 0.619494873087914, + "step": 800 + }, + { + "epoch": 0.16, + "eval_loss": Infinity, + "eval_runtime": 544.0596, + "eval_samples_per_second": 20.716, + "eval_steps_per_second": 2.59, + "eval_wer": 0.530624894940326, + "step": 900 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002982709033978893, + "loss": 0.5864, + "step": 1000 + }, + { + "epoch": 0.17, + "eval_loss": Infinity, + "eval_runtime": 544.4141, + "eval_samples_per_second": 20.703, + "eval_steps_per_second": 2.588, + "eval_wer": 0.5510379895780804, + "step": 1000 + }, + { + "epoch": 0.19, + "eval_loss": Infinity, + "eval_runtime": 549.751, + "eval_samples_per_second": 20.502, + "eval_steps_per_second": 2.563, + "eval_wer": 0.5625105059673895, + "step": 1100 + }, + { + "epoch": 0.21, + "eval_loss": Infinity, + "eval_runtime": 543.401, + "eval_samples_per_second": 20.742, + "eval_steps_per_second": 2.593, + "eval_wer": 0.5268742645822827, + "step": 1200 + }, + { + "epoch": 0.22, + "eval_loss": Infinity, + "eval_runtime": 543.2604, + "eval_samples_per_second": 20.747, + "eval_steps_per_second": 2.594, + "eval_wer": 0.4834425953941839, + "step": 1300 + }, + { + "epoch": 0.24, + "eval_loss": Infinity, + "eval_runtime": 544.1865, + "eval_samples_per_second": 20.712, + "eval_steps_per_second": 2.589, + "eval_wer": 0.4874138510674063, + "step": 1400 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029653136959294907, + "loss": 0.4471, + "step": 1500 + }, + { + "epoch": 0.26, + "eval_loss": Infinity, + "eval_runtime": 543.1806, + "eval_samples_per_second": 20.75, + "eval_steps_per_second": 2.594, + "eval_wer": 0.466559505799294, + "step": 1500 + }, + { + "epoch": 0.28, + "eval_loss": Infinity, + "eval_runtime": 543.9283, + "eval_samples_per_second": 20.721, + "eval_steps_per_second": 2.59, + "eval_wer": 0.4632816439737771, + "step": 1600 + }, + { + "epoch": 0.29, + "eval_loss": Infinity, + "eval_runtime": 543.32, + "eval_samples_per_second": 20.745, + "eval_steps_per_second": 2.593, + "eval_wer": 0.4523029080517734, + "step": 1700 + }, + { + "epoch": 0.31, + "eval_loss": Infinity, + "eval_runtime": 542.6473, + "eval_samples_per_second": 20.77, + "eval_steps_per_second": 2.597, + "eval_wer": 0.45108421583459407, + "step": 1800 + }, + { + "epoch": 0.33, + "eval_loss": Infinity, + "eval_runtime": 544.9665, + "eval_samples_per_second": 20.682, + "eval_steps_per_second": 2.585, + "eval_wer": 0.46307152462598755, + "step": 1900 + }, + { + "epoch": 0.35, + "learning_rate": 0.00029479183578800877, + "loss": 0.4075, + "step": 2000 + }, + { + "epoch": 0.35, + "eval_loss": Infinity, + "eval_runtime": 543.0548, + "eval_samples_per_second": 20.755, + "eval_steps_per_second": 2.595, + "eval_wer": 0.4614641116153975, + "step": 2000 + }, + { + "epoch": 0.36, + "eval_loss": Infinity, + "eval_runtime": 543.3783, + "eval_samples_per_second": 20.742, + "eval_steps_per_second": 2.593, + "eval_wer": 0.4452113800638763, + "step": 2100 + }, + { + "epoch": 0.38, + "eval_loss": Infinity, + "eval_runtime": 556.7449, + "eval_samples_per_second": 20.244, + "eval_steps_per_second": 2.531, + "eval_wer": 0.438424525130274, + "step": 2200 + }, + { + "epoch": 0.4, + "eval_loss": Infinity, + "eval_runtime": 545.6186, + "eval_samples_per_second": 20.657, + "eval_steps_per_second": 2.582, + "eval_wer": 0.4395381576735586, + "step": 2300 + }, + { + "epoch": 0.42, + "eval_loss": Infinity, + "eval_runtime": 548.6849, + "eval_samples_per_second": 20.542, + "eval_steps_per_second": 2.568, + "eval_wer": 0.432898386283409, + "step": 2400 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002930523019830685, + "loss": 0.3885, + "step": 2500 + }, + { + "epoch": 0.43, + "eval_loss": Infinity, + "eval_runtime": 543.661, + "eval_samples_per_second": 20.732, + "eval_steps_per_second": 2.592, + "eval_wer": 0.42552319717599596, + "step": 2500 + }, + { + "epoch": 0.45, + "eval_loss": Infinity, + "eval_runtime": 544.3496, + "eval_samples_per_second": 20.705, + "eval_steps_per_second": 2.588, + "eval_wer": 0.4184106572533199, + "step": 2600 + }, + { + "epoch": 0.47, + "eval_loss": Infinity, + "eval_runtime": 545.2818, + "eval_samples_per_second": 20.67, + "eval_steps_per_second": 2.584, + "eval_wer": 0.42287569339384773, + "step": 2700 + }, + { + "epoch": 0.48, + "eval_loss": Infinity, + "eval_runtime": 543.2493, + "eval_samples_per_second": 20.747, + "eval_steps_per_second": 2.594, + "eval_wer": 0.40858757774415866, + "step": 2800 + }, + { + "epoch": 0.5, + "eval_loss": Infinity, + "eval_runtime": 544.043, + "eval_samples_per_second": 20.717, + "eval_steps_per_second": 2.59, + "eval_wer": 0.41017397881996975, + "step": 2900 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002913127681781282, + "loss": 0.3744, + "step": 3000 + }, + { + "epoch": 0.52, + "eval_loss": Infinity, + "eval_runtime": 546.2103, + "eval_samples_per_second": 20.635, + "eval_steps_per_second": 2.58, + "eval_wer": 0.3903597243234157, + "step": 3000 + }, + { + "epoch": 0.54, + "eval_loss": Infinity, + "eval_runtime": 545.1789, + "eval_samples_per_second": 20.674, + "eval_steps_per_second": 2.584, + "eval_wer": 0.39412086064884855, + "step": 3100 + }, + { + "epoch": 0.55, + "eval_loss": Infinity, + "eval_runtime": 544.832, + "eval_samples_per_second": 20.687, + "eval_steps_per_second": 2.586, + "eval_wer": 0.38530635400907715, + "step": 3200 + }, + { + "epoch": 0.57, + "eval_loss": Infinity, + "eval_runtime": 543.4333, + "eval_samples_per_second": 20.74, + "eval_steps_per_second": 2.593, + "eval_wer": 0.38726046394351993, + "step": 3300 + }, + { + "epoch": 0.59, + "eval_loss": Infinity, + "eval_runtime": 546.7602, + "eval_samples_per_second": 20.614, + "eval_steps_per_second": 2.577, + "eval_wer": 0.3931753235837956, + "step": 3400 + }, + { + "epoch": 0.61, + "learning_rate": 0.00028957323437318796, + "loss": 0.3538, + "step": 3500 + }, + { + "epoch": 0.61, + "eval_loss": Infinity, + "eval_runtime": 545.2677, + "eval_samples_per_second": 20.671, + "eval_steps_per_second": 2.584, + "eval_wer": 0.38855269793242564, + "step": 3500 + }, + { + "epoch": 0.62, + "eval_loss": Infinity, + "eval_runtime": 542.3889, + "eval_samples_per_second": 20.78, + "eval_steps_per_second": 2.598, + "eval_wer": 0.4128635064716759, + "step": 3600 + }, + { + "epoch": 0.64, + "eval_loss": Infinity, + "eval_runtime": 542.5923, + "eval_samples_per_second": 20.773, + "eval_steps_per_second": 2.597, + "eval_wer": 0.3857370986720457, + "step": 3700 + }, + { + "epoch": 0.66, + "eval_loss": Infinity, + "eval_runtime": 543.4133, + "eval_samples_per_second": 20.741, + "eval_steps_per_second": 2.593, + "eval_wer": 0.38266935619431836, + "step": 3800 + }, + { + "epoch": 0.67, + "eval_loss": Infinity, + "eval_runtime": 543.805, + "eval_samples_per_second": 20.726, + "eval_steps_per_second": 2.591, + "eval_wer": 0.39107413010590014, + "step": 3900 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002878337005682477, + "loss": 0.3577, + "step": 4000 + }, + { + "epoch": 0.69, + "eval_loss": Infinity, + "eval_runtime": 544.2518, + "eval_samples_per_second": 20.709, + "eval_steps_per_second": 2.589, + "eval_wer": 0.4018427466801143, + "step": 4000 + }, + { + "epoch": 0.71, + "eval_loss": Infinity, + "eval_runtime": 541.8941, + "eval_samples_per_second": 20.799, + "eval_steps_per_second": 2.6, + "eval_wer": 0.39127374348630023, + "step": 4100 + }, + { + "epoch": 0.73, + "eval_loss": Infinity, + "eval_runtime": 542.2205, + "eval_samples_per_second": 20.787, + "eval_steps_per_second": 2.599, + "eval_wer": 0.3795175659774752, + "step": 4200 + }, + { + "epoch": 0.74, + "eval_loss": Infinity, + "eval_runtime": 540.8985, + "eval_samples_per_second": 20.838, + "eval_steps_per_second": 2.605, + "eval_wer": 0.3949193141704488, + "step": 4300 + }, + { + "epoch": 0.76, + "eval_loss": Infinity, + "eval_runtime": 541.2726, + "eval_samples_per_second": 20.823, + "eval_steps_per_second": 2.603, + "eval_wer": 0.38375147083543454, + "step": 4400 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002860941667633074, + "loss": 0.349, + "step": 4500 + }, + { + "epoch": 0.78, + "eval_loss": Infinity, + "eval_runtime": 546.7973, + "eval_samples_per_second": 20.613, + "eval_steps_per_second": 2.577, + "eval_wer": 0.37175365607665156, + "step": 4500 + }, + { + "epoch": 0.8, + "eval_loss": Infinity, + "eval_runtime": 543.3484, + "eval_samples_per_second": 20.744, + "eval_steps_per_second": 2.593, + "eval_wer": 0.36440998487140697, + "step": 4600 + }, + { + "epoch": 0.81, + "eval_loss": Infinity, + "eval_runtime": 542.3944, + "eval_samples_per_second": 20.78, + "eval_steps_per_second": 2.598, + "eval_wer": 0.3591780131114473, + "step": 4700 + }, + { + "epoch": 0.83, + "eval_loss": Infinity, + "eval_runtime": 543.0473, + "eval_samples_per_second": 20.755, + "eval_steps_per_second": 2.595, + "eval_wer": 0.3694213313161876, + "step": 4800 + }, + { + "epoch": 0.85, + "eval_loss": Infinity, + "eval_runtime": 542.8039, + "eval_samples_per_second": 20.764, + "eval_steps_per_second": 2.596, + "eval_wer": 0.36223524962178516, + "step": 4900 + }, + { + "epoch": 0.86, + "learning_rate": 0.00028435463295836715, + "loss": 0.327, + "step": 5000 + }, + { + "epoch": 0.86, + "eval_loss": Infinity, + "eval_runtime": 542.4774, + "eval_samples_per_second": 20.777, + "eval_steps_per_second": 2.597, + "eval_wer": 0.359083459404942, + "step": 5000 + }, + { + "epoch": 0.88, + "eval_loss": Infinity, + "eval_runtime": 546.0865, + "eval_samples_per_second": 20.64, + "eval_steps_per_second": 2.58, + "eval_wer": 0.37074508320726174, + "step": 5100 + }, + { + "epoch": 0.9, + "eval_loss": Infinity, + "eval_runtime": 543.8013, + "eval_samples_per_second": 20.726, + "eval_steps_per_second": 2.591, + "eval_wer": 0.35611027063371997, + "step": 5200 + }, + { + "epoch": 0.92, + "eval_loss": Infinity, + "eval_runtime": 542.7376, + "eval_samples_per_second": 20.767, + "eval_steps_per_second": 2.596, + "eval_wer": 0.3559421751554883, + "step": 5300 + }, + { + "epoch": 0.93, + "eval_loss": Infinity, + "eval_runtime": 541.9303, + "eval_samples_per_second": 20.798, + "eval_steps_per_second": 2.6, + "eval_wer": 0.36291813750210117, + "step": 5400 + }, + { + "epoch": 0.95, + "learning_rate": 0.00028261509915342685, + "loss": 0.3328, + "step": 5500 + }, + { + "epoch": 0.95, + "eval_loss": Infinity, + "eval_runtime": 541.7032, + "eval_samples_per_second": 20.807, + "eval_steps_per_second": 2.601, + "eval_wer": 0.35176080013447636, + "step": 5500 + }, + { + "epoch": 0.97, + "eval_loss": Infinity, + "eval_runtime": 542.8204, + "eval_samples_per_second": 20.764, + "eval_steps_per_second": 2.596, + "eval_wer": 0.34550974953773744, + "step": 5600 + }, + { + "epoch": 0.99, + "eval_loss": Infinity, + "eval_runtime": 544.376, + "eval_samples_per_second": 20.704, + "eval_steps_per_second": 2.588, + "eval_wer": 0.3792023869557909, + "step": 5700 + }, + { + "epoch": 1.0, + "eval_loss": Infinity, + "eval_runtime": 543.1296, + "eval_samples_per_second": 20.752, + "eval_steps_per_second": 2.594, + "eval_wer": 0.35637291981845687, + "step": 5800 + }, + { + "epoch": 1.02, + "eval_loss": Infinity, + "eval_runtime": 542.0195, + "eval_samples_per_second": 20.794, + "eval_steps_per_second": 2.6, + "eval_wer": 0.3562363422423937, + "step": 5900 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002808755653484866, + "loss": 0.2984, + "step": 6000 + }, + { + "epoch": 1.04, + "eval_loss": Infinity, + "eval_runtime": 542.3963, + "eval_samples_per_second": 20.78, + "eval_steps_per_second": 2.598, + "eval_wer": 0.34357665153807365, + "step": 6000 + }, + { + "epoch": 1.05, + "eval_loss": Infinity, + "eval_runtime": 542.7224, + "eval_samples_per_second": 20.768, + "eval_steps_per_second": 2.596, + "eval_wer": 0.34884014120020174, + "step": 6100 + }, + { + "epoch": 1.07, + "eval_loss": Infinity, + "eval_runtime": 541.1971, + "eval_samples_per_second": 20.826, + "eval_steps_per_second": 2.603, + "eval_wer": 0.3464973104723483, + "step": 6200 + }, + { + "epoch": 1.09, + "eval_loss": Infinity, + "eval_runtime": 542.2512, + "eval_samples_per_second": 20.786, + "eval_steps_per_second": 2.598, + "eval_wer": 0.33660068919146074, + "step": 6300 + }, + { + "epoch": 1.11, + "eval_loss": Infinity, + "eval_runtime": 541.5435, + "eval_samples_per_second": 20.813, + "eval_steps_per_second": 2.602, + "eval_wer": 0.3417906370818625, + "step": 6400 + }, + { + "epoch": 1.12, + "learning_rate": 0.0002791360315435463, + "loss": 0.2773, + "step": 6500 + }, + { + "epoch": 1.12, + "eval_loss": Infinity, + "eval_runtime": 543.2211, + "eval_samples_per_second": 20.748, + "eval_steps_per_second": 2.594, + "eval_wer": 0.3393427466801143, + "step": 6500 + }, + { + "epoch": 1.14, + "eval_loss": Infinity, + "eval_runtime": 540.5493, + "eval_samples_per_second": 20.851, + "eval_steps_per_second": 2.607, + "eval_wer": 0.34255757270129433, + "step": 6600 + }, + { + "epoch": 1.16, + "eval_loss": Infinity, + "eval_runtime": 545.9558, + "eval_samples_per_second": 20.645, + "eval_steps_per_second": 2.581, + "eval_wer": 0.33338586317028074, + "step": 6700 + }, + { + "epoch": 1.18, + "eval_loss": Infinity, + "eval_runtime": 540.5178, + "eval_samples_per_second": 20.852, + "eval_steps_per_second": 2.607, + "eval_wer": 0.3470121028744327, + "step": 6800 + }, + { + "epoch": 1.19, + "eval_loss": Infinity, + "eval_runtime": 541.1405, + "eval_samples_per_second": 20.828, + "eval_steps_per_second": 2.604, + "eval_wer": 0.3309905026054799, + "step": 6900 + }, + { + "epoch": 1.21, + "learning_rate": 0.00027739649773860604, + "loss": 0.2777, + "step": 7000 + }, + { + "epoch": 1.21, + "eval_loss": Infinity, + "eval_runtime": 545.61, + "eval_samples_per_second": 20.658, + "eval_steps_per_second": 2.582, + "eval_wer": 0.33262943351823837, + "step": 7000 + }, + { + "epoch": 1.23, + "eval_loss": Infinity, + "eval_runtime": 540.9626, + "eval_samples_per_second": 20.835, + "eval_steps_per_second": 2.605, + "eval_wer": 0.3390695915279879, + "step": 7100 + }, + { + "epoch": 1.25, + "eval_loss": Infinity, + "eval_runtime": 541.732, + "eval_samples_per_second": 20.805, + "eval_steps_per_second": 2.601, + "eval_wer": 0.345940494200706, + "step": 7200 + }, + { + "epoch": 1.26, + "eval_loss": Infinity, + "eval_runtime": 543.292, + "eval_samples_per_second": 20.746, + "eval_steps_per_second": 2.593, + "eval_wer": 0.32880526138846866, + "step": 7300 + }, + { + "epoch": 1.28, + "eval_loss": Infinity, + "eval_runtime": 541.9911, + "eval_samples_per_second": 20.796, + "eval_steps_per_second": 2.6, + "eval_wer": 0.3483883846024542, + "step": 7400 + }, + { + "epoch": 1.3, + "learning_rate": 0.00027565696393366573, + "loss": 0.2775, + "step": 7500 + }, + { + "epoch": 1.3, + "eval_loss": Infinity, + "eval_runtime": 542.1379, + "eval_samples_per_second": 20.79, + "eval_steps_per_second": 2.599, + "eval_wer": 0.33937426458228276, + "step": 7500 + }, + { + "epoch": 1.31, + "eval_loss": Infinity, + "eval_runtime": 543.314, + "eval_samples_per_second": 20.745, + "eval_steps_per_second": 2.593, + "eval_wer": 0.336253992267608, + "step": 7600 + }, + { + "epoch": 1.33, + "eval_loss": Infinity, + "eval_runtime": 543.9348, + "eval_samples_per_second": 20.721, + "eval_steps_per_second": 2.59, + "eval_wer": 0.3464132627332325, + "step": 7700 + }, + { + "epoch": 1.35, + "eval_loss": Infinity, + "eval_runtime": 541.7191, + "eval_samples_per_second": 20.806, + "eval_steps_per_second": 2.601, + "eval_wer": 0.3530110102538242, + "step": 7800 + }, + { + "epoch": 1.37, + "eval_loss": Infinity, + "eval_runtime": 543.1641, + "eval_samples_per_second": 20.751, + "eval_steps_per_second": 2.594, + "eval_wer": 0.33844973945200874, + "step": 7900 + }, + { + "epoch": 1.38, + "learning_rate": 0.0002739174301287255, + "loss": 0.2833, + "step": 8000 + }, + { + "epoch": 1.38, + "eval_loss": Infinity, + "eval_runtime": 543.1917, + "eval_samples_per_second": 20.75, + "eval_steps_per_second": 2.594, + "eval_wer": 0.3380925365607665, + "step": 8000 + }, + { + "epoch": 1.4, + "eval_loss": Infinity, + "eval_runtime": 541.3015, + "eval_samples_per_second": 20.822, + "eval_steps_per_second": 2.603, + "eval_wer": 0.3407610522776937, + "step": 8100 + }, + { + "epoch": 1.42, + "eval_loss": Infinity, + "eval_runtime": 540.4975, + "eval_samples_per_second": 20.853, + "eval_steps_per_second": 2.607, + "eval_wer": 0.33338586317028074, + "step": 8200 + }, + { + "epoch": 1.44, + "eval_loss": Infinity, + "eval_runtime": 541.3309, + "eval_samples_per_second": 20.821, + "eval_steps_per_second": 2.603, + "eval_wer": 0.3391116153975458, + "step": 8300 + }, + { + "epoch": 1.45, + "eval_loss": Infinity, + "eval_runtime": 540.5391, + "eval_samples_per_second": 20.851, + "eval_steps_per_second": 2.607, + "eval_wer": 0.330486216170785, + "step": 8400 + }, + { + "epoch": 1.47, + "learning_rate": 0.00027217789632378523, + "loss": 0.2793, + "step": 8500 + }, + { + "epoch": 1.47, + "eval_loss": Infinity, + "eval_runtime": 543.2054, + "eval_samples_per_second": 20.749, + "eval_steps_per_second": 2.594, + "eval_wer": 0.3472222222222222, + "step": 8500 + }, + { + "epoch": 1.49, + "eval_loss": Infinity, + "eval_runtime": 542.7471, + "eval_samples_per_second": 20.767, + "eval_steps_per_second": 2.596, + "eval_wer": 0.32446629685661454, + "step": 8600 + }, + { + "epoch": 1.5, + "eval_loss": Infinity, + "eval_runtime": 543.1292, + "eval_samples_per_second": 20.752, + "eval_steps_per_second": 2.594, + "eval_wer": 0.3266095142040679, + "step": 8700 + }, + { + "epoch": 1.52, + "eval_loss": Infinity, + "eval_runtime": 554.6022, + "eval_samples_per_second": 20.323, + "eval_steps_per_second": 2.541, + "eval_wer": 0.32360480753067744, + "step": 8800 + }, + { + "epoch": 1.54, + "eval_loss": Infinity, + "eval_runtime": 541.8471, + "eval_samples_per_second": 20.801, + "eval_steps_per_second": 2.6, + "eval_wer": 0.32525424441082534, + "step": 8900 + }, + { + "epoch": 1.56, + "learning_rate": 0.00027043836251884493, + "loss": 0.2693, + "step": 9000 + }, + { + "epoch": 1.56, + "eval_loss": Infinity, + "eval_runtime": 541.1695, + "eval_samples_per_second": 20.827, + "eval_steps_per_second": 2.604, + "eval_wer": 0.3280593377038158, + "step": 9000 + }, + { + "epoch": 1.57, + "eval_loss": Infinity, + "eval_runtime": 542.036, + "eval_samples_per_second": 20.794, + "eval_steps_per_second": 2.599, + "eval_wer": 0.32761808707345774, + "step": 9100 + }, + { + "epoch": 1.59, + "eval_loss": Infinity, + "eval_runtime": 543.8181, + "eval_samples_per_second": 20.726, + "eval_steps_per_second": 2.591, + "eval_wer": 0.34042486132123045, + "step": 9200 + }, + { + "epoch": 1.61, + "eval_loss": Infinity, + "eval_runtime": 545.4298, + "eval_samples_per_second": 20.664, + "eval_steps_per_second": 2.583, + "eval_wer": 0.3477054967221382, + "step": 9300 + }, + { + "epoch": 1.63, + "eval_loss": Infinity, + "eval_runtime": 547.3255, + "eval_samples_per_second": 20.593, + "eval_steps_per_second": 2.574, + "eval_wer": 0.32468692217179357, + "step": 9400 + }, + { + "epoch": 1.64, + "learning_rate": 0.0002687023077815145, + "loss": 0.2735, + "step": 9500 + }, + { + "epoch": 1.64, + "eval_loss": Infinity, + "eval_runtime": 546.7521, + "eval_samples_per_second": 20.614, + "eval_steps_per_second": 2.577, + "eval_wer": 0.3282694570516053, + "step": 9500 + }, + { + "epoch": 1.66, + "eval_loss": Infinity, + "eval_runtime": 546.8572, + "eval_samples_per_second": 20.61, + "eval_steps_per_second": 2.577, + "eval_wer": 0.32723987224743656, + "step": 9600 + }, + { + "epoch": 1.68, + "eval_loss": Infinity, + "eval_runtime": 542.4218, + "eval_samples_per_second": 20.779, + "eval_steps_per_second": 2.598, + "eval_wer": 0.3346045553874601, + "step": 9700 + }, + { + "epoch": 1.69, + "eval_loss": Infinity, + "eval_runtime": 543.0577, + "eval_samples_per_second": 20.755, + "eval_steps_per_second": 2.595, + "eval_wer": 0.34167507144057824, + "step": 9800 + }, + { + "epoch": 1.71, + "eval_loss": Infinity, + "eval_runtime": 543.4435, + "eval_samples_per_second": 20.74, + "eval_steps_per_second": 2.593, + "eval_wer": 0.3227748361069087, + "step": 9900 + }, + { + "epoch": 1.73, + "learning_rate": 0.0002669627739765743, + "loss": 0.27, + "step": 10000 + }, + { + "epoch": 1.73, + "eval_loss": Infinity, + "eval_runtime": 543.9959, + "eval_samples_per_second": 20.719, + "eval_steps_per_second": 2.59, + "eval_wer": 0.3264204067910573, + "step": 10000 + }, + { + "epoch": 1.75, + "eval_loss": Infinity, + "eval_runtime": 541.6787, + "eval_samples_per_second": 20.808, + "eval_steps_per_second": 2.601, + "eval_wer": 0.3197281055639603, + "step": 10100 + }, + { + "epoch": 1.76, + "eval_loss": Infinity, + "eval_runtime": 544.3682, + "eval_samples_per_second": 20.705, + "eval_steps_per_second": 2.588, + "eval_wer": 0.3207156664985712, + "step": 10200 + }, + { + "epoch": 1.78, + "eval_loss": Infinity, + "eval_runtime": 541.8579, + "eval_samples_per_second": 20.801, + "eval_steps_per_second": 2.6, + "eval_wer": 0.3160510169776433, + "step": 10300 + }, + { + "epoch": 1.8, + "eval_loss": Infinity, + "eval_runtime": 542.4905, + "eval_samples_per_second": 20.776, + "eval_steps_per_second": 2.597, + "eval_wer": 0.30929567994620943, + "step": 10400 + }, + { + "epoch": 1.82, + "learning_rate": 0.00026522324017163397, + "loss": 0.2632, + "step": 10500 + }, + { + "epoch": 1.82, + "eval_loss": Infinity, + "eval_runtime": 543.1131, + "eval_samples_per_second": 20.753, + "eval_steps_per_second": 2.594, + "eval_wer": 0.32033745167255, + "step": 10500 + }, + { + "epoch": 1.83, + "eval_loss": Infinity, + "eval_runtime": 543.354, + "eval_samples_per_second": 20.743, + "eval_steps_per_second": 2.593, + "eval_wer": 0.31596696923852746, + "step": 10600 + }, + { + "epoch": 1.85, + "eval_loss": Infinity, + "eval_runtime": 543.51, + "eval_samples_per_second": 20.737, + "eval_steps_per_second": 2.592, + "eval_wer": 0.31722768532526474, + "step": 10700 + }, + { + "epoch": 1.87, + "eval_loss": Infinity, + "eval_runtime": 543.0833, + "eval_samples_per_second": 20.754, + "eval_steps_per_second": 2.594, + "eval_wer": 0.3213040006723819, + "step": 10800 + }, + { + "epoch": 1.89, + "eval_loss": Infinity, + "eval_runtime": 545.9727, + "eval_samples_per_second": 20.644, + "eval_steps_per_second": 2.581, + "eval_wer": 0.3135611027063372, + "step": 10900 + }, + { + "epoch": 1.9, + "learning_rate": 0.0002634871854343036, + "loss": 0.2615, + "step": 11000 + }, + { + "epoch": 1.9, + "eval_loss": Infinity, + "eval_runtime": 543.6394, + "eval_samples_per_second": 20.732, + "eval_steps_per_second": 2.592, + "eval_wer": 0.31185913598924186, + "step": 11000 + }, + { + "epoch": 1.92, + "eval_loss": Infinity, + "eval_runtime": 546.0573, + "eval_samples_per_second": 20.641, + "eval_steps_per_second": 2.58, + "eval_wer": 0.3111552361741469, + "step": 11100 + }, + { + "epoch": 1.94, + "eval_loss": Infinity, + "eval_runtime": 544.569, + "eval_samples_per_second": 20.697, + "eval_steps_per_second": 2.587, + "eval_wer": 0.33042318036644813, + "step": 11200 + }, + { + "epoch": 1.95, + "eval_loss": Infinity, + "eval_runtime": 545.5464, + "eval_samples_per_second": 20.66, + "eval_steps_per_second": 2.583, + "eval_wer": 0.31183812405446293, + "step": 11300 + }, + { + "epoch": 1.97, + "eval_loss": Infinity, + "eval_runtime": 543.6903, + "eval_samples_per_second": 20.731, + "eval_steps_per_second": 2.592, + "eval_wer": 0.3163767019667171, + "step": 11400 + }, + { + "epoch": 1.99, + "learning_rate": 0.0002617476516293633, + "loss": 0.2665, + "step": 11500 + }, + { + "epoch": 1.99, + "eval_loss": Infinity, + "eval_runtime": 543.0226, + "eval_samples_per_second": 20.756, + "eval_steps_per_second": 2.595, + "eval_wer": 0.31048285426122035, + "step": 11500 + }, + { + "epoch": 2.01, + "eval_loss": Infinity, + "eval_runtime": 543.9768, + "eval_samples_per_second": 20.72, + "eval_steps_per_second": 2.59, + "eval_wer": 0.29904185577407966, + "step": 11600 + }, + { + "epoch": 2.02, + "eval_loss": Infinity, + "eval_runtime": 544.806, + "eval_samples_per_second": 20.688, + "eval_steps_per_second": 2.586, + "eval_wer": 0.3090855605984199, + "step": 11700 + }, + { + "epoch": 2.04, + "eval_loss": Infinity, + "eval_runtime": 541.7677, + "eval_samples_per_second": 20.804, + "eval_steps_per_second": 2.601, + "eval_wer": 0.29954614220877457, + "step": 11800 + }, + { + "epoch": 2.06, + "eval_loss": Infinity, + "eval_runtime": 543.1744, + "eval_samples_per_second": 20.75, + "eval_steps_per_second": 2.594, + "eval_wer": 0.30464153639267105, + "step": 11900 + }, + { + "epoch": 2.08, + "learning_rate": 0.000260008117824423, + "loss": 0.2272, + "step": 12000 + }, + { + "epoch": 2.08, + "eval_loss": Infinity, + "eval_runtime": 541.7916, + "eval_samples_per_second": 20.803, + "eval_steps_per_second": 2.601, + "eval_wer": 0.31607202891242225, + "step": 12000 + }, + { + "epoch": 2.09, + "eval_loss": Infinity, + "eval_runtime": 544.0285, + "eval_samples_per_second": 20.718, + "eval_steps_per_second": 2.59, + "eval_wer": 0.31450663977139015, + "step": 12100 + }, + { + "epoch": 2.11, + "eval_loss": Infinity, + "eval_runtime": 541.9109, + "eval_samples_per_second": 20.799, + "eval_steps_per_second": 2.6, + "eval_wer": 0.3083816607833249, + "step": 12200 + }, + { + "epoch": 2.13, + "eval_loss": Infinity, + "eval_runtime": 541.3453, + "eval_samples_per_second": 20.82, + "eval_steps_per_second": 2.603, + "eval_wer": 0.3082030593377038, + "step": 12300 + }, + { + "epoch": 2.14, + "eval_loss": Infinity, + "eval_runtime": 542.8224, + "eval_samples_per_second": 20.764, + "eval_steps_per_second": 2.596, + "eval_wer": 0.3013531685997647, + "step": 12400 + }, + { + "epoch": 2.16, + "learning_rate": 0.00025826858401948276, + "loss": 0.2235, + "step": 12500 + }, + { + "epoch": 2.16, + "eval_loss": Infinity, + "eval_runtime": 544.2628, + "eval_samples_per_second": 20.709, + "eval_steps_per_second": 2.589, + "eval_wer": 0.3140233652714742, + "step": 12500 + }, + { + "epoch": 2.18, + "eval_loss": Infinity, + "eval_runtime": 544.0918, + "eval_samples_per_second": 20.715, + "eval_steps_per_second": 2.59, + "eval_wer": 0.30928517397882, + "step": 12600 + }, + { + "epoch": 2.2, + "eval_loss": Infinity, + "eval_runtime": 542.7651, + "eval_samples_per_second": 20.766, + "eval_steps_per_second": 2.596, + "eval_wer": 0.3025403429147756, + "step": 12700 + }, + { + "epoch": 2.21, + "eval_loss": Infinity, + "eval_runtime": 543.9574, + "eval_samples_per_second": 20.72, + "eval_steps_per_second": 2.59, + "eval_wer": 0.3109451168263574, + "step": 12800 + }, + { + "epoch": 2.23, + "eval_loss": Infinity, + "eval_runtime": 544.6133, + "eval_samples_per_second": 20.695, + "eval_steps_per_second": 2.587, + "eval_wer": 0.29886325432845856, + "step": 12900 + }, + { + "epoch": 2.25, + "learning_rate": 0.0002565290502145425, + "loss": 0.2287, + "step": 13000 + }, + { + "epoch": 2.25, + "eval_loss": Infinity, + "eval_runtime": 542.6763, + "eval_samples_per_second": 20.769, + "eval_steps_per_second": 2.596, + "eval_wer": 0.3071209446965877, + "step": 13000 + }, + { + "epoch": 2.27, + "eval_loss": Infinity, + "eval_runtime": 544.2325, + "eval_samples_per_second": 20.71, + "eval_steps_per_second": 2.589, + "eval_wer": 0.31163851067406284, + "step": 13100 + }, + { + "epoch": 2.28, + "eval_loss": Infinity, + "eval_runtime": 544.5274, + "eval_samples_per_second": 20.699, + "eval_steps_per_second": 2.588, + "eval_wer": 0.30776180870734576, + "step": 13200 + }, + { + "epoch": 2.3, + "eval_loss": Infinity, + "eval_runtime": 544.8554, + "eval_samples_per_second": 20.686, + "eval_steps_per_second": 2.586, + "eval_wer": 0.30717347453353505, + "step": 13300 + }, + { + "epoch": 2.32, + "eval_loss": Infinity, + "eval_runtime": 544.5413, + "eval_samples_per_second": 20.698, + "eval_steps_per_second": 2.587, + "eval_wer": 0.3042423096318709, + "step": 13400 + }, + { + "epoch": 2.33, + "learning_rate": 0.00025479299547721205, + "loss": 0.2343, + "step": 13500 + }, + { + "epoch": 2.33, + "eval_loss": Infinity, + "eval_runtime": 541.9379, + "eval_samples_per_second": 20.798, + "eval_steps_per_second": 2.6, + "eval_wer": 0.2993675407631535, + "step": 13500 + }, + { + "epoch": 2.35, + "eval_loss": Infinity, + "eval_runtime": 544.0455, + "eval_samples_per_second": 20.717, + "eval_steps_per_second": 2.59, + "eval_wer": 0.3025823667843335, + "step": 13600 + }, + { + "epoch": 2.37, + "eval_loss": Infinity, + "eval_runtime": 542.9108, + "eval_samples_per_second": 20.76, + "eval_steps_per_second": 2.595, + "eval_wer": 0.307215498403093, + "step": 13700 + }, + { + "epoch": 2.39, + "eval_loss": Infinity, + "eval_runtime": 542.1131, + "eval_samples_per_second": 20.791, + "eval_steps_per_second": 2.599, + "eval_wer": 0.31030425281559926, + "step": 13800 + }, + { + "epoch": 2.4, + "eval_loss": Infinity, + "eval_runtime": 543.103, + "eval_samples_per_second": 20.753, + "eval_steps_per_second": 2.594, + "eval_wer": 0.3074781475878299, + "step": 13900 + }, + { + "epoch": 2.42, + "learning_rate": 0.0002530534616722718, + "loss": 0.2255, + "step": 14000 + }, + { + "epoch": 2.42, + "eval_loss": Infinity, + "eval_runtime": 541.4673, + "eval_samples_per_second": 20.816, + "eval_steps_per_second": 2.602, + "eval_wer": 0.3033072785342074, + "step": 14000 + }, + { + "epoch": 2.44, + "eval_loss": Infinity, + "eval_runtime": 544.3551, + "eval_samples_per_second": 20.705, + "eval_steps_per_second": 2.588, + "eval_wer": 0.301668347621449, + "step": 14100 + }, + { + "epoch": 2.46, + "eval_loss": Infinity, + "eval_runtime": 543.9092, + "eval_samples_per_second": 20.722, + "eval_steps_per_second": 2.591, + "eval_wer": 0.3094742813918306, + "step": 14200 + }, + { + "epoch": 2.47, + "eval_loss": Infinity, + "eval_runtime": 543.9507, + "eval_samples_per_second": 20.721, + "eval_steps_per_second": 2.59, + "eval_wer": 0.3030026054799126, + "step": 14300 + }, + { + "epoch": 2.49, + "eval_loss": Infinity, + "eval_runtime": 548.8025, + "eval_samples_per_second": 20.537, + "eval_steps_per_second": 2.567, + "eval_wer": 0.29882123045890063, + "step": 14400 + }, + { + "epoch": 2.51, + "learning_rate": 0.00025131392786733155, + "loss": 0.2266, + "step": 14500 + }, + { + "epoch": 2.51, + "eval_loss": Infinity, + "eval_runtime": 542.8924, + "eval_samples_per_second": 20.761, + "eval_steps_per_second": 2.595, + "eval_wer": 0.3069633551857455, + "step": 14500 + }, + { + "epoch": 2.53, + "eval_loss": Infinity, + "eval_runtime": 544.5732, + "eval_samples_per_second": 20.697, + "eval_steps_per_second": 2.587, + "eval_wer": 0.29389393175323586, + "step": 14600 + }, + { + "epoch": 2.54, + "eval_loss": Infinity, + "eval_runtime": 548.0549, + "eval_samples_per_second": 20.565, + "eval_steps_per_second": 2.571, + "eval_wer": 0.30245629517565975, + "step": 14700 + }, + { + "epoch": 2.56, + "eval_loss": Infinity, + "eval_runtime": 546.5456, + "eval_samples_per_second": 20.622, + "eval_steps_per_second": 2.578, + "eval_wer": 0.305366448142545, + "step": 14800 + }, + { + "epoch": 2.58, + "eval_loss": Infinity, + "eval_runtime": 542.2527, + "eval_samples_per_second": 20.786, + "eval_steps_per_second": 2.598, + "eval_wer": 0.30794041015296686, + "step": 14900 + }, + { + "epoch": 2.59, + "learning_rate": 0.00024957439406239124, + "loss": 0.2298, + "step": 15000 + }, + { + "epoch": 2.59, + "eval_loss": Infinity, + "eval_runtime": 541.872, + "eval_samples_per_second": 20.8, + "eval_steps_per_second": 2.6, + "eval_wer": 0.2883362750042024, + "step": 15000 + }, + { + "epoch": 2.61, + "eval_loss": Infinity, + "eval_runtime": 542.3187, + "eval_samples_per_second": 20.783, + "eval_steps_per_second": 2.598, + "eval_wer": 0.2941250630358043, + "step": 15100 + }, + { + "epoch": 2.63, + "eval_loss": Infinity, + "eval_runtime": 542.164, + "eval_samples_per_second": 20.789, + "eval_steps_per_second": 2.599, + "eval_wer": 0.2994515885022693, + "step": 15200 + }, + { + "epoch": 2.65, + "eval_loss": Infinity, + "eval_runtime": 543.4743, + "eval_samples_per_second": 20.739, + "eval_steps_per_second": 2.593, + "eval_wer": 0.3017523953605648, + "step": 15300 + }, + { + "epoch": 2.66, + "eval_loss": Infinity, + "eval_runtime": 544.8229, + "eval_samples_per_second": 20.687, + "eval_steps_per_second": 2.586, + "eval_wer": 0.30269793242561777, + "step": 15400 + }, + { + "epoch": 2.68, + "learning_rate": 0.000247834860257451, + "loss": 0.2269, + "step": 15500 + }, + { + "epoch": 2.68, + "eval_loss": Infinity, + "eval_runtime": 541.6192, + "eval_samples_per_second": 20.81, + "eval_steps_per_second": 2.601, + "eval_wer": 0.294051521264078, + "step": 15500 + }, + { + "epoch": 2.7, + "eval_loss": Infinity, + "eval_runtime": 543.4863, + "eval_samples_per_second": 20.738, + "eval_steps_per_second": 2.593, + "eval_wer": 0.2966254832744999, + "step": 15600 + }, + { + "epoch": 2.72, + "eval_loss": Infinity, + "eval_runtime": 543.1533, + "eval_samples_per_second": 20.751, + "eval_steps_per_second": 2.594, + "eval_wer": 0.29043746848209784, + "step": 15700 + }, + { + "epoch": 2.73, + "eval_loss": Infinity, + "eval_runtime": 545.1777, + "eval_samples_per_second": 20.674, + "eval_steps_per_second": 2.584, + "eval_wer": 0.2978336695242898, + "step": 15800 + }, + { + "epoch": 2.75, + "eval_loss": Infinity, + "eval_runtime": 542.6934, + "eval_samples_per_second": 20.769, + "eval_steps_per_second": 2.596, + "eval_wer": 0.28683392166750715, + "step": 15900 + }, + { + "epoch": 2.77, + "learning_rate": 0.0002460988055201206, + "loss": 0.2222, + "step": 16000 + }, + { + "epoch": 2.77, + "eval_loss": Infinity, + "eval_runtime": 541.9593, + "eval_samples_per_second": 20.797, + "eval_steps_per_second": 2.6, + "eval_wer": 0.3007858463607329, + "step": 16000 + }, + { + "epoch": 2.78, + "eval_loss": Infinity, + "eval_runtime": 544.4119, + "eval_samples_per_second": 20.703, + "eval_steps_per_second": 2.588, + "eval_wer": 0.2976235501765003, + "step": 16100 + }, + { + "epoch": 2.8, + "eval_loss": Infinity, + "eval_runtime": 542.8691, + "eval_samples_per_second": 20.762, + "eval_steps_per_second": 2.595, + "eval_wer": 0.29393595562279373, + "step": 16200 + }, + { + "epoch": 2.82, + "eval_loss": Infinity, + "eval_runtime": 543.4284, + "eval_samples_per_second": 20.741, + "eval_steps_per_second": 2.593, + "eval_wer": 0.2976970919482266, + "step": 16300 + }, + { + "epoch": 2.84, + "eval_loss": Infinity, + "eval_runtime": 540.9365, + "eval_samples_per_second": 20.836, + "eval_steps_per_second": 2.605, + "eval_wer": 0.2913724995797613, + "step": 16400 + }, + { + "epoch": 2.85, + "learning_rate": 0.0002443592717151803, + "loss": 0.2336, + "step": 16500 + }, + { + "epoch": 2.85, + "eval_loss": Infinity, + "eval_runtime": 542.3035, + "eval_samples_per_second": 20.784, + "eval_steps_per_second": 2.598, + "eval_wer": 0.2862981173306438, + "step": 16500 + }, + { + "epoch": 2.87, + "eval_loss": Infinity, + "eval_runtime": 540.4767, + "eval_samples_per_second": 20.854, + "eval_steps_per_second": 2.607, + "eval_wer": 0.29223398890569846, + "step": 16600 + }, + { + "epoch": 2.89, + "eval_loss": Infinity, + "eval_runtime": 544.1303, + "eval_samples_per_second": 20.714, + "eval_steps_per_second": 2.589, + "eval_wer": 0.29320053790553036, + "step": 16700 + }, + { + "epoch": 2.91, + "eval_loss": Infinity, + "eval_runtime": 544.5968, + "eval_samples_per_second": 20.696, + "eval_steps_per_second": 2.587, + "eval_wer": 0.2959741132963523, + "step": 16800 + }, + { + "epoch": 2.92, + "eval_loss": Infinity, + "eval_runtime": 544.104, + "eval_samples_per_second": 20.715, + "eval_steps_per_second": 2.59, + "eval_wer": 0.2904059505799294, + "step": 16900 + }, + { + "epoch": 2.94, + "learning_rate": 0.00024261973791024004, + "loss": 0.2275, + "step": 17000 + }, + { + "epoch": 2.94, + "eval_loss": Infinity, + "eval_runtime": 549.5031, + "eval_samples_per_second": 20.511, + "eval_steps_per_second": 2.564, + "eval_wer": 0.29583753572028915, + "step": 17000 + }, + { + "epoch": 2.96, + "eval_loss": Infinity, + "eval_runtime": 550.5262, + "eval_samples_per_second": 20.473, + "eval_steps_per_second": 2.559, + "eval_wer": 0.29877920658934276, + "step": 17100 + }, + { + "epoch": 2.97, + "eval_loss": Infinity, + "eval_runtime": 545.837, + "eval_samples_per_second": 20.649, + "eval_steps_per_second": 2.581, + "eval_wer": 0.2908787191124559, + "step": 17200 + }, + { + "epoch": 2.99, + "eval_loss": Infinity, + "eval_runtime": 542.7983, + "eval_samples_per_second": 20.765, + "eval_steps_per_second": 2.596, + "eval_wer": 0.30473609009917635, + "step": 17300 + }, + { + "epoch": 3.01, + "eval_loss": Infinity, + "eval_runtime": 542.8109, + "eval_samples_per_second": 20.764, + "eval_steps_per_second": 2.596, + "eval_wer": 0.3058182047402925, + "step": 17400 + }, + { + "epoch": 3.03, + "learning_rate": 0.00024088020410529976, + "loss": 0.2208, + "step": 17500 + }, + { + "epoch": 3.03, + "eval_loss": Infinity, + "eval_runtime": 544.3135, + "eval_samples_per_second": 20.707, + "eval_steps_per_second": 2.589, + "eval_wer": 0.2900172297865187, + "step": 17500 + }, + { + "epoch": 3.04, + "eval_loss": Infinity, + "eval_runtime": 544.1566, + "eval_samples_per_second": 20.713, + "eval_steps_per_second": 2.589, + "eval_wer": 0.2941040511010254, + "step": 17600 + }, + { + "epoch": 3.06, + "eval_loss": Infinity, + "eval_runtime": 544.4905, + "eval_samples_per_second": 20.7, + "eval_steps_per_second": 2.588, + "eval_wer": 0.28978609850395026, + "step": 17700 + }, + { + "epoch": 3.08, + "eval_loss": Infinity, + "eval_runtime": 542.4047, + "eval_samples_per_second": 20.78, + "eval_steps_per_second": 2.598, + "eval_wer": 0.2869389813414019, + "step": 17800 + }, + { + "epoch": 3.1, + "eval_loss": Infinity, + "eval_runtime": 542.3956, + "eval_samples_per_second": 20.78, + "eval_steps_per_second": 2.598, + "eval_wer": 0.3040847201210287, + "step": 17900 + }, + { + "epoch": 3.11, + "learning_rate": 0.00023914067030035948, + "loss": 0.192, + "step": 18000 + }, + { + "epoch": 3.11, + "eval_loss": Infinity, + "eval_runtime": 541.1082, + "eval_samples_per_second": 20.829, + "eval_steps_per_second": 2.604, + "eval_wer": 0.29535426122037317, + "step": 18000 + }, + { + "epoch": 3.13, + "eval_loss": Infinity, + "eval_runtime": 543.6529, + "eval_samples_per_second": 20.732, + "eval_steps_per_second": 2.592, + "eval_wer": 0.28465918641788535, + "step": 18100 + }, + { + "epoch": 3.15, + "eval_loss": Infinity, + "eval_runtime": 540.5467, + "eval_samples_per_second": 20.851, + "eval_steps_per_second": 2.607, + "eval_wer": 0.2999873928391326, + "step": 18200 + }, + { + "epoch": 3.16, + "eval_loss": Infinity, + "eval_runtime": 541.4182, + "eval_samples_per_second": 20.818, + "eval_steps_per_second": 2.602, + "eval_wer": 0.28889309127584467, + "step": 18300 + }, + { + "epoch": 3.18, + "eval_loss": Infinity, + "eval_runtime": 542.5022, + "eval_samples_per_second": 20.776, + "eval_steps_per_second": 2.597, + "eval_wer": 0.2883677929063708, + "step": 18400 + }, + { + "epoch": 3.2, + "learning_rate": 0.00023740113649541923, + "loss": 0.1883, + "step": 18500 + }, + { + "epoch": 3.2, + "eval_loss": Infinity, + "eval_runtime": 544.1075, + "eval_samples_per_second": 20.715, + "eval_steps_per_second": 2.59, + "eval_wer": 0.29573247604639435, + "step": 18500 + }, + { + "epoch": 3.22, + "eval_loss": Infinity, + "eval_runtime": 542.3164, + "eval_samples_per_second": 20.783, + "eval_steps_per_second": 2.598, + "eval_wer": 0.28954446125399225, + "step": 18600 + }, + { + "epoch": 3.23, + "eval_loss": Infinity, + "eval_runtime": 543.3924, + "eval_samples_per_second": 20.742, + "eval_steps_per_second": 2.593, + "eval_wer": 0.282978231635569, + "step": 18700 + }, + { + "epoch": 3.25, + "eval_loss": Infinity, + "eval_runtime": 542.6139, + "eval_samples_per_second": 20.772, + "eval_steps_per_second": 2.597, + "eval_wer": 0.2868759455370651, + "step": 18800 + }, + { + "epoch": 3.27, + "eval_loss": Infinity, + "eval_runtime": 543.143, + "eval_samples_per_second": 20.751, + "eval_steps_per_second": 2.594, + "eval_wer": 0.28079299041855776, + "step": 18900 + }, + { + "epoch": 3.29, + "learning_rate": 0.00023566160269047892, + "loss": 0.195, + "step": 19000 + }, + { + "epoch": 3.29, + "eval_loss": Infinity, + "eval_runtime": 542.4472, + "eval_samples_per_second": 20.778, + "eval_steps_per_second": 2.597, + "eval_wer": 0.28243192133131617, + "step": 19000 + }, + { + "epoch": 3.3, + "eval_loss": Infinity, + "eval_runtime": 540.0992, + "eval_samples_per_second": 20.868, + "eval_steps_per_second": 2.609, + "eval_wer": 0.29113086232980334, + "step": 19100 + }, + { + "epoch": 3.32, + "eval_loss": Infinity, + "eval_runtime": 542.3617, + "eval_samples_per_second": 20.781, + "eval_steps_per_second": 2.598, + "eval_wer": 0.2887144898302236, + "step": 19200 + }, + { + "epoch": 3.34, + "eval_loss": Infinity, + "eval_runtime": 541.9599, + "eval_samples_per_second": 20.797, + "eval_steps_per_second": 2.6, + "eval_wer": 0.28065641284249454, + "step": 19300 + }, + { + "epoch": 3.36, + "eval_loss": Infinity, + "eval_runtime": 544.4396, + "eval_samples_per_second": 20.702, + "eval_steps_per_second": 2.588, + "eval_wer": 0.28173852748361067, + "step": 19400 + }, + { + "epoch": 3.37, + "learning_rate": 0.00023392554795314855, + "loss": 0.1917, + "step": 19500 + }, + { + "epoch": 3.37, + "eval_loss": Infinity, + "eval_runtime": 541.3966, + "eval_samples_per_second": 20.818, + "eval_steps_per_second": 2.603, + "eval_wer": 0.29162464279710876, + "step": 19500 + }, + { + "epoch": 3.39, + "eval_loss": Infinity, + "eval_runtime": 541.7731, + "eval_samples_per_second": 20.804, + "eval_steps_per_second": 2.601, + "eval_wer": 0.28613002185241215, + "step": 19600 + }, + { + "epoch": 3.41, + "eval_loss": Infinity, + "eval_runtime": 542.4733, + "eval_samples_per_second": 20.777, + "eval_steps_per_second": 2.597, + "eval_wer": 0.2870545469826862, + "step": 19700 + }, + { + "epoch": 3.42, + "eval_loss": Infinity, + "eval_runtime": 541.7667, + "eval_samples_per_second": 20.804, + "eval_steps_per_second": 2.601, + "eval_wer": 0.28756933938477053, + "step": 19800 + }, + { + "epoch": 3.44, + "eval_loss": Infinity, + "eval_runtime": 541.3431, + "eval_samples_per_second": 20.82, + "eval_steps_per_second": 2.603, + "eval_wer": 0.28075096654899984, + "step": 19900 + }, + { + "epoch": 3.46, + "learning_rate": 0.00023218601414820827, + "loss": 0.1925, + "step": 20000 + }, + { + "epoch": 3.46, + "eval_loss": Infinity, + "eval_runtime": 541.8278, + "eval_samples_per_second": 20.802, + "eval_steps_per_second": 2.6, + "eval_wer": 0.29112035636241385, + "step": 20000 + }, + { + "epoch": 3.48, + "eval_loss": Infinity, + "eval_runtime": 547.1285, + "eval_samples_per_second": 20.6, + "eval_steps_per_second": 2.575, + "eval_wer": 0.2812237350815263, + "step": 20100 + }, + { + "epoch": 3.49, + "eval_loss": Infinity, + "eval_runtime": 541.0571, + "eval_samples_per_second": 20.831, + "eval_steps_per_second": 2.604, + "eval_wer": 0.27968986384266264, + "step": 20200 + }, + { + "epoch": 3.51, + "eval_loss": Infinity, + "eval_runtime": 541.9172, + "eval_samples_per_second": 20.798, + "eval_steps_per_second": 2.6, + "eval_wer": 0.282515969070432, + "step": 20300 + }, + { + "epoch": 3.53, + "eval_loss": Infinity, + "eval_runtime": 544.2103, + "eval_samples_per_second": 20.711, + "eval_steps_per_second": 2.589, + "eval_wer": 0.2877479408303917, + "step": 20400 + }, + { + "epoch": 3.55, + "learning_rate": 0.000230446480343268, + "loss": 0.1952, + "step": 20500 + }, + { + "epoch": 3.55, + "eval_loss": Infinity, + "eval_runtime": 544.2822, + "eval_samples_per_second": 20.708, + "eval_steps_per_second": 2.589, + "eval_wer": 0.2850058833417381, + "step": 20500 + }, + { + "epoch": 3.56, + "eval_loss": Infinity, + "eval_runtime": 540.3288, + "eval_samples_per_second": 20.86, + "eval_steps_per_second": 2.608, + "eval_wer": 0.2826630526138847, + "step": 20600 + }, + { + "epoch": 3.58, + "eval_loss": Infinity, + "eval_runtime": 540.8405, + "eval_samples_per_second": 20.84, + "eval_steps_per_second": 2.605, + "eval_wer": 0.2861195158850227, + "step": 20700 + }, + { + "epoch": 3.6, + "eval_loss": Infinity, + "eval_runtime": 543.3795, + "eval_samples_per_second": 20.742, + "eval_steps_per_second": 2.593, + "eval_wer": 0.284344007396201, + "step": 20800 + }, + { + "epoch": 3.61, + "eval_loss": Infinity, + "eval_runtime": 542.5007, + "eval_samples_per_second": 20.776, + "eval_steps_per_second": 2.597, + "eval_wer": 0.2957534879811733, + "step": 20900 + }, + { + "epoch": 3.63, + "learning_rate": 0.00022870694653832769, + "loss": 0.194, + "step": 21000 + }, + { + "epoch": 3.63, + "eval_loss": Infinity, + "eval_runtime": 541.5576, + "eval_samples_per_second": 20.812, + "eval_steps_per_second": 2.602, + "eval_wer": 0.2867708858631703, + "step": 21000 + }, + { + "epoch": 3.65, + "eval_loss": Infinity, + "eval_runtime": 542.9935, + "eval_samples_per_second": 20.757, + "eval_steps_per_second": 2.595, + "eval_wer": 0.2838082030593377, + "step": 21100 + }, + { + "epoch": 3.67, + "eval_loss": Infinity, + "eval_runtime": 541.3856, + "eval_samples_per_second": 20.819, + "eval_steps_per_second": 2.603, + "eval_wer": 0.2771999495713565, + "step": 21200 + }, + { + "epoch": 3.68, + "eval_loss": Infinity, + "eval_runtime": 542.358, + "eval_samples_per_second": 20.781, + "eval_steps_per_second": 2.598, + "eval_wer": 0.2796163220709363, + "step": 21300 + }, + { + "epoch": 3.7, + "eval_loss": Infinity, + "eval_runtime": 541.9323, + "eval_samples_per_second": 20.798, + "eval_steps_per_second": 2.6, + "eval_wer": 0.27928013111447303, + "step": 21400 + }, + { + "epoch": 3.72, + "learning_rate": 0.00022696741273338744, + "loss": 0.1912, + "step": 21500 + }, + { + "epoch": 3.72, + "eval_loss": Infinity, + "eval_runtime": 542.4498, + "eval_samples_per_second": 20.778, + "eval_steps_per_second": 2.597, + "eval_wer": 0.2811186754076315, + "step": 21500 + }, + { + "epoch": 3.74, + "eval_loss": Infinity, + "eval_runtime": 541.1622, + "eval_samples_per_second": 20.827, + "eval_steps_per_second": 2.604, + "eval_wer": 0.27576063203899814, + "step": 21600 + }, + { + "epoch": 3.75, + "eval_loss": Infinity, + "eval_runtime": 544.4094, + "eval_samples_per_second": 20.703, + "eval_steps_per_second": 2.588, + "eval_wer": 0.28317784501596904, + "step": 21700 + }, + { + "epoch": 3.77, + "eval_loss": Infinity, + "eval_runtime": 541.8456, + "eval_samples_per_second": 20.801, + "eval_steps_per_second": 2.6, + "eval_wer": 0.2731131282568499, + "step": 21800 + }, + { + "epoch": 3.79, + "eval_loss": Infinity, + "eval_runtime": 541.5491, + "eval_samples_per_second": 20.813, + "eval_steps_per_second": 2.602, + "eval_wer": 0.27668515716927217, + "step": 21900 + }, + { + "epoch": 3.8, + "learning_rate": 0.00022522787892844716, + "loss": 0.1966, + "step": 22000 + }, + { + "epoch": 3.8, + "eval_loss": Infinity, + "eval_runtime": 542.4841, + "eval_samples_per_second": 20.777, + "eval_steps_per_second": 2.597, + "eval_wer": 0.27910152966885193, + "step": 22000 + }, + { + "epoch": 3.82, + "eval_loss": Infinity, + "eval_runtime": 545.5878, + "eval_samples_per_second": 20.658, + "eval_steps_per_second": 2.583, + "eval_wer": 0.28655026054799126, + "step": 22100 + }, + { + "epoch": 3.84, + "eval_loss": Infinity, + "eval_runtime": 541.4456, + "eval_samples_per_second": 20.816, + "eval_steps_per_second": 2.602, + "eval_wer": 0.28485879979828543, + "step": 22200 + }, + { + "epoch": 3.86, + "eval_loss": Infinity, + "eval_runtime": 541.8429, + "eval_samples_per_second": 20.801, + "eval_steps_per_second": 2.6, + "eval_wer": 0.28729618423264414, + "step": 22300 + }, + { + "epoch": 3.87, + "eval_loss": Infinity, + "eval_runtime": 546.2903, + "eval_samples_per_second": 20.632, + "eval_steps_per_second": 2.579, + "eval_wer": 0.28351403597243235, + "step": 22400 + }, + { + "epoch": 3.89, + "learning_rate": 0.00022349182419111678, + "loss": 0.1932, + "step": 22500 + }, + { + "epoch": 3.89, + "eval_loss": Infinity, + "eval_runtime": 544.9851, + "eval_samples_per_second": 20.681, + "eval_steps_per_second": 2.585, + "eval_wer": 0.2781454866364095, + "step": 22500 + }, + { + "epoch": 3.91, + "eval_loss": Infinity, + "eval_runtime": 543.4194, + "eval_samples_per_second": 20.741, + "eval_steps_per_second": 2.593, + "eval_wer": 0.27511976802824006, + "step": 22600 + }, + { + "epoch": 3.93, + "eval_loss": Infinity, + "eval_runtime": 542.5928, + "eval_samples_per_second": 20.772, + "eval_steps_per_second": 2.597, + "eval_wer": 0.2871280887544125, + "step": 22700 + }, + { + "epoch": 3.94, + "eval_loss": Infinity, + "eval_runtime": 543.1769, + "eval_samples_per_second": 20.75, + "eval_steps_per_second": 2.594, + "eval_wer": 0.2715162212136494, + "step": 22800 + }, + { + "epoch": 3.96, + "eval_loss": Infinity, + "eval_runtime": 542.7369, + "eval_samples_per_second": 20.767, + "eval_steps_per_second": 2.596, + "eval_wer": 0.28232686165742144, + "step": 22900 + }, + { + "epoch": 3.98, + "learning_rate": 0.00022175229038617648, + "loss": 0.1928, + "step": 23000 + }, + { + "epoch": 3.98, + "eval_loss": Infinity, + "eval_runtime": 541.6129, + "eval_samples_per_second": 20.81, + "eval_steps_per_second": 2.601, + "eval_wer": 0.28185409312489496, + "step": 23000 + }, + { + "epoch": 4.0, + "eval_loss": Infinity, + "eval_runtime": 541.322, + "eval_samples_per_second": 20.821, + "eval_steps_per_second": 2.603, + "eval_wer": 0.27848167759287273, + "step": 23100 + }, + { + "epoch": 4.01, + "eval_loss": Infinity, + "eval_runtime": 543.2229, + "eval_samples_per_second": 20.748, + "eval_steps_per_second": 2.594, + "eval_wer": 0.2746680114304925, + "step": 23200 + }, + { + "epoch": 4.03, + "eval_loss": Infinity, + "eval_runtime": 545.8357, + "eval_samples_per_second": 20.649, + "eval_steps_per_second": 2.581, + "eval_wer": 0.27156875105059675, + "step": 23300 + }, + { + "epoch": 4.05, + "eval_loss": Infinity, + "eval_runtime": 543.6397, + "eval_samples_per_second": 20.732, + "eval_steps_per_second": 2.592, + "eval_wer": 0.2673243402252479, + "step": 23400 + }, + { + "epoch": 4.06, + "learning_rate": 0.0002200127565812362, + "loss": 0.1651, + "step": 23500 + }, + { + "epoch": 4.06, + "eval_loss": Infinity, + "eval_runtime": 545.2541, + "eval_samples_per_second": 20.671, + "eval_steps_per_second": 2.584, + "eval_wer": 0.2795637922339889, + "step": 23500 + }, + { + "epoch": 4.08, + "eval_loss": Infinity, + "eval_runtime": 541.1431, + "eval_samples_per_second": 20.828, + "eval_steps_per_second": 2.604, + "eval_wer": 0.2786602790384939, + "step": 23600 + }, + { + "epoch": 4.1, + "eval_loss": Infinity, + "eval_runtime": 542.8901, + "eval_samples_per_second": 20.761, + "eval_steps_per_second": 2.595, + "eval_wer": 0.2709488989746176, + "step": 23700 + }, + { + "epoch": 4.12, + "eval_loss": Infinity, + "eval_runtime": 541.6991, + "eval_samples_per_second": 20.807, + "eval_steps_per_second": 2.601, + "eval_wer": 0.28349302403765336, + "step": 23800 + }, + { + "epoch": 4.13, + "eval_loss": Infinity, + "eval_runtime": 542.3686, + "eval_samples_per_second": 20.781, + "eval_steps_per_second": 2.598, + "eval_wer": 0.27752563456043033, + "step": 23900 + }, + { + "epoch": 4.15, + "learning_rate": 0.00021827322277629592, + "loss": 0.1678, + "step": 24000 + }, + { + "epoch": 4.15, + "eval_loss": Infinity, + "eval_runtime": 543.089, + "eval_samples_per_second": 20.754, + "eval_steps_per_second": 2.594, + "eval_wer": 0.27352286098503953, + "step": 24000 + }, + { + "epoch": 4.17, + "eval_loss": Infinity, + "eval_runtime": 545.6128, + "eval_samples_per_second": 20.658, + "eval_steps_per_second": 2.582, + "eval_wer": 0.2738695579088922, + "step": 24100 + }, + { + "epoch": 4.19, + "eval_loss": Infinity, + "eval_runtime": 541.6932, + "eval_samples_per_second": 20.807, + "eval_steps_per_second": 2.601, + "eval_wer": 0.2723041687678601, + "step": 24200 + }, + { + "epoch": 4.2, + "eval_loss": Infinity, + "eval_runtime": 543.1454, + "eval_samples_per_second": 20.751, + "eval_steps_per_second": 2.594, + "eval_wer": 0.27206253151790216, + "step": 24300 + }, + { + "epoch": 4.22, + "eval_loss": Infinity, + "eval_runtime": 541.1009, + "eval_samples_per_second": 20.83, + "eval_steps_per_second": 2.604, + "eval_wer": 0.2682698772903009, + "step": 24400 + }, + { + "epoch": 4.24, + "learning_rate": 0.00021653716803896555, + "loss": 0.1701, + "step": 24500 + }, + { + "epoch": 4.24, + "eval_loss": Infinity, + "eval_runtime": 547.7655, + "eval_samples_per_second": 20.576, + "eval_steps_per_second": 2.572, + "eval_wer": 0.270539166246428, + "step": 24500 + }, + { + "epoch": 4.25, + "eval_loss": Infinity, + "eval_runtime": 546.8009, + "eval_samples_per_second": 20.613, + "eval_steps_per_second": 2.577, + "eval_wer": 0.27438435031097663, + "step": 24600 + }, + { + "epoch": 4.27, + "eval_loss": Infinity, + "eval_runtime": 544.7395, + "eval_samples_per_second": 20.691, + "eval_steps_per_second": 2.587, + "eval_wer": 0.2675029416708691, + "step": 24700 + }, + { + "epoch": 4.29, + "eval_loss": Infinity, + "eval_runtime": 541.3702, + "eval_samples_per_second": 20.819, + "eval_steps_per_second": 2.603, + "eval_wer": 0.272125567322239, + "step": 24800 + }, + { + "epoch": 4.31, + "eval_loss": Infinity, + "eval_runtime": 541.2194, + "eval_samples_per_second": 20.825, + "eval_steps_per_second": 2.603, + "eval_wer": 0.270055891746512, + "step": 24900 + }, + { + "epoch": 4.32, + "learning_rate": 0.00021479763423402524, + "loss": 0.1681, + "step": 25000 + }, + { + "epoch": 4.32, + "eval_loss": Infinity, + "eval_runtime": 543.6583, + "eval_samples_per_second": 20.732, + "eval_steps_per_second": 2.592, + "eval_wer": 0.2697407127248277, + "step": 25000 + }, + { + "epoch": 4.34, + "eval_loss": Infinity, + "eval_runtime": 541.8047, + "eval_samples_per_second": 20.803, + "eval_steps_per_second": 2.601, + "eval_wer": 0.26358421583459407, + "step": 25100 + }, + { + "epoch": 4.36, + "eval_loss": Infinity, + "eval_runtime": 542.7168, + "eval_samples_per_second": 20.768, + "eval_steps_per_second": 2.596, + "eval_wer": 0.2710329467137334, + "step": 25200 + }, + { + "epoch": 4.38, + "eval_loss": Infinity, + "eval_runtime": 542.9637, + "eval_samples_per_second": 20.758, + "eval_steps_per_second": 2.595, + "eval_wer": 0.2671982686165742, + "step": 25300 + }, + { + "epoch": 4.39, + "eval_loss": Infinity, + "eval_runtime": 544.2227, + "eval_samples_per_second": 20.71, + "eval_steps_per_second": 2.589, + "eval_wer": 0.26634728525802653, + "step": 25400 + }, + { + "epoch": 4.41, + "learning_rate": 0.00021306157949669486, + "loss": 0.1686, + "step": 25500 + }, + { + "epoch": 4.41, + "eval_loss": Infinity, + "eval_runtime": 543.0802, + "eval_samples_per_second": 20.754, + "eval_steps_per_second": 2.594, + "eval_wer": 0.2682173474533535, + "step": 25500 + }, + { + "epoch": 4.43, + "eval_loss": Infinity, + "eval_runtime": 542.2325, + "eval_samples_per_second": 20.786, + "eval_steps_per_second": 2.599, + "eval_wer": 0.2665363926710371, + "step": 25600 + }, + { + "epoch": 4.44, + "eval_loss": Infinity, + "eval_runtime": 544.8929, + "eval_samples_per_second": 20.685, + "eval_steps_per_second": 2.586, + "eval_wer": 0.2659480584972264, + "step": 25700 + }, + { + "epoch": 4.46, + "eval_loss": Infinity, + "eval_runtime": 544.4755, + "eval_samples_per_second": 20.701, + "eval_steps_per_second": 2.588, + "eval_wer": 0.26376281728021517, + "step": 25800 + }, + { + "epoch": 4.48, + "eval_loss": Infinity, + "eval_runtime": 545.5151, + "eval_samples_per_second": 20.661, + "eval_steps_per_second": 2.583, + "eval_wer": 0.2654437720625315, + "step": 25900 + }, + { + "epoch": 4.5, + "learning_rate": 0.00021132204569175459, + "loss": 0.1704, + "step": 26000 + }, + { + "epoch": 4.5, + "eval_loss": Infinity, + "eval_runtime": 544.8363, + "eval_samples_per_second": 20.687, + "eval_steps_per_second": 2.586, + "eval_wer": 0.2693624978988065, + "step": 26000 + }, + { + "epoch": 4.51, + "eval_loss": Infinity, + "eval_runtime": 542.9637, + "eval_samples_per_second": 20.758, + "eval_steps_per_second": 2.595, + "eval_wer": 0.2657379391494369, + "step": 26100 + }, + { + "epoch": 4.53, + "eval_loss": Infinity, + "eval_runtime": 542.0387, + "eval_samples_per_second": 20.794, + "eval_steps_per_second": 2.599, + "eval_wer": 0.26736636409480585, + "step": 26200 + }, + { + "epoch": 4.55, + "eval_loss": Infinity, + "eval_runtime": 540.8149, + "eval_samples_per_second": 20.841, + "eval_steps_per_second": 2.605, + "eval_wer": 0.27195747184400737, + "step": 26300 + }, + { + "epoch": 4.57, + "eval_loss": Infinity, + "eval_runtime": 543.2221, + "eval_samples_per_second": 20.748, + "eval_steps_per_second": 2.594, + "eval_wer": 0.2743108085392503, + "step": 26400 + }, + { + "epoch": 4.58, + "learning_rate": 0.00020958251188681434, + "loss": 0.1646, + "step": 26500 + }, + { + "epoch": 4.58, + "eval_loss": Infinity, + "eval_runtime": 544.9463, + "eval_samples_per_second": 20.683, + "eval_steps_per_second": 2.586, + "eval_wer": 0.27350184905026054, + "step": 26500 + }, + { + "epoch": 4.6, + "eval_loss": Infinity, + "eval_runtime": 544.3881, + "eval_samples_per_second": 20.704, + "eval_steps_per_second": 2.588, + "eval_wer": 0.2658745167255001, + "step": 26600 + }, + { + "epoch": 4.62, + "eval_loss": Infinity, + "eval_runtime": 544.4068, + "eval_samples_per_second": 20.703, + "eval_steps_per_second": 2.588, + "eval_wer": 0.26746091780131115, + "step": 26700 + }, + { + "epoch": 4.64, + "eval_loss": Infinity, + "eval_runtime": 543.2382, + "eval_samples_per_second": 20.748, + "eval_steps_per_second": 2.594, + "eval_wer": 0.2743108085392503, + "step": 26800 + }, + { + "epoch": 4.65, + "eval_loss": Infinity, + "eval_runtime": 543.0733, + "eval_samples_per_second": 20.754, + "eval_steps_per_second": 2.594, + "eval_wer": 0.2641725500084048, + "step": 26900 + }, + { + "epoch": 4.67, + "learning_rate": 0.00020784297808187406, + "loss": 0.1662, + "step": 27000 + }, + { + "epoch": 4.67, + "eval_loss": Infinity, + "eval_runtime": 542.9197, + "eval_samples_per_second": 20.76, + "eval_steps_per_second": 2.595, + "eval_wer": 0.2652231467473525, + "step": 27000 + }, + { + "epoch": 4.69, + "eval_loss": Infinity, + "eval_runtime": 543.0343, + "eval_samples_per_second": 20.756, + "eval_steps_per_second": 2.595, + "eval_wer": 0.26765002521432174, + "step": 27100 + }, + { + "epoch": 4.7, + "eval_loss": Infinity, + "eval_runtime": 543.1054, + "eval_samples_per_second": 20.753, + "eval_steps_per_second": 2.594, + "eval_wer": 0.26988779626828036, + "step": 27200 + }, + { + "epoch": 4.72, + "eval_loss": Infinity, + "eval_runtime": 543.2158, + "eval_samples_per_second": 20.749, + "eval_steps_per_second": 2.594, + "eval_wer": 0.26490796772566816, + "step": 27300 + }, + { + "epoch": 4.74, + "eval_loss": Infinity, + "eval_runtime": 542.913, + "eval_samples_per_second": 20.76, + "eval_steps_per_second": 2.595, + "eval_wer": 0.26394141872583626, + "step": 27400 + }, + { + "epoch": 4.76, + "learning_rate": 0.00020610344427693375, + "loss": 0.1713, + "step": 27500 + }, + { + "epoch": 4.76, + "eval_loss": Infinity, + "eval_runtime": 543.0263, + "eval_samples_per_second": 20.756, + "eval_steps_per_second": 2.595, + "eval_wer": 0.2634056143889729, + "step": 27500 + }, + { + "epoch": 4.77, + "eval_loss": Infinity, + "eval_runtime": 542.6947, + "eval_samples_per_second": 20.769, + "eval_steps_per_second": 2.596, + "eval_wer": 0.26396243066061525, + "step": 27600 + }, + { + "epoch": 4.79, + "eval_loss": Infinity, + "eval_runtime": 553.6288, + "eval_samples_per_second": 20.358, + "eval_steps_per_second": 2.545, + "eval_wer": 0.2604744494873088, + "step": 27700 + }, + { + "epoch": 4.81, + "eval_loss": Infinity, + "eval_runtime": 542.7462, + "eval_samples_per_second": 20.767, + "eval_steps_per_second": 2.596, + "eval_wer": 0.25767986216170785, + "step": 27800 + }, + { + "epoch": 4.83, + "eval_loss": Infinity, + "eval_runtime": 543.1573, + "eval_samples_per_second": 20.751, + "eval_steps_per_second": 2.594, + "eval_wer": 0.26473987224743656, + "step": 27900 + }, + { + "epoch": 4.84, + "learning_rate": 0.00020436391047199347, + "loss": 0.1674, + "step": 28000 + }, + { + "epoch": 4.84, + "eval_loss": Infinity, + "eval_runtime": 542.5497, + "eval_samples_per_second": 20.774, + "eval_steps_per_second": 2.597, + "eval_wer": 0.2605164733568667, + "step": 28000 + }, + { + "epoch": 4.86, + "eval_loss": Infinity, + "eval_runtime": 542.4903, + "eval_samples_per_second": 20.776, + "eval_steps_per_second": 2.597, + "eval_wer": 0.2551689359556228, + "step": 28100 + }, + { + "epoch": 4.88, + "eval_loss": Infinity, + "eval_runtime": 542.4923, + "eval_samples_per_second": 20.776, + "eval_steps_per_second": 2.597, + "eval_wer": 0.2640254664649521, + "step": 28200 + }, + { + "epoch": 4.89, + "eval_loss": Infinity, + "eval_runtime": 543.3538, + "eval_samples_per_second": 20.743, + "eval_steps_per_second": 2.593, + "eval_wer": 0.26158808203059336, + "step": 28300 + }, + { + "epoch": 4.91, + "eval_loss": Infinity, + "eval_runtime": 544.8688, + "eval_samples_per_second": 20.686, + "eval_steps_per_second": 2.586, + "eval_wer": 0.2625021011934779, + "step": 28400 + }, + { + "epoch": 4.93, + "learning_rate": 0.00020262437666705322, + "loss": 0.1627, + "step": 28500 + }, + { + "epoch": 4.93, + "eval_loss": Infinity, + "eval_runtime": 545.1106, + "eval_samples_per_second": 20.677, + "eval_steps_per_second": 2.585, + "eval_wer": 0.2595919482265927, + "step": 28500 + }, + { + "epoch": 4.95, + "eval_loss": Infinity, + "eval_runtime": 545.1809, + "eval_samples_per_second": 20.674, + "eval_steps_per_second": 2.584, + "eval_wer": 0.2587724827702135, + "step": 28600 + }, + { + "epoch": 4.96, + "eval_loss": Infinity, + "eval_runtime": 543.2839, + "eval_samples_per_second": 20.746, + "eval_steps_per_second": 2.593, + "eval_wer": 0.27188393007228107, + "step": 28700 + }, + { + "epoch": 4.98, + "eval_loss": Infinity, + "eval_runtime": 543.3434, + "eval_samples_per_second": 20.744, + "eval_steps_per_second": 2.593, + "eval_wer": 0.26246007732391996, + "step": 28800 + }, + { + "epoch": 5.0, + "eval_loss": Infinity, + "eval_runtime": 544.0956, + "eval_samples_per_second": 20.715, + "eval_steps_per_second": 2.59, + "eval_wer": 0.2631009413346781, + "step": 28900 + }, + { + "epoch": 5.02, + "learning_rate": 0.00020088484286211295, + "loss": 0.162, + "step": 29000 + }, + { + "epoch": 5.02, + "eval_loss": Infinity, + "eval_runtime": 543.4223, + "eval_samples_per_second": 20.741, + "eval_steps_per_second": 2.593, + "eval_wer": 0.26189275508488824, + "step": 29000 + }, + { + "epoch": 5.03, + "eval_loss": Infinity, + "eval_runtime": 548.0793, + "eval_samples_per_second": 20.565, + "eval_steps_per_second": 2.571, + "eval_wer": 0.25953941838964534, + "step": 29100 + }, + { + "epoch": 5.05, + "eval_loss": Infinity, + "eval_runtime": 548.6875, + "eval_samples_per_second": 20.542, + "eval_steps_per_second": 2.568, + "eval_wer": 0.2667885358883846, + "step": 29200 + }, + { + "epoch": 5.07, + "eval_loss": Infinity, + "eval_runtime": 550.2049, + "eval_samples_per_second": 20.485, + "eval_steps_per_second": 2.561, + "eval_wer": 0.26004370482434025, + "step": 29300 + }, + { + "epoch": 5.08, + "eval_loss": Infinity, + "eval_runtime": 542.8181, + "eval_samples_per_second": 20.764, + "eval_steps_per_second": 2.596, + "eval_wer": 0.2608841822154984, + "step": 29400 + }, + { + "epoch": 5.1, + "learning_rate": 0.00019914530905717264, + "loss": 0.147, + "step": 29500 + }, + { + "epoch": 5.1, + "eval_loss": Infinity, + "eval_runtime": 543.4487, + "eval_samples_per_second": 20.74, + "eval_steps_per_second": 2.593, + "eval_wer": 0.2654647839973105, + "step": 29500 + }, + { + "epoch": 5.12, + "eval_loss": Infinity, + "eval_runtime": 543.1438, + "eval_samples_per_second": 20.751, + "eval_steps_per_second": 2.594, + "eval_wer": 0.2614515044545302, + "step": 29600 + }, + { + "epoch": 5.14, + "eval_loss": Infinity, + "eval_runtime": 547.647, + "eval_samples_per_second": 20.581, + "eval_steps_per_second": 2.573, + "eval_wer": 0.26274373844343585, + "step": 29700 + }, + { + "epoch": 5.15, + "eval_loss": Infinity, + "eval_runtime": 544.3766, + "eval_samples_per_second": 20.704, + "eval_steps_per_second": 2.588, + "eval_wer": 0.26189275508488824, + "step": 29800 + }, + { + "epoch": 5.17, + "eval_loss": Infinity, + "eval_runtime": 542.734, + "eval_samples_per_second": 20.767, + "eval_steps_per_second": 2.596, + "eval_wer": 0.2622289460413515, + "step": 29900 + }, + { + "epoch": 5.19, + "learning_rate": 0.0001974057752522324, + "loss": 0.1441, + "step": 30000 + }, + { + "epoch": 5.19, + "eval_loss": Infinity, + "eval_runtime": 545.8282, + "eval_samples_per_second": 20.649, + "eval_steps_per_second": 2.581, + "eval_wer": 0.25874096486804504, + "step": 30000 + }, + { + "epoch": 5.21, + "eval_loss": Infinity, + "eval_runtime": 542.7688, + "eval_samples_per_second": 20.766, + "eval_steps_per_second": 2.596, + "eval_wer": 0.25953941838964534, + "step": 30100 + }, + { + "epoch": 5.22, + "eval_loss": Infinity, + "eval_runtime": 544.0516, + "eval_samples_per_second": 20.717, + "eval_steps_per_second": 2.59, + "eval_wer": 0.2589090603462767, + "step": 30200 + }, + { + "epoch": 5.24, + "eval_loss": Infinity, + "eval_runtime": 541.9109, + "eval_samples_per_second": 20.799, + "eval_steps_per_second": 2.6, + "eval_wer": 0.256912926542276, + "step": 30300 + }, + { + "epoch": 5.26, + "eval_loss": Infinity, + "eval_runtime": 542.1921, + "eval_samples_per_second": 20.788, + "eval_steps_per_second": 2.599, + "eval_wer": 0.26571692721465795, + "step": 30400 + }, + { + "epoch": 5.27, + "learning_rate": 0.0001956662414472921, + "loss": 0.1446, + "step": 30500 + }, + { + "epoch": 5.27, + "eval_loss": Infinity, + "eval_runtime": 541.0843, + "eval_samples_per_second": 20.83, + "eval_steps_per_second": 2.604, + "eval_wer": 0.2649499915952261, + "step": 30500 + }, + { + "epoch": 5.29, + "eval_loss": Infinity, + "eval_runtime": 542.2461, + "eval_samples_per_second": 20.786, + "eval_steps_per_second": 2.598, + "eval_wer": 0.25893007228105563, + "step": 30600 + }, + { + "epoch": 5.31, + "eval_loss": Infinity, + "eval_runtime": 542.4141, + "eval_samples_per_second": 20.779, + "eval_steps_per_second": 2.598, + "eval_wer": 0.255084888216507, + "step": 30700 + }, + { + "epoch": 5.33, + "eval_loss": Infinity, + "eval_runtime": 545.8125, + "eval_samples_per_second": 20.65, + "eval_steps_per_second": 2.581, + "eval_wer": 0.2588565305093293, + "step": 30800 + }, + { + "epoch": 5.34, + "eval_loss": Infinity, + "eval_runtime": 542.3161, + "eval_samples_per_second": 20.783, + "eval_steps_per_second": 2.598, + "eval_wer": 0.2544335182383594, + "step": 30900 + }, + { + "epoch": 5.36, + "learning_rate": 0.00019392670764235183, + "loss": 0.146, + "step": 31000 + }, + { + "epoch": 5.36, + "eval_loss": Infinity, + "eval_runtime": 543.7391, + "eval_samples_per_second": 20.729, + "eval_steps_per_second": 2.591, + "eval_wer": 0.25232181879307447, + "step": 31000 + }, + { + "epoch": 5.38, + "eval_loss": Infinity, + "eval_runtime": 543.7175, + "eval_samples_per_second": 20.73, + "eval_steps_per_second": 2.591, + "eval_wer": 0.2579845352160027, + "step": 31100 + }, + { + "epoch": 5.4, + "eval_loss": Infinity, + "eval_runtime": 545.4245, + "eval_samples_per_second": 20.665, + "eval_steps_per_second": 2.583, + "eval_wer": 0.25971801983526643, + "step": 31200 + }, + { + "epoch": 5.41, + "eval_loss": Infinity, + "eval_runtime": 543.7184, + "eval_samples_per_second": 20.729, + "eval_steps_per_second": 2.591, + "eval_wer": 0.2649499915952261, + "step": 31300 + }, + { + "epoch": 5.43, + "eval_loss": Infinity, + "eval_runtime": 544.3584, + "eval_samples_per_second": 20.705, + "eval_steps_per_second": 2.588, + "eval_wer": 0.26140948058497226, + "step": 31400 + }, + { + "epoch": 5.45, + "learning_rate": 0.00019218717383741156, + "loss": 0.1512, + "step": 31500 + }, + { + "epoch": 5.45, + "eval_loss": Infinity, + "eval_runtime": 543.9248, + "eval_samples_per_second": 20.722, + "eval_steps_per_second": 2.59, + "eval_wer": 0.2576588502269289, + "step": 31500 + }, + { + "epoch": 5.47, + "eval_loss": Infinity, + "eval_runtime": 543.2727, + "eval_samples_per_second": 20.746, + "eval_steps_per_second": 2.594, + "eval_wer": 0.2623129937804673, + "step": 31600 + }, + { + "epoch": 5.48, + "eval_loss": Infinity, + "eval_runtime": 544.7565, + "eval_samples_per_second": 20.69, + "eval_steps_per_second": 2.586, + "eval_wer": 0.25522146579257016, + "step": 31700 + }, + { + "epoch": 5.5, + "eval_loss": Infinity, + "eval_runtime": 542.465, + "eval_samples_per_second": 20.777, + "eval_steps_per_second": 2.597, + "eval_wer": 0.2526264918473693, + "step": 31800 + }, + { + "epoch": 5.52, + "eval_loss": Infinity, + "eval_runtime": 541.8171, + "eval_samples_per_second": 20.802, + "eval_steps_per_second": 2.601, + "eval_wer": 0.25689191460749705, + "step": 31900 + }, + { + "epoch": 5.53, + "learning_rate": 0.0001904476400324713, + "loss": 0.1489, + "step": 32000 + }, + { + "epoch": 5.53, + "eval_loss": Infinity, + "eval_runtime": 554.5484, + "eval_samples_per_second": 20.325, + "eval_steps_per_second": 2.541, + "eval_wer": 0.2555681627164229, + "step": 32000 + }, + { + "epoch": 5.55, + "eval_loss": Infinity, + "eval_runtime": 541.0928, + "eval_samples_per_second": 20.83, + "eval_steps_per_second": 2.604, + "eval_wer": 0.2576483442595394, + "step": 32100 + }, + { + "epoch": 5.57, + "eval_loss": Infinity, + "eval_runtime": 555.6973, + "eval_samples_per_second": 20.283, + "eval_steps_per_second": 2.536, + "eval_wer": 0.2543389645318541, + "step": 32200 + }, + { + "epoch": 5.59, + "eval_loss": Infinity, + "eval_runtime": 541.7763, + "eval_samples_per_second": 20.804, + "eval_steps_per_second": 2.601, + "eval_wer": 0.25343545133635903, + "step": 32300 + }, + { + "epoch": 5.6, + "eval_loss": Infinity, + "eval_runtime": 543.9041, + "eval_samples_per_second": 20.722, + "eval_steps_per_second": 2.591, + "eval_wer": 0.25112413851067406, + "step": 32400 + }, + { + "epoch": 5.62, + "learning_rate": 0.00018871158529514087, + "loss": 0.1482, + "step": 32500 + }, + { + "epoch": 5.62, + "eval_loss": Infinity, + "eval_runtime": 542.0995, + "eval_samples_per_second": 20.791, + "eval_steps_per_second": 2.599, + "eval_wer": 0.2581631366616238, + "step": 32500 + }, + { + "epoch": 5.64, + "eval_loss": Infinity, + "eval_runtime": 542.5978, + "eval_samples_per_second": 20.772, + "eval_steps_per_second": 2.597, + "eval_wer": 0.2593923348461926, + "step": 32600 + }, + { + "epoch": 5.66, + "eval_loss": Infinity, + "eval_runtime": 542.1323, + "eval_samples_per_second": 20.79, + "eval_steps_per_second": 2.599, + "eval_wer": 0.2545806017818121, + "step": 32700 + }, + { + "epoch": 5.67, + "eval_loss": Infinity, + "eval_runtime": 543.4344, + "eval_samples_per_second": 20.74, + "eval_steps_per_second": 2.593, + "eval_wer": 0.24796184232644142, + "step": 32800 + }, + { + "epoch": 5.69, + "eval_loss": Infinity, + "eval_runtime": 543.5989, + "eval_samples_per_second": 20.734, + "eval_steps_per_second": 2.592, + "eval_wer": 0.2610417717263406, + "step": 32900 + }, + { + "epoch": 5.71, + "learning_rate": 0.00018697205149020062, + "loss": 0.1379, + "step": 33000 + }, + { + "epoch": 5.71, + "eval_loss": Infinity, + "eval_runtime": 545.9938, + "eval_samples_per_second": 20.643, + "eval_steps_per_second": 2.581, + "eval_wer": 0.2549798285426122, + "step": 33000 + }, + { + "epoch": 5.72, + "eval_loss": Infinity, + "eval_runtime": 542.7219, + "eval_samples_per_second": 20.768, + "eval_steps_per_second": 2.596, + "eval_wer": 0.2584467977811397, + "step": 33100 + }, + { + "epoch": 5.74, + "eval_loss": Infinity, + "eval_runtime": 542.3547, + "eval_samples_per_second": 20.782, + "eval_steps_per_second": 2.598, + "eval_wer": 0.2568603967053286, + "step": 33200 + }, + { + "epoch": 5.76, + "eval_loss": Infinity, + "eval_runtime": 542.4176, + "eval_samples_per_second": 20.779, + "eval_steps_per_second": 2.598, + "eval_wer": 0.25814212472684483, + "step": 33300 + }, + { + "epoch": 5.78, + "eval_loss": Infinity, + "eval_runtime": 543.6528, + "eval_samples_per_second": 20.732, + "eval_steps_per_second": 2.592, + "eval_wer": 0.26317448310640446, + "step": 33400 + }, + { + "epoch": 5.79, + "learning_rate": 0.00018523599675287022, + "loss": 0.1469, + "step": 33500 + }, + { + "epoch": 5.79, + "eval_loss": Infinity, + "eval_runtime": 543.1136, + "eval_samples_per_second": 20.753, + "eval_steps_per_second": 2.594, + "eval_wer": 0.25725962346612874, + "step": 33500 + }, + { + "epoch": 5.81, + "eval_loss": Infinity, + "eval_runtime": 544.0134, + "eval_samples_per_second": 20.718, + "eval_steps_per_second": 2.59, + "eval_wer": 0.25016809547823166, + "step": 33600 + }, + { + "epoch": 5.83, + "eval_loss": Infinity, + "eval_runtime": 544.855, + "eval_samples_per_second": 20.686, + "eval_steps_per_second": 2.586, + "eval_wer": 0.25649268784669693, + "step": 33700 + }, + { + "epoch": 5.85, + "eval_loss": Infinity, + "eval_runtime": 545.0055, + "eval_samples_per_second": 20.681, + "eval_steps_per_second": 2.585, + "eval_wer": 0.2574277189443604, + "step": 33800 + }, + { + "epoch": 5.86, + "eval_loss": Infinity, + "eval_runtime": 544.8939, + "eval_samples_per_second": 20.685, + "eval_steps_per_second": 2.586, + "eval_wer": 0.25730164733568667, + "step": 33900 + }, + { + "epoch": 5.88, + "learning_rate": 0.00018349646294792992, + "loss": 0.1502, + "step": 34000 + }, + { + "epoch": 5.88, + "eval_loss": Infinity, + "eval_runtime": 542.1481, + "eval_samples_per_second": 20.79, + "eval_steps_per_second": 2.599, + "eval_wer": 0.2602433182047403, + "step": 34000 + }, + { + "epoch": 5.9, + "eval_loss": Infinity, + "eval_runtime": 543.1924, + "eval_samples_per_second": 20.75, + "eval_steps_per_second": 2.594, + "eval_wer": 0.24964279710875778, + "step": 34100 + }, + { + "epoch": 5.91, + "eval_loss": Infinity, + "eval_runtime": 544.5365, + "eval_samples_per_second": 20.698, + "eval_steps_per_second": 2.588, + "eval_wer": 0.25418137502101196, + "step": 34200 + }, + { + "epoch": 5.93, + "eval_loss": Infinity, + "eval_runtime": 544.445, + "eval_samples_per_second": 20.702, + "eval_steps_per_second": 2.588, + "eval_wer": 0.24754160363086233, + "step": 34300 + }, + { + "epoch": 5.95, + "eval_loss": Infinity, + "eval_runtime": 541.9528, + "eval_samples_per_second": 20.797, + "eval_steps_per_second": 2.6, + "eval_wer": 0.24889687342410488, + "step": 34400 + }, + { + "epoch": 5.97, + "learning_rate": 0.00018175692914298967, + "loss": 0.1414, + "step": 34500 + }, + { + "epoch": 5.97, + "eval_loss": Infinity, + "eval_runtime": 546.9612, + "eval_samples_per_second": 20.607, + "eval_steps_per_second": 2.576, + "eval_wer": 0.2520381576735586, + "step": 34500 + }, + { + "epoch": 5.98, + "eval_loss": Infinity, + "eval_runtime": 542.4137, + "eval_samples_per_second": 20.779, + "eval_steps_per_second": 2.598, + "eval_wer": 0.248613212304589, + "step": 34600 + }, + { + "epoch": 6.0, + "eval_loss": Infinity, + "eval_runtime": 543.6113, + "eval_samples_per_second": 20.734, + "eval_steps_per_second": 2.592, + "eval_wer": 0.2601592704656245, + "step": 34700 + }, + { + "epoch": 6.02, + "eval_loss": Infinity, + "eval_runtime": 544.1036, + "eval_samples_per_second": 20.715, + "eval_steps_per_second": 2.59, + "eval_wer": 0.2517019667170953, + "step": 34800 + }, + { + "epoch": 6.04, + "eval_loss": Infinity, + "eval_runtime": 544.3655, + "eval_samples_per_second": 20.705, + "eval_steps_per_second": 2.588, + "eval_wer": 0.2563771222054127, + "step": 34900 + }, + { + "epoch": 6.05, + "learning_rate": 0.0001800173953380494, + "loss": 0.1385, + "step": 35000 + }, + { + "epoch": 6.05, + "eval_loss": Infinity, + "eval_runtime": 545.9585, + "eval_samples_per_second": 20.644, + "eval_steps_per_second": 2.581, + "eval_wer": 0.2500840477391158, + "step": 35000 + }, + { + "epoch": 6.07, + "eval_loss": Infinity, + "eval_runtime": 543.5683, + "eval_samples_per_second": 20.735, + "eval_steps_per_second": 2.592, + "eval_wer": 0.24773071104387293, + "step": 35100 + }, + { + "epoch": 6.09, + "eval_loss": Infinity, + "eval_runtime": 543.8849, + "eval_samples_per_second": 20.723, + "eval_steps_per_second": 2.591, + "eval_wer": 0.25002101193477894, + "step": 35200 + }, + { + "epoch": 6.11, + "eval_loss": Infinity, + "eval_runtime": 546.0856, + "eval_samples_per_second": 20.64, + "eval_steps_per_second": 2.58, + "eval_wer": 0.2556627164229282, + "step": 35300 + }, + { + "epoch": 6.12, + "eval_loss": Infinity, + "eval_runtime": 545.6013, + "eval_samples_per_second": 20.658, + "eval_steps_per_second": 2.582, + "eval_wer": 0.25199613380400065, + "step": 35400 + }, + { + "epoch": 6.14, + "learning_rate": 0.000178281340600719, + "loss": 0.1265, + "step": 35500 + }, + { + "epoch": 6.14, + "eval_loss": Infinity, + "eval_runtime": 544.0517, + "eval_samples_per_second": 20.717, + "eval_steps_per_second": 2.59, + "eval_wer": 0.2567658429988233, + "step": 35500 + }, + { + "epoch": 6.16, + "eval_loss": Infinity, + "eval_runtime": 544.4823, + "eval_samples_per_second": 20.7, + "eval_steps_per_second": 2.588, + "eval_wer": 0.24956925533703142, + "step": 35600 + }, + { + "epoch": 6.17, + "eval_loss": Infinity, + "eval_runtime": 544.9002, + "eval_samples_per_second": 20.685, + "eval_steps_per_second": 2.586, + "eval_wer": 0.2563666162380232, + "step": 35700 + }, + { + "epoch": 6.19, + "eval_loss": Infinity, + "eval_runtime": 544.1075, + "eval_samples_per_second": 20.715, + "eval_steps_per_second": 2.59, + "eval_wer": 0.2511871743150109, + "step": 35800 + }, + { + "epoch": 6.21, + "eval_loss": Infinity, + "eval_runtime": 542.1212, + "eval_samples_per_second": 20.791, + "eval_steps_per_second": 2.599, + "eval_wer": 0.2511556564128425, + "step": 35900 + }, + { + "epoch": 6.23, + "learning_rate": 0.0001765418067957787, + "loss": 0.1267, + "step": 36000 + }, + { + "epoch": 6.23, + "eval_loss": Infinity, + "eval_runtime": 542.2556, + "eval_samples_per_second": 20.785, + "eval_steps_per_second": 2.598, + "eval_wer": 0.2540237855101698, + "step": 36000 + }, + { + "epoch": 6.24, + "eval_loss": Infinity, + "eval_runtime": 555.6145, + "eval_samples_per_second": 20.286, + "eval_steps_per_second": 2.536, + "eval_wer": 0.25, + "step": 36100 + }, + { + "epoch": 6.26, + "eval_loss": Infinity, + "eval_runtime": 545.544, + "eval_samples_per_second": 20.66, + "eval_steps_per_second": 2.583, + "eval_wer": 0.25425491679273826, + "step": 36200 + }, + { + "epoch": 6.28, + "eval_loss": Infinity, + "eval_runtime": 544.7624, + "eval_samples_per_second": 20.69, + "eval_steps_per_second": 2.586, + "eval_wer": 0.2606425449655404, + "step": 36300 + }, + { + "epoch": 6.3, + "eval_loss": Infinity, + "eval_runtime": 544.7203, + "eval_samples_per_second": 20.691, + "eval_steps_per_second": 2.587, + "eval_wer": 0.2527630694234325, + "step": 36400 + }, + { + "epoch": 6.31, + "learning_rate": 0.00017480227299083843, + "loss": 0.1271, + "step": 36500 + }, + { + "epoch": 6.31, + "eval_loss": Infinity, + "eval_runtime": 545.2904, + "eval_samples_per_second": 20.67, + "eval_steps_per_second": 2.584, + "eval_wer": 0.2536035468145907, + "step": 36500 + }, + { + "epoch": 6.33, + "eval_loss": Infinity, + "eval_runtime": 545.8896, + "eval_samples_per_second": 20.647, + "eval_steps_per_second": 2.581, + "eval_wer": 0.2473209783156833, + "step": 36600 + }, + { + "epoch": 6.35, + "eval_loss": Infinity, + "eval_runtime": 546.4085, + "eval_samples_per_second": 20.627, + "eval_steps_per_second": 2.579, + "eval_wer": 0.25052529836947385, + "step": 36700 + }, + { + "epoch": 6.36, + "eval_loss": Infinity, + "eval_runtime": 545.4805, + "eval_samples_per_second": 20.663, + "eval_steps_per_second": 2.583, + "eval_wer": 0.25445453017313835, + "step": 36800 + }, + { + "epoch": 6.38, + "eval_loss": Infinity, + "eval_runtime": 545.6649, + "eval_samples_per_second": 20.656, + "eval_steps_per_second": 2.582, + "eval_wer": 0.25120818624978986, + "step": 36900 + }, + { + "epoch": 6.4, + "learning_rate": 0.00017306273918589818, + "loss": 0.1269, + "step": 37000 + }, + { + "epoch": 6.4, + "eval_loss": Infinity, + "eval_runtime": 545.7146, + "eval_samples_per_second": 20.654, + "eval_steps_per_second": 2.582, + "eval_wer": 0.25005252983694737, + "step": 37000 + }, + { + "epoch": 6.42, + "eval_loss": Infinity, + "eval_runtime": 545.1673, + "eval_samples_per_second": 20.674, + "eval_steps_per_second": 2.585, + "eval_wer": 0.24807740796772568, + "step": 37100 + }, + { + "epoch": 6.43, + "eval_loss": Infinity, + "eval_runtime": 544.0697, + "eval_samples_per_second": 20.716, + "eval_steps_per_second": 2.59, + "eval_wer": 0.245156749033451, + "step": 37200 + }, + { + "epoch": 6.45, + "eval_loss": Infinity, + "eval_runtime": 552.8142, + "eval_samples_per_second": 20.388, + "eval_steps_per_second": 2.549, + "eval_wer": 0.2427088586317028, + "step": 37300 + }, + { + "epoch": 6.47, + "eval_loss": Infinity, + "eval_runtime": 579.5521, + "eval_samples_per_second": 19.448, + "eval_steps_per_second": 2.431, + "eval_wer": 0.25326735585812743, + "step": 37400 + }, + { + "epoch": 6.49, + "learning_rate": 0.0001713232053809579, + "loss": 0.1304, + "step": 37500 + }, + { + "epoch": 6.49, + "eval_loss": Infinity, + "eval_runtime": 609.7099, + "eval_samples_per_second": 18.486, + "eval_steps_per_second": 2.311, + "eval_wer": 0.25523197175995965, + "step": 37500 + }, + { + "epoch": 6.5, + "eval_loss": Infinity, + "eval_runtime": 611.8183, + "eval_samples_per_second": 18.422, + "eval_steps_per_second": 2.303, + "eval_wer": 0.2482455034459573, + "step": 37600 + }, + { + "epoch": 6.52, + "eval_loss": Infinity, + "eval_runtime": 609.1706, + "eval_samples_per_second": 18.502, + "eval_steps_per_second": 2.313, + "eval_wer": 0.24762565136997816, + "step": 37700 + }, + { + "epoch": 6.54, + "eval_loss": Infinity, + "eval_runtime": 610.1889, + "eval_samples_per_second": 18.471, + "eval_steps_per_second": 2.309, + "eval_wer": 0.252994200706001, + "step": 37800 + }, + { + "epoch": 6.55, + "eval_loss": Infinity, + "eval_runtime": 608.2683, + "eval_samples_per_second": 18.53, + "eval_steps_per_second": 2.316, + "eval_wer": 0.2427193645990923, + "step": 37900 + }, + { + "epoch": 6.57, + "learning_rate": 0.00016958367157601762, + "loss": 0.1259, + "step": 38000 + }, + { + "epoch": 6.57, + "eval_loss": Infinity, + "eval_runtime": 607.8109, + "eval_samples_per_second": 18.544, + "eval_steps_per_second": 2.318, + "eval_wer": 0.244473861153135, + "step": 38000 + }, + { + "epoch": 6.59, + "eval_loss": Infinity, + "eval_runtime": 611.2735, + "eval_samples_per_second": 18.439, + "eval_steps_per_second": 2.305, + "eval_wer": 0.24523029080517733, + "step": 38100 + }, + { + "epoch": 6.61, + "eval_loss": Infinity, + "eval_runtime": 611.2354, + "eval_samples_per_second": 18.44, + "eval_steps_per_second": 2.305, + "eval_wer": 0.2509560430324424, + "step": 38200 + }, + { + "epoch": 6.62, + "eval_loss": Infinity, + "eval_runtime": 607.3737, + "eval_samples_per_second": 18.557, + "eval_steps_per_second": 2.32, + "eval_wer": 0.24547192805513532, + "step": 38300 + }, + { + "epoch": 6.64, + "eval_loss": Infinity, + "eval_runtime": 557.5444, + "eval_samples_per_second": 20.215, + "eval_steps_per_second": 2.527, + "eval_wer": 0.2478777945873256, + "step": 38400 + }, + { + "epoch": 6.66, + "learning_rate": 0.00016784413777107732, + "loss": 0.1244, + "step": 38500 + }, + { + "epoch": 6.66, + "eval_loss": Infinity, + "eval_runtime": 558.0795, + "eval_samples_per_second": 20.196, + "eval_steps_per_second": 2.525, + "eval_wer": 0.25171247268448477, + "step": 38500 + }, + { + "epoch": 6.68, + "eval_loss": Infinity, + "eval_runtime": 551.4957, + "eval_samples_per_second": 20.437, + "eval_steps_per_second": 2.555, + "eval_wer": 0.25004202386955793, + "step": 38600 + }, + { + "epoch": 6.69, + "eval_loss": Infinity, + "eval_runtime": 547.5154, + "eval_samples_per_second": 20.586, + "eval_steps_per_second": 2.573, + "eval_wer": 0.24217305429483946, + "step": 38700 + }, + { + "epoch": 6.71, + "eval_loss": Infinity, + "eval_runtime": 551.8818, + "eval_samples_per_second": 20.423, + "eval_steps_per_second": 2.553, + "eval_wer": 0.2515548831736426, + "step": 38800 + }, + { + "epoch": 6.73, + "eval_loss": Infinity, + "eval_runtime": 571.7971, + "eval_samples_per_second": 19.712, + "eval_steps_per_second": 2.464, + "eval_wer": 0.24498865355521937, + "step": 38900 + }, + { + "epoch": 6.75, + "learning_rate": 0.00016610460396613707, + "loss": 0.1281, + "step": 39000 + }, + { + "epoch": 6.75, + "eval_loss": Infinity, + "eval_runtime": 559.2146, + "eval_samples_per_second": 20.155, + "eval_steps_per_second": 2.52, + "eval_wer": 0.24629139351151455, + "step": 39000 + }, + { + "epoch": 6.76, + "eval_loss": Infinity, + "eval_runtime": 549.7387, + "eval_samples_per_second": 20.502, + "eval_steps_per_second": 2.563, + "eval_wer": 0.24811943183728358, + "step": 39100 + }, + { + "epoch": 6.78, + "eval_loss": Infinity, + "eval_runtime": 546.7395, + "eval_samples_per_second": 20.615, + "eval_steps_per_second": 2.577, + "eval_wer": 0.24802487813077828, + "step": 39200 + }, + { + "epoch": 6.8, + "eval_loss": Infinity, + "eval_runtime": 556.9541, + "eval_samples_per_second": 20.237, + "eval_steps_per_second": 2.53, + "eval_wer": 0.24601823835938813, + "step": 39300 + }, + { + "epoch": 6.81, + "eval_loss": Infinity, + "eval_runtime": 546.1242, + "eval_samples_per_second": 20.638, + "eval_steps_per_second": 2.58, + "eval_wer": 0.24889687342410488, + "step": 39400 + }, + { + "epoch": 6.83, + "learning_rate": 0.00016436854922880666, + "loss": 0.1287, + "step": 39500 + }, + { + "epoch": 6.83, + "eval_loss": Infinity, + "eval_runtime": 542.5205, + "eval_samples_per_second": 20.775, + "eval_steps_per_second": 2.597, + "eval_wer": 0.24849764666330476, + "step": 39500 + }, + { + "epoch": 6.85, + "eval_loss": Infinity, + "eval_runtime": 542.3359, + "eval_samples_per_second": 20.782, + "eval_steps_per_second": 2.598, + "eval_wer": 0.24547192805513532, + "step": 39600 + }, + { + "epoch": 6.87, + "eval_loss": Infinity, + "eval_runtime": 544.5258, + "eval_samples_per_second": 20.699, + "eval_steps_per_second": 2.588, + "eval_wer": 0.2451042191965036, + "step": 39700 + }, + { + "epoch": 6.88, + "eval_loss": Infinity, + "eval_runtime": 544.0336, + "eval_samples_per_second": 20.717, + "eval_steps_per_second": 2.59, + "eval_wer": 0.2473209783156833, + "step": 39800 + }, + { + "epoch": 6.9, + "eval_loss": Infinity, + "eval_runtime": 551.3211, + "eval_samples_per_second": 20.444, + "eval_steps_per_second": 2.556, + "eval_wer": 0.25002101193477894, + "step": 39900 + }, + { + "epoch": 6.92, + "learning_rate": 0.00016263249449147626, + "loss": 0.1308, + "step": 40000 + }, + { + "epoch": 6.92, + "eval_loss": Infinity, + "eval_runtime": 554.882, + "eval_samples_per_second": 20.312, + "eval_steps_per_second": 2.539, + "eval_wer": 0.2451042191965036, + "step": 40000 + }, + { + "epoch": 6.94, + "eval_loss": Infinity, + "eval_runtime": 542.0787, + "eval_samples_per_second": 20.792, + "eval_steps_per_second": 2.599, + "eval_wer": 0.24064968902336528, + "step": 40100 + }, + { + "epoch": 6.95, + "eval_loss": Infinity, + "eval_runtime": 589.9942, + "eval_samples_per_second": 19.104, + "eval_steps_per_second": 2.388, + "eval_wer": 0.23928391326273324, + "step": 40200 + }, + { + "epoch": 6.97, + "eval_loss": Infinity, + "eval_runtime": 542.3329, + "eval_samples_per_second": 20.782, + "eval_steps_per_second": 2.598, + "eval_wer": 0.24142713061018659, + "step": 40300 + }, + { + "epoch": 6.99, + "eval_loss": Infinity, + "eval_runtime": 543.579, + "eval_samples_per_second": 20.735, + "eval_steps_per_second": 2.592, + "eval_wer": 0.23991427130610188, + "step": 40400 + }, + { + "epoch": 7.0, + "learning_rate": 0.00016089296068653598, + "loss": 0.1189, + "step": 40500 + }, + { + "epoch": 7.0, + "eval_loss": Infinity, + "eval_runtime": 546.472, + "eval_samples_per_second": 20.625, + "eval_steps_per_second": 2.578, + "eval_wer": 0.2381912926542276, + "step": 40500 + }, + { + "epoch": 7.02, + "eval_loss": Infinity, + "eval_runtime": 554.1607, + "eval_samples_per_second": 20.339, + "eval_steps_per_second": 2.543, + "eval_wer": 0.2400298369473861, + "step": 40600 + }, + { + "epoch": 7.04, + "eval_loss": Infinity, + "eval_runtime": 550.4036, + "eval_samples_per_second": 20.478, + "eval_steps_per_second": 2.56, + "eval_wer": 0.24198394688182887, + "step": 40700 + }, + { + "epoch": 7.06, + "eval_loss": Infinity, + "eval_runtime": 544.257, + "eval_samples_per_second": 20.709, + "eval_steps_per_second": 2.589, + "eval_wer": 0.24069171289292318, + "step": 40800 + }, + { + "epoch": 7.07, + "eval_loss": Infinity, + "eval_runtime": 552.2615, + "eval_samples_per_second": 20.409, + "eval_steps_per_second": 2.551, + "eval_wer": 0.24138510674062869, + "step": 40900 + }, + { + "epoch": 7.09, + "learning_rate": 0.0001591534268815957, + "loss": 0.1132, + "step": 41000 + }, + { + "epoch": 7.09, + "eval_loss": Infinity, + "eval_runtime": 544.7913, + "eval_samples_per_second": 20.689, + "eval_steps_per_second": 2.586, + "eval_wer": 0.24250924525130274, + "step": 41000 + }, + { + "epoch": 7.11, + "eval_loss": Infinity, + "eval_runtime": 549.0429, + "eval_samples_per_second": 20.528, + "eval_steps_per_second": 2.566, + "eval_wer": 0.2376870062195327, + "step": 41100 + }, + { + "epoch": 7.13, + "eval_loss": Infinity, + "eval_runtime": 549.5056, + "eval_samples_per_second": 20.511, + "eval_steps_per_second": 2.564, + "eval_wer": 0.23895822827365945, + "step": 41200 + }, + { + "epoch": 7.14, + "eval_loss": Infinity, + "eval_runtime": 551.038, + "eval_samples_per_second": 20.454, + "eval_steps_per_second": 2.557, + "eval_wer": 0.23946251470835433, + "step": 41300 + }, + { + "epoch": 7.16, + "eval_loss": Infinity, + "eval_runtime": 551.6556, + "eval_samples_per_second": 20.431, + "eval_steps_per_second": 2.554, + "eval_wer": 0.24171079172970247, + "step": 41400 + }, + { + "epoch": 7.18, + "learning_rate": 0.00015741389307665545, + "loss": 0.1058, + "step": 41500 + }, + { + "epoch": 7.18, + "eval_loss": Infinity, + "eval_runtime": 551.1685, + "eval_samples_per_second": 20.449, + "eval_steps_per_second": 2.556, + "eval_wer": 0.23923138342578584, + "step": 41500 + }, + { + "epoch": 7.19, + "eval_loss": Infinity, + "eval_runtime": 547.2412, + "eval_samples_per_second": 20.596, + "eval_steps_per_second": 2.575, + "eval_wer": 0.23935745503445957, + "step": 41600 + }, + { + "epoch": 7.21, + "eval_loss": Infinity, + "eval_runtime": 545.7997, + "eval_samples_per_second": 20.65, + "eval_steps_per_second": 2.582, + "eval_wer": 0.23876912086064886, + "step": 41700 + }, + { + "epoch": 7.23, + "eval_loss": Infinity, + "eval_runtime": 544.9052, + "eval_samples_per_second": 20.684, + "eval_steps_per_second": 2.586, + "eval_wer": 0.24115397545806017, + "step": 41800 + }, + { + "epoch": 7.25, + "eval_loss": Infinity, + "eval_runtime": 551.8822, + "eval_samples_per_second": 20.423, + "eval_steps_per_second": 2.553, + "eval_wer": 0.24514624306606153, + "step": 41900 + }, + { + "epoch": 7.26, + "learning_rate": 0.00015567435927171518, + "loss": 0.1038, + "step": 42000 + }, + { + "epoch": 7.26, + "eval_loss": Infinity, + "eval_runtime": 544.2814, + "eval_samples_per_second": 20.708, + "eval_steps_per_second": 2.589, + "eval_wer": 0.24196293494704993, + "step": 42000 + }, + { + "epoch": 7.28, + "eval_loss": Infinity, + "eval_runtime": 546.2453, + "eval_samples_per_second": 20.634, + "eval_steps_per_second": 2.579, + "eval_wer": 0.23996680114304925, + "step": 42100 + }, + { + "epoch": 7.3, + "eval_loss": Infinity, + "eval_runtime": 542.654, + "eval_samples_per_second": 20.77, + "eval_steps_per_second": 2.596, + "eval_wer": 0.24099638594721803, + "step": 42200 + }, + { + "epoch": 7.32, + "eval_loss": Infinity, + "eval_runtime": 545.7874, + "eval_samples_per_second": 20.651, + "eval_steps_per_second": 2.582, + "eval_wer": 0.2377710539586485, + "step": 42300 + }, + { + "epoch": 7.33, + "eval_loss": Infinity, + "eval_runtime": 543.8176, + "eval_samples_per_second": 20.726, + "eval_steps_per_second": 2.591, + "eval_wer": 0.24062867708858632, + "step": 42400 + }, + { + "epoch": 7.35, + "learning_rate": 0.00015393830453438477, + "loss": 0.1084, + "step": 42500 + }, + { + "epoch": 7.35, + "eval_loss": Infinity, + "eval_runtime": 542.352, + "eval_samples_per_second": 20.782, + "eval_steps_per_second": 2.598, + "eval_wer": 0.23573289628508992, + "step": 42500 + }, + { + "epoch": 7.37, + "eval_loss": Infinity, + "eval_runtime": 543.3886, + "eval_samples_per_second": 20.742, + "eval_steps_per_second": 2.593, + "eval_wer": 0.23681501092620608, + "step": 42600 + }, + { + "epoch": 7.38, + "eval_loss": Infinity, + "eval_runtime": 545.4438, + "eval_samples_per_second": 20.664, + "eval_steps_per_second": 2.583, + "eval_wer": 0.23580643805681628, + "step": 42700 + }, + { + "epoch": 7.4, + "eval_loss": Infinity, + "eval_runtime": 545.4721, + "eval_samples_per_second": 20.663, + "eval_steps_per_second": 2.583, + "eval_wer": 0.24020843839300723, + "step": 42800 + }, + { + "epoch": 7.42, + "eval_loss": Infinity, + "eval_runtime": 544.5151, + "eval_samples_per_second": 20.699, + "eval_steps_per_second": 2.588, + "eval_wer": 0.23803370314338546, + "step": 42900 + }, + { + "epoch": 7.44, + "learning_rate": 0.0001521987707294445, + "loss": 0.1094, + "step": 43000 + }, + { + "epoch": 7.44, + "eval_loss": Infinity, + "eval_runtime": 545.5739, + "eval_samples_per_second": 20.659, + "eval_steps_per_second": 2.583, + "eval_wer": 0.23912632375189108, + "step": 43000 + }, + { + "epoch": 7.45, + "eval_loss": Infinity, + "eval_runtime": 546.28, + "eval_samples_per_second": 20.632, + "eval_steps_per_second": 2.579, + "eval_wer": 0.24224659606656582, + "step": 43100 + }, + { + "epoch": 7.47, + "eval_loss": Infinity, + "eval_runtime": 546.7274, + "eval_samples_per_second": 20.615, + "eval_steps_per_second": 2.577, + "eval_wer": 0.23834888216506975, + "step": 43200 + }, + { + "epoch": 7.49, + "eval_loss": Infinity, + "eval_runtime": 546.5993, + "eval_samples_per_second": 20.62, + "eval_steps_per_second": 2.578, + "eval_wer": 0.23654185577407968, + "step": 43300 + }, + { + "epoch": 7.51, + "eval_loss": Infinity, + "eval_runtime": 544.9504, + "eval_samples_per_second": 20.683, + "eval_steps_per_second": 2.586, + "eval_wer": 0.2389372163388805, + "step": 43400 + }, + { + "epoch": 7.52, + "learning_rate": 0.00015045923692450422, + "loss": 0.1088, + "step": 43500 + }, + { + "epoch": 7.52, + "eval_loss": Infinity, + "eval_runtime": 545.8554, + "eval_samples_per_second": 20.648, + "eval_steps_per_second": 2.581, + "eval_wer": 0.2359745335350479, + "step": 43500 + }, + { + "epoch": 7.54, + "eval_loss": Infinity, + "eval_runtime": 546.547, + "eval_samples_per_second": 20.622, + "eval_steps_per_second": 2.578, + "eval_wer": 0.24074424272987058, + "step": 43600 + }, + { + "epoch": 7.56, + "eval_loss": Infinity, + "eval_runtime": 546.4586, + "eval_samples_per_second": 20.626, + "eval_steps_per_second": 2.578, + "eval_wer": 0.23735081526306942, + "step": 43700 + }, + { + "epoch": 7.58, + "eval_loss": Infinity, + "eval_runtime": 545.2466, + "eval_samples_per_second": 20.671, + "eval_steps_per_second": 2.584, + "eval_wer": 0.23444066229618424, + "step": 43800 + }, + { + "epoch": 7.59, + "eval_loss": Infinity, + "eval_runtime": 559.1801, + "eval_samples_per_second": 20.156, + "eval_steps_per_second": 2.52, + "eval_wer": 0.23550176500252143, + "step": 43900 + }, + { + "epoch": 7.61, + "learning_rate": 0.00014871970311956394, + "loss": 0.1082, + "step": 44000 + }, + { + "epoch": 7.61, + "eval_loss": Infinity, + "eval_runtime": 544.6369, + "eval_samples_per_second": 20.695, + "eval_steps_per_second": 2.587, + "eval_wer": 0.23964111615397546, + "step": 44000 + }, + { + "epoch": 7.63, + "eval_loss": Infinity, + "eval_runtime": 546.7779, + "eval_samples_per_second": 20.613, + "eval_steps_per_second": 2.577, + "eval_wer": 0.2347348293830896, + "step": 44100 + }, + { + "epoch": 7.64, + "eval_loss": Infinity, + "eval_runtime": 544.3794, + "eval_samples_per_second": 20.704, + "eval_steps_per_second": 2.588, + "eval_wer": 0.2344091443940158, + "step": 44200 + }, + { + "epoch": 7.66, + "eval_loss": Infinity, + "eval_runtime": 545.2672, + "eval_samples_per_second": 20.671, + "eval_steps_per_second": 2.584, + "eval_wer": 0.2359745335350479, + "step": 44300 + }, + { + "epoch": 7.68, + "eval_loss": Infinity, + "eval_runtime": 546.2821, + "eval_samples_per_second": 20.632, + "eval_steps_per_second": 2.579, + "eval_wer": 0.24059715918641789, + "step": 44400 + }, + { + "epoch": 7.7, + "learning_rate": 0.00014698364838223354, + "loss": 0.1101, + "step": 44500 + }, + { + "epoch": 7.7, + "eval_loss": Infinity, + "eval_runtime": 544.6729, + "eval_samples_per_second": 20.693, + "eval_steps_per_second": 2.587, + "eval_wer": 0.23647881996974282, + "step": 44500 + }, + { + "epoch": 7.71, + "eval_loss": Infinity, + "eval_runtime": 545.37, + "eval_samples_per_second": 20.667, + "eval_steps_per_second": 2.584, + "eval_wer": 0.2358799798285426, + "step": 44600 + }, + { + "epoch": 7.73, + "eval_loss": Infinity, + "eval_runtime": 546.597, + "eval_samples_per_second": 20.62, + "eval_steps_per_second": 2.578, + "eval_wer": 0.24444234325096656, + "step": 44700 + }, + { + "epoch": 7.75, + "eval_loss": Infinity, + "eval_runtime": 547.5764, + "eval_samples_per_second": 20.583, + "eval_steps_per_second": 2.573, + "eval_wer": 0.23757144057824844, + "step": 44800 + }, + { + "epoch": 7.77, + "eval_loss": Infinity, + "eval_runtime": 547.3757, + "eval_samples_per_second": 20.591, + "eval_steps_per_second": 2.574, + "eval_wer": 0.2360270633719953, + "step": 44900 + }, + { + "epoch": 7.78, + "learning_rate": 0.00014524411457729328, + "loss": 0.1114, + "step": 45000 + }, + { + "epoch": 7.78, + "eval_loss": Infinity, + "eval_runtime": 547.5394, + "eval_samples_per_second": 20.585, + "eval_steps_per_second": 2.573, + "eval_wer": 0.23577492015464785, + "step": 45000 + }, + { + "epoch": 7.8, + "eval_loss": Infinity, + "eval_runtime": 547.5618, + "eval_samples_per_second": 20.584, + "eval_steps_per_second": 2.573, + "eval_wer": 0.23652084383930072, + "step": 45100 + }, + { + "epoch": 7.82, + "eval_loss": Infinity, + "eval_runtime": 547.0038, + "eval_samples_per_second": 20.605, + "eval_steps_per_second": 2.576, + "eval_wer": 0.2381072449151118, + "step": 45200 + }, + { + "epoch": 7.83, + "eval_loss": Infinity, + "eval_runtime": 547.295, + "eval_samples_per_second": 20.594, + "eval_steps_per_second": 2.574, + "eval_wer": 0.23496596066565809, + "step": 45300 + }, + { + "epoch": 7.85, + "eval_loss": Infinity, + "eval_runtime": 547.0451, + "eval_samples_per_second": 20.603, + "eval_steps_per_second": 2.576, + "eval_wer": 0.23590099176332158, + "step": 45400 + }, + { + "epoch": 7.87, + "learning_rate": 0.00014350458077235298, + "loss": 0.1133, + "step": 45500 + }, + { + "epoch": 7.87, + "eval_loss": Infinity, + "eval_runtime": 545.0755, + "eval_samples_per_second": 20.678, + "eval_steps_per_second": 2.585, + "eval_wer": 0.23681501092620608, + "step": 45500 + }, + { + "epoch": 7.89, + "eval_loss": Infinity, + "eval_runtime": 546.4556, + "eval_samples_per_second": 20.626, + "eval_steps_per_second": 2.578, + "eval_wer": 0.24080727853420744, + "step": 45600 + }, + { + "epoch": 7.9, + "eval_loss": Infinity, + "eval_runtime": 543.2499, + "eval_samples_per_second": 20.747, + "eval_steps_per_second": 2.594, + "eval_wer": 0.23743486300218525, + "step": 45700 + }, + { + "epoch": 7.92, + "eval_loss": Infinity, + "eval_runtime": 544.8106, + "eval_samples_per_second": 20.688, + "eval_steps_per_second": 2.586, + "eval_wer": 0.23604807530677424, + "step": 45800 + }, + { + "epoch": 7.94, + "eval_loss": Infinity, + "eval_runtime": 543.3851, + "eval_samples_per_second": 20.742, + "eval_steps_per_second": 2.593, + "eval_wer": 0.23178265254664648, + "step": 45900 + }, + { + "epoch": 7.96, + "learning_rate": 0.00014176504696741273, + "loss": 0.1058, + "step": 46000 + }, + { + "epoch": 7.96, + "eval_loss": Infinity, + "eval_runtime": 543.8967, + "eval_samples_per_second": 20.723, + "eval_steps_per_second": 2.591, + "eval_wer": 0.23223440914439403, + "step": 46000 + }, + { + "epoch": 7.97, + "eval_loss": Infinity, + "eval_runtime": 544.0937, + "eval_samples_per_second": 20.715, + "eval_steps_per_second": 2.59, + "eval_wer": 0.23738233316523785, + "step": 46100 + }, + { + "epoch": 7.99, + "eval_loss": Infinity, + "eval_runtime": 544.8297, + "eval_samples_per_second": 20.687, + "eval_steps_per_second": 2.586, + "eval_wer": 0.23216086737266767, + "step": 46200 + }, + { + "epoch": 8.01, + "eval_loss": Infinity, + "eval_runtime": 544.7266, + "eval_samples_per_second": 20.691, + "eval_steps_per_second": 2.587, + "eval_wer": 0.23605858127416374, + "step": 46300 + }, + { + "epoch": 8.02, + "eval_loss": Infinity, + "eval_runtime": 543.6144, + "eval_samples_per_second": 20.733, + "eval_steps_per_second": 2.592, + "eval_wer": 0.2351970919482266, + "step": 46400 + }, + { + "epoch": 8.04, + "learning_rate": 0.00014002551316247245, + "loss": 0.1024, + "step": 46500 + }, + { + "epoch": 8.04, + "eval_loss": Infinity, + "eval_runtime": 544.0783, + "eval_samples_per_second": 20.716, + "eval_steps_per_second": 2.59, + "eval_wer": 0.23300134476382586, + "step": 46500 + }, + { + "epoch": 8.06, + "eval_loss": Infinity, + "eval_runtime": 544.1678, + "eval_samples_per_second": 20.712, + "eval_steps_per_second": 2.589, + "eval_wer": 0.23152000336190956, + "step": 46600 + }, + { + "epoch": 8.08, + "eval_loss": Infinity, + "eval_runtime": 547.7672, + "eval_samples_per_second": 20.576, + "eval_steps_per_second": 2.572, + "eval_wer": 0.23152000336190956, + "step": 46700 + }, + { + "epoch": 8.09, + "eval_loss": Infinity, + "eval_runtime": 545.4647, + "eval_samples_per_second": 20.663, + "eval_steps_per_second": 2.583, + "eval_wer": 0.23452471003530004, + "step": 46800 + }, + { + "epoch": 8.11, + "eval_loss": Infinity, + "eval_runtime": 544.6881, + "eval_samples_per_second": 20.693, + "eval_steps_per_second": 2.587, + "eval_wer": 0.2372247436543957, + "step": 46900 + }, + { + "epoch": 8.13, + "learning_rate": 0.00013828597935753217, + "loss": 0.093, + "step": 47000 + }, + { + "epoch": 8.13, + "eval_loss": Infinity, + "eval_runtime": 542.6307, + "eval_samples_per_second": 20.771, + "eval_steps_per_second": 2.597, + "eval_wer": 0.2356173306438057, + "step": 47000 + }, + { + "epoch": 8.15, + "eval_loss": Infinity, + "eval_runtime": 544.7932, + "eval_samples_per_second": 20.689, + "eval_steps_per_second": 2.586, + "eval_wer": 0.2337577744158682, + "step": 47100 + }, + { + "epoch": 8.16, + "eval_loss": Infinity, + "eval_runtime": 545.3612, + "eval_samples_per_second": 20.667, + "eval_steps_per_second": 2.584, + "eval_wer": 0.23032232307950917, + "step": 47200 + }, + { + "epoch": 8.18, + "eval_loss": Infinity, + "eval_runtime": 544.9025, + "eval_samples_per_second": 20.684, + "eval_steps_per_second": 2.586, + "eval_wer": 0.23370524457892083, + "step": 47300 + }, + { + "epoch": 8.2, + "eval_loss": Infinity, + "eval_runtime": 542.8145, + "eval_samples_per_second": 20.764, + "eval_steps_per_second": 2.596, + "eval_wer": 0.23327449991595225, + "step": 47400 + }, + { + "epoch": 8.22, + "learning_rate": 0.0001365464455525919, + "loss": 0.0907, + "step": 47500 + }, + { + "epoch": 8.22, + "eval_loss": Infinity, + "eval_runtime": 543.608, + "eval_samples_per_second": 20.734, + "eval_steps_per_second": 2.592, + "eval_wer": 0.23349512523113128, + "step": 47500 + }, + { + "epoch": 8.23, + "eval_loss": Infinity, + "eval_runtime": 544.4985, + "eval_samples_per_second": 20.7, + "eval_steps_per_second": 2.588, + "eval_wer": 0.2339048579593209, + "step": 47600 + }, + { + "epoch": 8.25, + "eval_loss": Infinity, + "eval_runtime": 557.8672, + "eval_samples_per_second": 20.204, + "eval_steps_per_second": 2.526, + "eval_wer": 0.23124684820978317, + "step": 47700 + }, + { + "epoch": 8.27, + "eval_loss": Infinity, + "eval_runtime": 545.0667, + "eval_samples_per_second": 20.678, + "eval_steps_per_second": 2.585, + "eval_wer": 0.23343208942679441, + "step": 47800 + }, + { + "epoch": 8.28, + "eval_loss": Infinity, + "eval_runtime": 544.2596, + "eval_samples_per_second": 20.709, + "eval_steps_per_second": 2.589, + "eval_wer": 0.2310787527315515, + "step": 47900 + }, + { + "epoch": 8.3, + "learning_rate": 0.0001348103908152615, + "loss": 0.0909, + "step": 48000 + }, + { + "epoch": 8.3, + "eval_loss": Infinity, + "eval_runtime": 542.9121, + "eval_samples_per_second": 20.76, + "eval_steps_per_second": 2.595, + "eval_wer": 0.23346360732896285, + "step": 48000 + }, + { + "epoch": 8.32, + "eval_loss": Infinity, + "eval_runtime": 545.1225, + "eval_samples_per_second": 20.676, + "eval_steps_per_second": 2.585, + "eval_wer": 0.23476634728525803, + "step": 48100 + }, + { + "epoch": 8.34, + "eval_loss": Infinity, + "eval_runtime": 543.7866, + "eval_samples_per_second": 20.727, + "eval_steps_per_second": 2.591, + "eval_wer": 0.22904059505799293, + "step": 48200 + }, + { + "epoch": 8.35, + "eval_loss": Infinity, + "eval_runtime": 544.9739, + "eval_samples_per_second": 20.682, + "eval_steps_per_second": 2.585, + "eval_wer": 0.23550176500252143, + "step": 48300 + }, + { + "epoch": 8.37, + "eval_loss": Infinity, + "eval_runtime": 557.5362, + "eval_samples_per_second": 20.216, + "eval_steps_per_second": 2.527, + "eval_wer": 0.2322869389813414, + "step": 48400 + }, + { + "epoch": 8.39, + "learning_rate": 0.00013307085701032124, + "loss": 0.0956, + "step": 48500 + }, + { + "epoch": 8.39, + "eval_loss": Infinity, + "eval_runtime": 542.6037, + "eval_samples_per_second": 20.772, + "eval_steps_per_second": 2.597, + "eval_wer": 0.22925071440578249, + "step": 48500 + }, + { + "epoch": 8.41, + "eval_loss": Infinity, + "eval_runtime": 554.9667, + "eval_samples_per_second": 20.309, + "eval_steps_per_second": 2.539, + "eval_wer": 0.22897755925365607, + "step": 48600 + }, + { + "epoch": 8.42, + "eval_loss": Infinity, + "eval_runtime": 545.2076, + "eval_samples_per_second": 20.673, + "eval_steps_per_second": 2.584, + "eval_wer": 0.22791645654731887, + "step": 48700 + }, + { + "epoch": 8.44, + "eval_loss": Infinity, + "eval_runtime": 545.724, + "eval_samples_per_second": 20.653, + "eval_steps_per_second": 2.582, + "eval_wer": 0.2311312825684989, + "step": 48800 + }, + { + "epoch": 8.46, + "eval_loss": Infinity, + "eval_runtime": 545.671, + "eval_samples_per_second": 20.655, + "eval_steps_per_second": 2.582, + "eval_wer": 0.23051143049251976, + "step": 48900 + }, + { + "epoch": 8.47, + "learning_rate": 0.00013133132320538094, + "loss": 0.0923, + "step": 49000 + }, + { + "epoch": 8.47, + "eval_loss": Infinity, + "eval_runtime": 553.4158, + "eval_samples_per_second": 20.366, + "eval_steps_per_second": 2.546, + "eval_wer": 0.2332114641116154, + "step": 49000 + }, + { + "epoch": 8.49, + "eval_loss": Infinity, + "eval_runtime": 547.8596, + "eval_samples_per_second": 20.573, + "eval_steps_per_second": 2.572, + "eval_wer": 0.2293347621448983, + "step": 49100 + }, + { + "epoch": 8.51, + "eval_loss": Infinity, + "eval_runtime": 546.9612, + "eval_samples_per_second": 20.607, + "eval_steps_per_second": 2.576, + "eval_wer": 0.2290090771558245, + "step": 49200 + }, + { + "epoch": 8.53, + "eval_loss": Infinity, + "eval_runtime": 545.7413, + "eval_samples_per_second": 20.653, + "eval_steps_per_second": 2.582, + "eval_wer": 0.23329551185073122, + "step": 49300 + }, + { + "epoch": 8.54, + "eval_loss": Infinity, + "eval_runtime": 547.3327, + "eval_samples_per_second": 20.593, + "eval_steps_per_second": 2.574, + "eval_wer": 0.23098419902504622, + "step": 49400 + }, + { + "epoch": 8.56, + "learning_rate": 0.00012959178940044069, + "loss": 0.0922, + "step": 49500 + }, + { + "epoch": 8.56, + "eval_loss": Infinity, + "eval_runtime": 549.3327, + "eval_samples_per_second": 20.518, + "eval_steps_per_second": 2.565, + "eval_wer": 0.2294293158514036, + "step": 49500 + }, + { + "epoch": 8.58, + "eval_loss": Infinity, + "eval_runtime": 547.2867, + "eval_samples_per_second": 20.594, + "eval_steps_per_second": 2.575, + "eval_wer": 0.22784291477559254, + "step": 49600 + }, + { + "epoch": 8.6, + "eval_loss": Infinity, + "eval_runtime": 545.8501, + "eval_samples_per_second": 20.649, + "eval_steps_per_second": 2.581, + "eval_wer": 0.23023827534039334, + "step": 49700 + }, + { + "epoch": 8.61, + "eval_loss": Infinity, + "eval_runtime": 553.5261, + "eval_samples_per_second": 20.362, + "eval_steps_per_second": 2.545, + "eval_wer": 0.23106824676416204, + "step": 49800 + }, + { + "epoch": 8.63, + "eval_loss": Infinity, + "eval_runtime": 544.8885, + "eval_samples_per_second": 20.685, + "eval_steps_per_second": 2.586, + "eval_wer": 0.22471213649352834, + "step": 49900 + }, + { + "epoch": 8.65, + "learning_rate": 0.00012785225559550038, + "loss": 0.0922, + "step": 50000 + }, + { + "epoch": 8.65, + "eval_loss": Infinity, + "eval_runtime": 544.5289, + "eval_samples_per_second": 20.699, + "eval_steps_per_second": 2.588, + "eval_wer": 0.22955538746007734, + "step": 50000 + }, + { + "epoch": 8.66, + "eval_loss": Infinity, + "eval_runtime": 546.894, + "eval_samples_per_second": 20.609, + "eval_steps_per_second": 2.576, + "eval_wer": 0.23000714405782485, + "step": 50100 + }, + { + "epoch": 8.68, + "eval_loss": Infinity, + "eval_runtime": 545.6073, + "eval_samples_per_second": 20.658, + "eval_steps_per_second": 2.582, + "eval_wer": 0.2265191628845184, + "step": 50200 + }, + { + "epoch": 8.7, + "eval_loss": Infinity, + "eval_runtime": 545.5673, + "eval_samples_per_second": 20.659, + "eval_steps_per_second": 2.583, + "eval_wer": 0.22610943015632878, + "step": 50300 + }, + { + "epoch": 8.72, + "eval_loss": Infinity, + "eval_runtime": 548.0111, + "eval_samples_per_second": 20.567, + "eval_steps_per_second": 2.571, + "eval_wer": 0.22705496722138174, + "step": 50400 + }, + { + "epoch": 8.73, + "learning_rate": 0.00012611272179056013, + "loss": 0.0963, + "step": 50500 + }, + { + "epoch": 8.73, + "eval_loss": Infinity, + "eval_runtime": 545.7263, + "eval_samples_per_second": 20.653, + "eval_steps_per_second": 2.582, + "eval_wer": 0.2270759791561607, + "step": 50500 + }, + { + "epoch": 8.75, + "eval_loss": Infinity, + "eval_runtime": 545.0461, + "eval_samples_per_second": 20.679, + "eval_steps_per_second": 2.585, + "eval_wer": 0.22822112960161373, + "step": 50600 + }, + { + "epoch": 8.77, + "eval_loss": Infinity, + "eval_runtime": 544.416, + "eval_samples_per_second": 20.703, + "eval_steps_per_second": 2.588, + "eval_wer": 0.2308581274163725, + "step": 50700 + }, + { + "epoch": 8.79, + "eval_loss": Infinity, + "eval_runtime": 544.2614, + "eval_samples_per_second": 20.709, + "eval_steps_per_second": 2.589, + "eval_wer": 0.22995461422087746, + "step": 50800 + }, + { + "epoch": 8.8, + "eval_loss": Infinity, + "eval_runtime": 544.7154, + "eval_samples_per_second": 20.692, + "eval_steps_per_second": 2.587, + "eval_wer": 0.23181417044881492, + "step": 50900 + }, + { + "epoch": 8.82, + "learning_rate": 0.00012437318798561982, + "loss": 0.0922, + "step": 51000 + }, + { + "epoch": 8.82, + "eval_loss": Infinity, + "eval_runtime": 556.1696, + "eval_samples_per_second": 20.265, + "eval_steps_per_second": 2.533, + "eval_wer": 0.23071104387291982, + "step": 51000 + }, + { + "epoch": 8.84, + "eval_loss": Infinity, + "eval_runtime": 548.0972, + "eval_samples_per_second": 20.564, + "eval_steps_per_second": 2.571, + "eval_wer": 0.22771684316691881, + "step": 51100 + }, + { + "epoch": 8.86, + "eval_loss": Infinity, + "eval_runtime": 548.2781, + "eval_samples_per_second": 20.557, + "eval_steps_per_second": 2.57, + "eval_wer": 0.23090015128593042, + "step": 51200 + }, + { + "epoch": 8.87, + "eval_loss": Infinity, + "eval_runtime": 546.0918, + "eval_samples_per_second": 20.639, + "eval_steps_per_second": 2.58, + "eval_wer": 0.22607791225416035, + "step": 51300 + }, + { + "epoch": 8.89, + "eval_loss": Infinity, + "eval_runtime": 547.4138, + "eval_samples_per_second": 20.59, + "eval_steps_per_second": 2.574, + "eval_wer": 0.22970247100353, + "step": 51400 + }, + { + "epoch": 8.91, + "learning_rate": 0.00012264061231589932, + "loss": 0.0959, + "step": 51500 + }, + { + "epoch": 8.91, + "eval_loss": Infinity, + "eval_runtime": 547.932, + "eval_samples_per_second": 20.57, + "eval_steps_per_second": 2.571, + "eval_wer": 0.22756975962346612, + "step": 51500 + }, + { + "epoch": 8.92, + "eval_loss": Infinity, + "eval_runtime": 549.2316, + "eval_samples_per_second": 20.521, + "eval_steps_per_second": 2.565, + "eval_wer": 0.2244915111783493, + "step": 51600 + }, + { + "epoch": 8.94, + "eval_loss": Infinity, + "eval_runtime": 546.2517, + "eval_samples_per_second": 20.633, + "eval_steps_per_second": 2.579, + "eval_wer": 0.22511136325432846, + "step": 51700 + }, + { + "epoch": 8.96, + "eval_loss": Infinity, + "eval_runtime": 547.2468, + "eval_samples_per_second": 20.596, + "eval_steps_per_second": 2.575, + "eval_wer": 0.2243549336022861, + "step": 51800 + }, + { + "epoch": 8.98, + "eval_loss": Infinity, + "eval_runtime": 545.227, + "eval_samples_per_second": 20.672, + "eval_steps_per_second": 2.584, + "eval_wer": 0.2264351151454026, + "step": 51900 + }, + { + "epoch": 8.99, + "learning_rate": 0.00012090107851095906, + "loss": 0.0936, + "step": 52000 + }, + { + "epoch": 8.99, + "eval_loss": Infinity, + "eval_runtime": 548.1848, + "eval_samples_per_second": 20.561, + "eval_steps_per_second": 2.57, + "eval_wer": 0.22675029416708692, + "step": 52000 + }, + { + "epoch": 9.01, + "eval_loss": Infinity, + "eval_runtime": 546.0278, + "eval_samples_per_second": 20.642, + "eval_steps_per_second": 2.58, + "eval_wer": 0.2266137165910237, + "step": 52100 + }, + { + "epoch": 9.03, + "eval_loss": Infinity, + "eval_runtime": 545.9251, + "eval_samples_per_second": 20.646, + "eval_steps_per_second": 2.581, + "eval_wer": 0.22677130610186585, + "step": 52200 + }, + { + "epoch": 9.05, + "eval_loss": Infinity, + "eval_runtime": 544.7867, + "eval_samples_per_second": 20.689, + "eval_steps_per_second": 2.586, + "eval_wer": 0.2291036308623298, + "step": 52300 + }, + { + "epoch": 9.06, + "eval_loss": Infinity, + "eval_runtime": 543.6097, + "eval_samples_per_second": 20.734, + "eval_steps_per_second": 2.592, + "eval_wer": 0.22948184568835098, + "step": 52400 + }, + { + "epoch": 9.08, + "learning_rate": 0.00011916154470601877, + "loss": 0.0829, + "step": 52500 + }, + { + "epoch": 9.08, + "eval_loss": Infinity, + "eval_runtime": 545.0074, + "eval_samples_per_second": 20.68, + "eval_steps_per_second": 2.585, + "eval_wer": 0.2251849050260548, + "step": 52500 + }, + { + "epoch": 9.1, + "eval_loss": Infinity, + "eval_runtime": 543.7151, + "eval_samples_per_second": 20.73, + "eval_steps_per_second": 2.591, + "eval_wer": 0.22575222726508656, + "step": 52600 + }, + { + "epoch": 9.11, + "eval_loss": Infinity, + "eval_runtime": 544.2283, + "eval_samples_per_second": 20.71, + "eval_steps_per_second": 2.589, + "eval_wer": 0.2293767860144562, + "step": 52700 + }, + { + "epoch": 9.13, + "eval_loss": Infinity, + "eval_runtime": 545.1003, + "eval_samples_per_second": 20.677, + "eval_steps_per_second": 2.585, + "eval_wer": 0.22807404605816103, + "step": 52800 + }, + { + "epoch": 9.15, + "eval_loss": Infinity, + "eval_runtime": 546.4159, + "eval_samples_per_second": 20.627, + "eval_steps_per_second": 2.579, + "eval_wer": 0.2287359220036981, + "step": 52900 + }, + { + "epoch": 9.17, + "learning_rate": 0.0001174220109010785, + "loss": 0.0759, + "step": 53000 + }, + { + "epoch": 9.17, + "eval_loss": Infinity, + "eval_runtime": 546.0093, + "eval_samples_per_second": 20.643, + "eval_steps_per_second": 2.581, + "eval_wer": 0.22631954950411834, + "step": 53000 + }, + { + "epoch": 9.18, + "eval_loss": Infinity, + "eval_runtime": 553.224, + "eval_samples_per_second": 20.373, + "eval_steps_per_second": 2.547, + "eval_wer": 0.2282736594385611, + "step": 53100 + }, + { + "epoch": 9.2, + "eval_loss": Infinity, + "eval_runtime": 549.148, + "eval_samples_per_second": 20.525, + "eval_steps_per_second": 2.566, + "eval_wer": 0.22410279038493863, + "step": 53200 + }, + { + "epoch": 9.22, + "eval_loss": Infinity, + "eval_runtime": 545.6751, + "eval_samples_per_second": 20.655, + "eval_steps_per_second": 2.582, + "eval_wer": 0.22418683812405446, + "step": 53300 + }, + { + "epoch": 9.24, + "eval_loss": Infinity, + "eval_runtime": 549.3438, + "eval_samples_per_second": 20.517, + "eval_steps_per_second": 2.565, + "eval_wer": 0.224859220036981, + "step": 53400 + }, + { + "epoch": 9.25, + "learning_rate": 0.0001156859561637481, + "loss": 0.0775, + "step": 53500 + }, + { + "epoch": 9.25, + "eval_loss": Infinity, + "eval_runtime": 580.7095, + "eval_samples_per_second": 19.409, + "eval_steps_per_second": 2.426, + "eval_wer": 0.22645612708018154, + "step": 53500 + }, + { + "epoch": 9.27, + "eval_loss": Infinity, + "eval_runtime": 580.879, + "eval_samples_per_second": 19.403, + "eval_steps_per_second": 2.426, + "eval_wer": 0.22520591696083375, + "step": 53600 + }, + { + "epoch": 9.29, + "eval_loss": Infinity, + "eval_runtime": 548.8124, + "eval_samples_per_second": 20.537, + "eval_steps_per_second": 2.567, + "eval_wer": 0.22562615565641284, + "step": 53700 + }, + { + "epoch": 9.3, + "eval_loss": Infinity, + "eval_runtime": 578.538, + "eval_samples_per_second": 19.482, + "eval_steps_per_second": 2.435, + "eval_wer": 0.22503782148260212, + "step": 53800 + }, + { + "epoch": 9.32, + "eval_loss": Infinity, + "eval_runtime": 578.8587, + "eval_samples_per_second": 19.471, + "eval_steps_per_second": 2.434, + "eval_wer": 0.2237981173306438, + "step": 53900 + }, + { + "epoch": 9.34, + "learning_rate": 0.00011394642235880784, + "loss": 0.0763, + "step": 54000 + }, + { + "epoch": 9.34, + "eval_loss": Infinity, + "eval_runtime": 547.6879, + "eval_samples_per_second": 20.579, + "eval_steps_per_second": 2.573, + "eval_wer": 0.223251807026391, + "step": 54000 + }, + { + "epoch": 9.36, + "eval_loss": Infinity, + "eval_runtime": 576.5045, + "eval_samples_per_second": 19.551, + "eval_steps_per_second": 2.444, + "eval_wer": 0.22266347285258026, + "step": 54100 + }, + { + "epoch": 9.37, + "eval_loss": Infinity, + "eval_runtime": 579.2016, + "eval_samples_per_second": 19.46, + "eval_steps_per_second": 2.433, + "eval_wer": 0.22562615565641284, + "step": 54200 + }, + { + "epoch": 9.39, + "eval_loss": Infinity, + "eval_runtime": 546.2896, + "eval_samples_per_second": 20.632, + "eval_steps_per_second": 2.579, + "eval_wer": 0.2248171961674231, + "step": 54300 + }, + { + "epoch": 9.41, + "eval_loss": Infinity, + "eval_runtime": 576.9166, + "eval_samples_per_second": 19.537, + "eval_steps_per_second": 2.442, + "eval_wer": 0.22520591696083375, + "step": 54400 + }, + { + "epoch": 9.43, + "learning_rate": 0.00011220688855386754, + "loss": 0.0736, + "step": 54500 + }, + { + "epoch": 9.43, + "eval_loss": Infinity, + "eval_runtime": 552.0198, + "eval_samples_per_second": 20.418, + "eval_steps_per_second": 2.552, + "eval_wer": 0.2253635064716759, + "step": 54500 + }, + { + "epoch": 9.44, + "eval_loss": Infinity, + "eval_runtime": 589.0127, + "eval_samples_per_second": 19.135, + "eval_steps_per_second": 2.392, + "eval_wer": 0.2293767860144562, + "step": 54600 + }, + { + "epoch": 9.46, + "eval_loss": Infinity, + "eval_runtime": 599.9148, + "eval_samples_per_second": 18.788, + "eval_steps_per_second": 2.349, + "eval_wer": 0.2285468145906875, + "step": 54700 + }, + { + "epoch": 9.48, + "eval_loss": Infinity, + "eval_runtime": 584.9159, + "eval_samples_per_second": 19.269, + "eval_steps_per_second": 2.409, + "eval_wer": 0.22438645150445452, + "step": 54800 + }, + { + "epoch": 9.49, + "eval_loss": Infinity, + "eval_runtime": 579.4563, + "eval_samples_per_second": 19.451, + "eval_steps_per_second": 2.432, + "eval_wer": 0.2259728525802656, + "step": 54900 + }, + { + "epoch": 9.51, + "learning_rate": 0.00011046735474892728, + "loss": 0.0787, + "step": 55000 + }, + { + "epoch": 9.51, + "eval_loss": Infinity, + "eval_runtime": 580.0188, + "eval_samples_per_second": 19.432, + "eval_steps_per_second": 2.429, + "eval_wer": 0.22143427466801144, + "step": 55000 + }, + { + "epoch": 9.53, + "eval_loss": Infinity, + "eval_runtime": 592.0777, + "eval_samples_per_second": 19.036, + "eval_steps_per_second": 2.38, + "eval_wer": 0.22351445621112792, + "step": 55100 + }, + { + "epoch": 9.55, + "eval_loss": Infinity, + "eval_runtime": 576.7489, + "eval_samples_per_second": 19.542, + "eval_steps_per_second": 2.443, + "eval_wer": 0.22336737266767523, + "step": 55200 + }, + { + "epoch": 9.56, + "eval_loss": Infinity, + "eval_runtime": 579.5329, + "eval_samples_per_second": 19.448, + "eval_steps_per_second": 2.431, + "eval_wer": 0.22437594553706505, + "step": 55300 + }, + { + "epoch": 9.58, + "eval_loss": Infinity, + "eval_runtime": 578.7168, + "eval_samples_per_second": 19.476, + "eval_steps_per_second": 2.435, + "eval_wer": 0.22677130610186585, + "step": 55400 + }, + { + "epoch": 9.6, + "learning_rate": 0.00010872782094398702, + "loss": 0.078, + "step": 55500 + }, + { + "epoch": 9.6, + "eval_loss": Infinity, + "eval_runtime": 592.5376, + "eval_samples_per_second": 19.022, + "eval_steps_per_second": 2.378, + "eval_wer": 0.22233778786350647, + "step": 55500 + }, + { + "epoch": 9.62, + "eval_loss": Infinity, + "eval_runtime": 579.5326, + "eval_samples_per_second": 19.448, + "eval_steps_per_second": 2.431, + "eval_wer": 0.22266347285258026, + "step": 55600 + }, + { + "epoch": 9.63, + "eval_loss": Infinity, + "eval_runtime": 578.7638, + "eval_samples_per_second": 19.474, + "eval_steps_per_second": 2.434, + "eval_wer": 0.22395570684148597, + "step": 55700 + }, + { + "epoch": 9.65, + "eval_loss": Infinity, + "eval_runtime": 554.6371, + "eval_samples_per_second": 20.321, + "eval_steps_per_second": 2.54, + "eval_wer": 0.22456505295007564, + "step": 55800 + }, + { + "epoch": 9.67, + "eval_loss": Infinity, + "eval_runtime": 545.7119, + "eval_samples_per_second": 20.654, + "eval_steps_per_second": 2.582, + "eval_wer": 0.2248697260043705, + "step": 55900 + }, + { + "epoch": 9.69, + "learning_rate": 0.00010698828713904672, + "loss": 0.0784, + "step": 56000 + }, + { + "epoch": 9.69, + "eval_loss": Infinity, + "eval_runtime": 545.3578, + "eval_samples_per_second": 20.667, + "eval_steps_per_second": 2.584, + "eval_wer": 0.2238926710371491, + "step": 56000 + }, + { + "epoch": 9.7, + "eval_loss": Infinity, + "eval_runtime": 546.7066, + "eval_samples_per_second": 20.616, + "eval_steps_per_second": 2.577, + "eval_wer": 0.2213502269288956, + "step": 56100 + }, + { + "epoch": 9.72, + "eval_loss": Infinity, + "eval_runtime": 545.4792, + "eval_samples_per_second": 20.663, + "eval_steps_per_second": 2.583, + "eval_wer": 0.22418683812405446, + "step": 56200 + }, + { + "epoch": 9.74, + "eval_loss": Infinity, + "eval_runtime": 546.6115, + "eval_samples_per_second": 20.62, + "eval_steps_per_second": 2.578, + "eval_wer": 0.2221381744831064, + "step": 56300 + }, + { + "epoch": 9.75, + "eval_loss": Infinity, + "eval_runtime": 549.1114, + "eval_samples_per_second": 20.526, + "eval_steps_per_second": 2.566, + "eval_wer": 0.2241238023197176, + "step": 56400 + }, + { + "epoch": 9.77, + "learning_rate": 0.00010524875333410646, + "loss": 0.0771, + "step": 56500 + }, + { + "epoch": 9.77, + "eval_loss": Infinity, + "eval_runtime": 545.5876, + "eval_samples_per_second": 20.658, + "eval_steps_per_second": 2.583, + "eval_wer": 0.2237981173306438, + "step": 56500 + }, + { + "epoch": 9.79, + "eval_loss": Infinity, + "eval_runtime": 543.6977, + "eval_samples_per_second": 20.73, + "eval_steps_per_second": 2.592, + "eval_wer": 0.22221171625483274, + "step": 56600 + }, + { + "epoch": 9.81, + "eval_loss": Infinity, + "eval_runtime": 543.8359, + "eval_samples_per_second": 20.725, + "eval_steps_per_second": 2.591, + "eval_wer": 0.2245755589174651, + "step": 56700 + }, + { + "epoch": 9.82, + "eval_loss": Infinity, + "eval_runtime": 543.7056, + "eval_samples_per_second": 20.73, + "eval_steps_per_second": 2.591, + "eval_wer": 0.2232413010590015, + "step": 56800 + }, + { + "epoch": 9.84, + "eval_loss": Infinity, + "eval_runtime": 543.9681, + "eval_samples_per_second": 20.72, + "eval_steps_per_second": 2.59, + "eval_wer": 0.22365103378719112, + "step": 56900 + }, + { + "epoch": 9.86, + "learning_rate": 0.00010350921952916617, + "loss": 0.076, + "step": 57000 + }, + { + "epoch": 9.86, + "eval_loss": Infinity, + "eval_runtime": 544.4231, + "eval_samples_per_second": 20.703, + "eval_steps_per_second": 2.588, + "eval_wer": 0.22464910068919147, + "step": 57000 + }, + { + "epoch": 9.88, + "eval_loss": Infinity, + "eval_runtime": 544.6818, + "eval_samples_per_second": 20.693, + "eval_steps_per_second": 2.587, + "eval_wer": 0.22017355858127416, + "step": 57100 + }, + { + "epoch": 9.89, + "eval_loss": Infinity, + "eval_runtime": 547.1699, + "eval_samples_per_second": 20.599, + "eval_steps_per_second": 2.575, + "eval_wer": 0.2221801983526643, + "step": 57200 + }, + { + "epoch": 9.91, + "eval_loss": Infinity, + "eval_runtime": 546.1115, + "eval_samples_per_second": 20.639, + "eval_steps_per_second": 2.58, + "eval_wer": 0.2243549336022861, + "step": 57300 + }, + { + "epoch": 9.93, + "eval_loss": Infinity, + "eval_runtime": 545.2721, + "eval_samples_per_second": 20.67, + "eval_steps_per_second": 2.584, + "eval_wer": 0.22443898134140192, + "step": 57400 + }, + { + "epoch": 9.94, + "learning_rate": 0.00010177316479183579, + "loss": 0.0777, + "step": 57500 + }, + { + "epoch": 9.94, + "eval_loss": Infinity, + "eval_runtime": 545.5824, + "eval_samples_per_second": 20.659, + "eval_steps_per_second": 2.583, + "eval_wer": 0.2209930240376534, + "step": 57500 + }, + { + "epoch": 9.96, + "eval_loss": Infinity, + "eval_runtime": 546.1798, + "eval_samples_per_second": 20.636, + "eval_steps_per_second": 2.58, + "eval_wer": 0.218166918809884, + "step": 57600 + }, + { + "epoch": 9.98, + "eval_loss": Infinity, + "eval_runtime": 550.3082, + "eval_samples_per_second": 20.481, + "eval_steps_per_second": 2.56, + "eval_wer": 0.2208039166246428, + "step": 57700 + }, + { + "epoch": 10.0, + "eval_loss": Infinity, + "eval_runtime": 548.1847, + "eval_samples_per_second": 20.561, + "eval_steps_per_second": 2.57, + "eval_wer": 0.2210350479072113, + "step": 57800 + }, + { + "epoch": 10.01, + "eval_loss": Infinity, + "eval_runtime": 546.4203, + "eval_samples_per_second": 20.627, + "eval_steps_per_second": 2.579, + "eval_wer": 0.22032064212472685, + "step": 57900 + }, + { + "epoch": 10.03, + "learning_rate": 0.0001000336309868955, + "loss": 0.0745, + "step": 58000 + }, + { + "epoch": 10.03, + "eval_loss": Infinity, + "eval_runtime": 545.6515, + "eval_samples_per_second": 20.656, + "eval_steps_per_second": 2.582, + "eval_wer": 0.22211716254832745, + "step": 58000 + }, + { + "epoch": 10.05, + "eval_loss": Infinity, + "eval_runtime": 547.4513, + "eval_samples_per_second": 20.588, + "eval_steps_per_second": 2.574, + "eval_wer": 0.22035216002689528, + "step": 58100 + }, + { + "epoch": 10.07, + "eval_loss": Infinity, + "eval_runtime": 548.349, + "eval_samples_per_second": 20.554, + "eval_steps_per_second": 2.57, + "eval_wer": 0.22224323415700117, + "step": 58200 + }, + { + "epoch": 10.08, + "eval_loss": Infinity, + "eval_runtime": 548.8654, + "eval_samples_per_second": 20.535, + "eval_steps_per_second": 2.567, + "eval_wer": 0.21902840813582114, + "step": 58300 + }, + { + "epoch": 10.1, + "eval_loss": Infinity, + "eval_runtime": 578.3959, + "eval_samples_per_second": 19.487, + "eval_steps_per_second": 2.436, + "eval_wer": 0.22157085224407463, + "step": 58400 + }, + { + "epoch": 10.12, + "learning_rate": 9.829409718195524e-05, + "loss": 0.0656, + "step": 58500 + }, + { + "epoch": 10.12, + "eval_loss": Infinity, + "eval_runtime": 574.8445, + "eval_samples_per_second": 19.607, + "eval_steps_per_second": 2.451, + "eval_wer": 0.2210875777441587, + "step": 58500 + }, + { + "epoch": 10.13, + "eval_loss": Infinity, + "eval_runtime": 548.4437, + "eval_samples_per_second": 20.551, + "eval_steps_per_second": 2.569, + "eval_wer": 0.22125567322239031, + "step": 58600 + }, + { + "epoch": 10.15, + "eval_loss": Infinity, + "eval_runtime": 546.1949, + "eval_samples_per_second": 20.635, + "eval_steps_per_second": 2.58, + "eval_wer": 0.22302067574382248, + "step": 58700 + }, + { + "epoch": 10.17, + "eval_loss": Infinity, + "eval_runtime": 544.4777, + "eval_samples_per_second": 20.701, + "eval_steps_per_second": 2.588, + "eval_wer": 0.22341990250462263, + "step": 58800 + }, + { + "epoch": 10.19, + "eval_loss": Infinity, + "eval_runtime": 545.4451, + "eval_samples_per_second": 20.664, + "eval_steps_per_second": 2.583, + "eval_wer": 0.22386115313498067, + "step": 58900 + }, + { + "epoch": 10.2, + "learning_rate": 9.655456337701495e-05, + "loss": 0.0688, + "step": 59000 + }, + { + "epoch": 10.2, + "eval_loss": Infinity, + "eval_runtime": 548.1142, + "eval_samples_per_second": 20.563, + "eval_steps_per_second": 2.571, + "eval_wer": 0.22226424609178014, + "step": 59000 + }, + { + "epoch": 10.22, + "eval_loss": Infinity, + "eval_runtime": 547.69, + "eval_samples_per_second": 20.579, + "eval_steps_per_second": 2.573, + "eval_wer": 0.217484030929568, + "step": 59100 + }, + { + "epoch": 10.24, + "eval_loss": Infinity, + "eval_runtime": 546.4205, + "eval_samples_per_second": 20.627, + "eval_steps_per_second": 2.579, + "eval_wer": 0.21911245587493697, + "step": 59200 + }, + { + "epoch": 10.26, + "eval_loss": Infinity, + "eval_runtime": 547.1932, + "eval_samples_per_second": 20.598, + "eval_steps_per_second": 2.575, + "eval_wer": 0.2226004370482434, + "step": 59300 + }, + { + "epoch": 10.27, + "eval_loss": Infinity, + "eval_runtime": 546.9117, + "eval_samples_per_second": 20.608, + "eval_steps_per_second": 2.576, + "eval_wer": 0.21787275172297865, + "step": 59400 + }, + { + "epoch": 10.29, + "learning_rate": 9.481502957207468e-05, + "loss": 0.0633, + "step": 59500 + }, + { + "epoch": 10.29, + "eval_loss": Infinity, + "eval_runtime": 548.8254, + "eval_samples_per_second": 20.537, + "eval_steps_per_second": 2.567, + "eval_wer": 0.2196902840813582, + "step": 59500 + }, + { + "epoch": 10.31, + "eval_loss": Infinity, + "eval_runtime": 546.9648, + "eval_samples_per_second": 20.606, + "eval_steps_per_second": 2.576, + "eval_wer": 0.22122415532022188, + "step": 59600 + }, + { + "epoch": 10.33, + "eval_loss": Infinity, + "eval_runtime": 545.9902, + "eval_samples_per_second": 20.643, + "eval_steps_per_second": 2.581, + "eval_wer": 0.21917549167927383, + "step": 59700 + }, + { + "epoch": 10.34, + "eval_loss": Infinity, + "eval_runtime": 546.727, + "eval_samples_per_second": 20.615, + "eval_steps_per_second": 2.577, + "eval_wer": 0.21952218860312658, + "step": 59800 + }, + { + "epoch": 10.36, + "eval_loss": Infinity, + "eval_runtime": 547.09, + "eval_samples_per_second": 20.602, + "eval_steps_per_second": 2.575, + "eval_wer": 0.21751554883173643, + "step": 59900 + }, + { + "epoch": 10.38, + "learning_rate": 9.307549576713439e-05, + "loss": 0.0646, + "step": 60000 + }, + { + "epoch": 10.38, + "eval_loss": Infinity, + "eval_runtime": 547.783, + "eval_samples_per_second": 20.576, + "eval_steps_per_second": 2.572, + "eval_wer": 0.21554042696251471, + "step": 60000 + }, + { + "epoch": 10.39, + "eval_loss": Infinity, + "eval_runtime": 552.4006, + "eval_samples_per_second": 20.404, + "eval_steps_per_second": 2.551, + "eval_wer": 0.21595015969070433, + "step": 60100 + }, + { + "epoch": 10.41, + "eval_loss": Infinity, + "eval_runtime": 546.4271, + "eval_samples_per_second": 20.627, + "eval_steps_per_second": 2.579, + "eval_wer": 0.21806185913598924, + "step": 60200 + }, + { + "epoch": 10.43, + "eval_loss": Infinity, + "eval_runtime": 545.6537, + "eval_samples_per_second": 20.656, + "eval_steps_per_second": 2.582, + "eval_wer": 0.21958522440746345, + "step": 60300 + }, + { + "epoch": 10.45, + "eval_loss": Infinity, + "eval_runtime": 546.0782, + "eval_samples_per_second": 20.64, + "eval_steps_per_second": 2.58, + "eval_wer": 0.22041519583123215, + "step": 60400 + }, + { + "epoch": 10.46, + "learning_rate": 9.133596196219412e-05, + "loss": 0.0617, + "step": 60500 + }, + { + "epoch": 10.46, + "eval_loss": Infinity, + "eval_runtime": 549.3529, + "eval_samples_per_second": 20.517, + "eval_steps_per_second": 2.565, + "eval_wer": 0.21913346780971593, + "step": 60500 + }, + { + "epoch": 10.48, + "eval_loss": Infinity, + "eval_runtime": 548.3, + "eval_samples_per_second": 20.556, + "eval_steps_per_second": 2.57, + "eval_wer": 0.22019457051605312, + "step": 60600 + }, + { + "epoch": 10.5, + "eval_loss": Infinity, + "eval_runtime": 547.5552, + "eval_samples_per_second": 20.584, + "eval_steps_per_second": 2.573, + "eval_wer": 0.22350395024373845, + "step": 60700 + }, + { + "epoch": 10.52, + "eval_loss": Infinity, + "eval_runtime": 546.6552, + "eval_samples_per_second": 20.618, + "eval_steps_per_second": 2.577, + "eval_wer": 0.2166540595057993, + "step": 60800 + }, + { + "epoch": 10.53, + "eval_loss": Infinity, + "eval_runtime": 559.9166, + "eval_samples_per_second": 20.13, + "eval_steps_per_second": 2.516, + "eval_wer": 0.2203416540595058, + "step": 60900 + }, + { + "epoch": 10.55, + "learning_rate": 8.959642815725385e-05, + "loss": 0.0662, + "step": 61000 + }, + { + "epoch": 10.55, + "eval_loss": Infinity, + "eval_runtime": 549.9016, + "eval_samples_per_second": 20.496, + "eval_steps_per_second": 2.562, + "eval_wer": 0.21820894267944194, + "step": 61000 + }, + { + "epoch": 10.57, + "eval_loss": Infinity, + "eval_runtime": 549.326, + "eval_samples_per_second": 20.518, + "eval_steps_per_second": 2.565, + "eval_wer": 0.21708480416876785, + "step": 61100 + }, + { + "epoch": 10.58, + "eval_loss": Infinity, + "eval_runtime": 550.9593, + "eval_samples_per_second": 20.457, + "eval_steps_per_second": 2.557, + "eval_wer": 0.2189968902336527, + "step": 61200 + }, + { + "epoch": 10.6, + "eval_loss": Infinity, + "eval_runtime": 548.4716, + "eval_samples_per_second": 20.55, + "eval_steps_per_second": 2.569, + "eval_wer": 0.22214868045049588, + "step": 61300 + }, + { + "epoch": 10.62, + "eval_loss": Infinity, + "eval_runtime": 549.5474, + "eval_samples_per_second": 20.51, + "eval_steps_per_second": 2.564, + "eval_wer": 0.22244284753740123, + "step": 61400 + }, + { + "epoch": 10.64, + "learning_rate": 8.785689435231357e-05, + "loss": 0.0656, + "step": 61500 + }, + { + "epoch": 10.64, + "eval_loss": Infinity, + "eval_runtime": 549.7646, + "eval_samples_per_second": 20.502, + "eval_steps_per_second": 2.563, + "eval_wer": 0.22150781643973777, + "step": 61500 + }, + { + "epoch": 10.65, + "eval_loss": Infinity, + "eval_runtime": 551.0007, + "eval_samples_per_second": 20.456, + "eval_steps_per_second": 2.557, + "eval_wer": 0.21958522440746345, + "step": 61600 + }, + { + "epoch": 10.67, + "eval_loss": Infinity, + "eval_runtime": 551.2483, + "eval_samples_per_second": 20.446, + "eval_steps_per_second": 2.556, + "eval_wer": 0.2200684989073794, + "step": 61700 + }, + { + "epoch": 10.69, + "eval_loss": Infinity, + "eval_runtime": 549.7815, + "eval_samples_per_second": 20.501, + "eval_steps_per_second": 2.563, + "eval_wer": 0.21851361573373676, + "step": 61800 + }, + { + "epoch": 10.71, + "eval_loss": Infinity, + "eval_runtime": 553.4559, + "eval_samples_per_second": 20.365, + "eval_steps_per_second": 2.546, + "eval_wer": 0.2173789712556732, + "step": 61900 + }, + { + "epoch": 10.72, + "learning_rate": 8.612083961498317e-05, + "loss": 0.0636, + "step": 62000 + }, + { + "epoch": 10.72, + "eval_loss": Infinity, + "eval_runtime": 547.7095, + "eval_samples_per_second": 20.578, + "eval_steps_per_second": 2.573, + "eval_wer": 0.21892334846192638, + "step": 62000 + }, + { + "epoch": 10.74, + "eval_loss": Infinity, + "eval_runtime": 547.6345, + "eval_samples_per_second": 20.581, + "eval_steps_per_second": 2.573, + "eval_wer": 0.2205202555051269, + "step": 62100 + }, + { + "epoch": 10.76, + "eval_loss": Infinity, + "eval_runtime": 546.4002, + "eval_samples_per_second": 20.628, + "eval_steps_per_second": 2.579, + "eval_wer": 0.22041519583123215, + "step": 62200 + }, + { + "epoch": 10.77, + "eval_loss": Infinity, + "eval_runtime": 547.84, + "eval_samples_per_second": 20.574, + "eval_steps_per_second": 2.572, + "eval_wer": 0.22165489998319046, + "step": 62300 + }, + { + "epoch": 10.79, + "eval_loss": Infinity, + "eval_runtime": 551.3251, + "eval_samples_per_second": 20.443, + "eval_steps_per_second": 2.556, + "eval_wer": 0.21917549167927383, + "step": 62400 + }, + { + "epoch": 10.81, + "learning_rate": 8.438826394526265e-05, + "loss": 0.0626, + "step": 62500 + }, + { + "epoch": 10.81, + "eval_loss": Infinity, + "eval_runtime": 553.1486, + "eval_samples_per_second": 20.376, + "eval_steps_per_second": 2.547, + "eval_wer": 0.21754706673390486, + "step": 62500 + }, + { + "epoch": 10.83, + "eval_loss": Infinity, + "eval_runtime": 551.2466, + "eval_samples_per_second": 20.446, + "eval_steps_per_second": 2.556, + "eval_wer": 0.2192385274836107, + "step": 62600 + }, + { + "epoch": 10.84, + "eval_loss": Infinity, + "eval_runtime": 545.0806, + "eval_samples_per_second": 20.678, + "eval_steps_per_second": 2.585, + "eval_wer": 0.21865019330979996, + "step": 62700 + }, + { + "epoch": 10.86, + "eval_loss": Infinity, + "eval_runtime": 545.5781, + "eval_samples_per_second": 20.659, + "eval_steps_per_second": 2.583, + "eval_wer": 0.21712682803832578, + "step": 62800 + }, + { + "epoch": 10.88, + "eval_loss": Infinity, + "eval_runtime": 546.2445, + "eval_samples_per_second": 20.634, + "eval_steps_per_second": 2.579, + "eval_wer": 0.2154563792233989, + "step": 62900 + }, + { + "epoch": 10.9, + "learning_rate": 8.264873014032239e-05, + "loss": 0.0641, + "step": 63000 + }, + { + "epoch": 10.9, + "eval_loss": Infinity, + "eval_runtime": 546.3019, + "eval_samples_per_second": 20.631, + "eval_steps_per_second": 2.579, + "eval_wer": 0.21682215498403093, + "step": 63000 + }, + { + "epoch": 10.91, + "eval_loss": Infinity, + "eval_runtime": 546.5842, + "eval_samples_per_second": 20.621, + "eval_steps_per_second": 2.578, + "eval_wer": 0.2183140023533367, + "step": 63100 + }, + { + "epoch": 10.93, + "eval_loss": Infinity, + "eval_runtime": 547.5037, + "eval_samples_per_second": 20.586, + "eval_steps_per_second": 2.573, + "eval_wer": 0.2177151622121365, + "step": 63200 + }, + { + "epoch": 10.95, + "eval_loss": Infinity, + "eval_runtime": 546.2904, + "eval_samples_per_second": 20.632, + "eval_steps_per_second": 2.579, + "eval_wer": 0.2180303412338208, + "step": 63300 + }, + { + "epoch": 10.97, + "eval_loss": Infinity, + "eval_runtime": 546.5707, + "eval_samples_per_second": 20.621, + "eval_steps_per_second": 2.578, + "eval_wer": 0.21799882333165238, + "step": 63400 + }, + { + "epoch": 10.98, + "learning_rate": 8.090919633538211e-05, + "loss": 0.064, + "step": 63500 + }, + { + "epoch": 10.98, + "eval_loss": Infinity, + "eval_runtime": 544.7426, + "eval_samples_per_second": 20.691, + "eval_steps_per_second": 2.587, + "eval_wer": 0.2185871575054631, + "step": 63500 + }, + { + "epoch": 11.0, + "eval_loss": Infinity, + "eval_runtime": 551.0764, + "eval_samples_per_second": 20.453, + "eval_steps_per_second": 2.557, + "eval_wer": 0.21916498571188436, + "step": 63600 + }, + { + "epoch": 11.02, + "eval_loss": Infinity, + "eval_runtime": 548.7516, + "eval_samples_per_second": 20.539, + "eval_steps_per_second": 2.568, + "eval_wer": 0.2194171289292318, + "step": 63700 + }, + { + "epoch": 11.03, + "eval_loss": Infinity, + "eval_runtime": 551.4195, + "eval_samples_per_second": 20.44, + "eval_steps_per_second": 2.555, + "eval_wer": 0.21774668011430492, + "step": 63800 + }, + { + "epoch": 11.05, + "eval_loss": Infinity, + "eval_runtime": 552.4039, + "eval_samples_per_second": 20.404, + "eval_steps_per_second": 2.551, + "eval_wer": 0.21732644141872584, + "step": 63900 + }, + { + "epoch": 11.07, + "learning_rate": 7.916966253044183e-05, + "loss": 0.0571, + "step": 64000 + }, + { + "epoch": 11.07, + "eval_loss": Infinity, + "eval_runtime": 552.3428, + "eval_samples_per_second": 20.406, + "eval_steps_per_second": 2.551, + "eval_wer": 0.21994242729870567, + "step": 64000 + }, + { + "epoch": 11.09, + "eval_loss": Infinity, + "eval_runtime": 550.7081, + "eval_samples_per_second": 20.466, + "eval_steps_per_second": 2.559, + "eval_wer": 0.2176626323751891, + "step": 64100 + }, + { + "epoch": 11.1, + "eval_loss": Infinity, + "eval_runtime": 549.2417, + "eval_samples_per_second": 20.521, + "eval_steps_per_second": 2.565, + "eval_wer": 0.21783072785342075, + "step": 64200 + }, + { + "epoch": 11.12, + "eval_loss": Infinity, + "eval_runtime": 553.1807, + "eval_samples_per_second": 20.375, + "eval_steps_per_second": 2.547, + "eval_wer": 0.21962724827702135, + "step": 64300 + }, + { + "epoch": 11.14, + "eval_loss": Infinity, + "eval_runtime": 548.6438, + "eval_samples_per_second": 20.543, + "eval_steps_per_second": 2.568, + "eval_wer": 0.21541435535384099, + "step": 64400 + }, + { + "epoch": 11.16, + "learning_rate": 7.743012872550157e-05, + "loss": 0.0536, + "step": 64500 + }, + { + "epoch": 11.16, + "eval_loss": Infinity, + "eval_runtime": 551.8385, + "eval_samples_per_second": 20.424, + "eval_steps_per_second": 2.553, + "eval_wer": 0.21403807362581947, + "step": 64500 + }, + { + "epoch": 11.17, + "eval_loss": Infinity, + "eval_runtime": 551.8565, + "eval_samples_per_second": 20.424, + "eval_steps_per_second": 2.553, + "eval_wer": 0.21514120020171457, + "step": 64600 + }, + { + "epoch": 11.19, + "eval_loss": Infinity, + "eval_runtime": 551.0728, + "eval_samples_per_second": 20.453, + "eval_steps_per_second": 2.557, + "eval_wer": 0.21558245083207261, + "step": 64700 + }, + { + "epoch": 11.21, + "eval_loss": Infinity, + "eval_runtime": 550.1479, + "eval_samples_per_second": 20.487, + "eval_steps_per_second": 2.561, + "eval_wer": 0.21810388300554714, + "step": 64800 + }, + { + "epoch": 11.22, + "eval_loss": Infinity, + "eval_runtime": 556.5349, + "eval_samples_per_second": 20.252, + "eval_steps_per_second": 2.532, + "eval_wer": 0.2173369473861153, + "step": 64900 + }, + { + "epoch": 11.24, + "learning_rate": 7.569059492056128e-05, + "loss": 0.0544, + "step": 65000 + }, + { + "epoch": 11.24, + "eval_loss": Infinity, + "eval_runtime": 554.5243, + "eval_samples_per_second": 20.326, + "eval_steps_per_second": 2.541, + "eval_wer": 0.21618129097327282, + "step": 65000 + }, + { + "epoch": 11.26, + "eval_loss": Infinity, + "eval_runtime": 553.3737, + "eval_samples_per_second": 20.368, + "eval_steps_per_second": 2.546, + "eval_wer": 0.2145738779626828, + "step": 65100 + }, + { + "epoch": 11.28, + "eval_loss": Infinity, + "eval_runtime": 553.6751, + "eval_samples_per_second": 20.357, + "eval_steps_per_second": 2.545, + "eval_wer": 0.22014204067910573, + "step": 65200 + }, + { + "epoch": 11.29, + "eval_loss": Infinity, + "eval_runtime": 548.8824, + "eval_samples_per_second": 20.534, + "eval_steps_per_second": 2.567, + "eval_wer": 0.21588712388636747, + "step": 65300 + }, + { + "epoch": 11.31, + "eval_loss": Infinity, + "eval_runtime": 554.3172, + "eval_samples_per_second": 20.333, + "eval_steps_per_second": 2.542, + "eval_wer": 0.2159081358211464, + "step": 65400 + }, + { + "epoch": 11.33, + "learning_rate": 7.395454018323089e-05, + "loss": 0.0546, + "step": 65500 + }, + { + "epoch": 11.33, + "eval_loss": Infinity, + "eval_runtime": 548.0012, + "eval_samples_per_second": 20.567, + "eval_steps_per_second": 2.571, + "eval_wer": 0.21578206421247267, + "step": 65500 + }, + { + "epoch": 11.35, + "eval_loss": Infinity, + "eval_runtime": 546.2415, + "eval_samples_per_second": 20.634, + "eval_steps_per_second": 2.579, + "eval_wer": 0.21603420742982013, + "step": 65600 + }, + { + "epoch": 11.36, + "eval_loss": Infinity, + "eval_runtime": 549.3565, + "eval_samples_per_second": 20.517, + "eval_steps_per_second": 2.565, + "eval_wer": 0.21724239367961, + "step": 65700 + }, + { + "epoch": 11.38, + "eval_loss": Infinity, + "eval_runtime": 547.895, + "eval_samples_per_second": 20.571, + "eval_steps_per_second": 2.572, + "eval_wer": 0.21695873256009413, + "step": 65800 + }, + { + "epoch": 11.4, + "eval_loss": Infinity, + "eval_runtime": 549.1149, + "eval_samples_per_second": 20.526, + "eval_steps_per_second": 2.566, + "eval_wer": 0.216097243234157, + "step": 65900 + }, + { + "epoch": 11.41, + "learning_rate": 7.221500637829061e-05, + "loss": 0.0545, + "step": 66000 + }, + { + "epoch": 11.41, + "eval_loss": Infinity, + "eval_runtime": 557.4232, + "eval_samples_per_second": 20.22, + "eval_steps_per_second": 2.528, + "eval_wer": 0.21853462766851572, + "step": 66000 + }, + { + "epoch": 11.43, + "eval_loss": Infinity, + "eval_runtime": 551.3783, + "eval_samples_per_second": 20.442, + "eval_steps_per_second": 2.555, + "eval_wer": 0.2169377206253152, + "step": 66100 + }, + { + "epoch": 11.45, + "eval_loss": Infinity, + "eval_runtime": 548.1583, + "eval_samples_per_second": 20.562, + "eval_steps_per_second": 2.57, + "eval_wer": 0.21663304757102034, + "step": 66200 + }, + { + "epoch": 11.47, + "eval_loss": Infinity, + "eval_runtime": 549.1862, + "eval_samples_per_second": 20.523, + "eval_steps_per_second": 2.566, + "eval_wer": 0.21433224071272483, + "step": 66300 + }, + { + "epoch": 11.48, + "eval_loss": Infinity, + "eval_runtime": 547.0477, + "eval_samples_per_second": 20.603, + "eval_steps_per_second": 2.576, + "eval_wer": 0.2137964363758615, + "step": 66400 + }, + { + "epoch": 11.5, + "learning_rate": 7.047547257335033e-05, + "loss": 0.0539, + "step": 66500 + }, + { + "epoch": 11.5, + "eval_loss": Infinity, + "eval_runtime": 545.649, + "eval_samples_per_second": 20.656, + "eval_steps_per_second": 2.582, + "eval_wer": 0.21467893763657758, + "step": 66500 + }, + { + "epoch": 11.52, + "eval_loss": Infinity, + "eval_runtime": 545.0721, + "eval_samples_per_second": 20.678, + "eval_steps_per_second": 2.585, + "eval_wer": 0.2143532526475038, + "step": 66600 + }, + { + "epoch": 11.54, + "eval_loss": Infinity, + "eval_runtime": 546.699, + "eval_samples_per_second": 20.616, + "eval_steps_per_second": 2.577, + "eval_wer": 0.21421667507144057, + "step": 66700 + }, + { + "epoch": 11.55, + "eval_loss": Infinity, + "eval_runtime": 547.5775, + "eval_samples_per_second": 20.583, + "eval_steps_per_second": 2.573, + "eval_wer": 0.2140590855605984, + "step": 66800 + }, + { + "epoch": 11.57, + "eval_loss": Infinity, + "eval_runtime": 546.57, + "eval_samples_per_second": 20.621, + "eval_steps_per_second": 2.578, + "eval_wer": 0.2135547991259035, + "step": 66900 + }, + { + "epoch": 11.59, + "learning_rate": 6.873593876841007e-05, + "loss": 0.0545, + "step": 67000 + }, + { + "epoch": 11.59, + "eval_loss": Infinity, + "eval_runtime": 546.0529, + "eval_samples_per_second": 20.641, + "eval_steps_per_second": 2.58, + "eval_wer": 0.21575054631030424, + "step": 67000 + }, + { + "epoch": 11.6, + "eval_loss": Infinity, + "eval_runtime": 546.2996, + "eval_samples_per_second": 20.632, + "eval_steps_per_second": 2.579, + "eval_wer": 0.21779920995125232, + "step": 67100 + }, + { + "epoch": 11.62, + "eval_loss": Infinity, + "eval_runtime": 546.7915, + "eval_samples_per_second": 20.613, + "eval_steps_per_second": 2.577, + "eval_wer": 0.21658051773407294, + "step": 67200 + }, + { + "epoch": 11.64, + "eval_loss": Infinity, + "eval_runtime": 545.549, + "eval_samples_per_second": 20.66, + "eval_steps_per_second": 2.583, + "eval_wer": 0.21400655572365104, + "step": 67300 + }, + { + "epoch": 11.66, + "eval_loss": Infinity, + "eval_runtime": 546.7529, + "eval_samples_per_second": 20.614, + "eval_steps_per_second": 2.577, + "eval_wer": 0.21427971087577743, + "step": 67400 + }, + { + "epoch": 11.67, + "learning_rate": 6.699640496346979e-05, + "loss": 0.0538, + "step": 67500 + }, + { + "epoch": 11.67, + "eval_loss": Infinity, + "eval_runtime": 548.0068, + "eval_samples_per_second": 20.567, + "eval_steps_per_second": 2.571, + "eval_wer": 0.21409060346276684, + "step": 67500 + }, + { + "epoch": 11.69, + "eval_loss": Infinity, + "eval_runtime": 545.7442, + "eval_samples_per_second": 20.653, + "eval_steps_per_second": 2.582, + "eval_wer": 0.21662254160363087, + "step": 67600 + }, + { + "epoch": 11.71, + "eval_loss": Infinity, + "eval_runtime": 548.6181, + "eval_samples_per_second": 20.544, + "eval_steps_per_second": 2.568, + "eval_wer": 0.21437426458228273, + "step": 67700 + }, + { + "epoch": 11.73, + "eval_loss": Infinity, + "eval_runtime": 544.7509, + "eval_samples_per_second": 20.69, + "eval_steps_per_second": 2.587, + "eval_wer": 0.21205244578920826, + "step": 67800 + }, + { + "epoch": 11.74, + "eval_loss": Infinity, + "eval_runtime": 545.7434, + "eval_samples_per_second": 20.653, + "eval_steps_per_second": 2.582, + "eval_wer": 0.21325012607160868, + "step": 67900 + }, + { + "epoch": 11.76, + "learning_rate": 6.525687115852951e-05, + "loss": 0.0529, + "step": 68000 + }, + { + "epoch": 11.76, + "eval_loss": Infinity, + "eval_runtime": 545.6556, + "eval_samples_per_second": 20.656, + "eval_steps_per_second": 2.582, + "eval_wer": 0.2136073289628509, + "step": 68000 + }, + { + "epoch": 11.78, + "eval_loss": Infinity, + "eval_runtime": 545.981, + "eval_samples_per_second": 20.644, + "eval_steps_per_second": 2.581, + "eval_wer": 0.21634938645150445, + "step": 68100 + }, + { + "epoch": 11.8, + "eval_loss": Infinity, + "eval_runtime": 544.2745, + "eval_samples_per_second": 20.708, + "eval_steps_per_second": 2.589, + "eval_wer": 0.21389099008236678, + "step": 68200 + }, + { + "epoch": 11.81, + "eval_loss": Infinity, + "eval_runtime": 544.5409, + "eval_samples_per_second": 20.698, + "eval_steps_per_second": 2.588, + "eval_wer": 0.21302950075642965, + "step": 68300 + }, + { + "epoch": 11.83, + "eval_loss": Infinity, + "eval_runtime": 546.1049, + "eval_samples_per_second": 20.639, + "eval_steps_per_second": 2.58, + "eval_wer": 0.21082324760463944, + "step": 68400 + }, + { + "epoch": 11.85, + "learning_rate": 6.351733735358923e-05, + "loss": 0.0528, + "step": 68500 + }, + { + "epoch": 11.85, + "eval_loss": Infinity, + "eval_runtime": 546.5201, + "eval_samples_per_second": 20.623, + "eval_steps_per_second": 2.578, + "eval_wer": 0.2115691712892923, + "step": 68500 + }, + { + "epoch": 11.86, + "eval_loss": Infinity, + "eval_runtime": 546.1767, + "eval_samples_per_second": 20.636, + "eval_steps_per_second": 2.58, + "eval_wer": 0.21026643133299713, + "step": 68600 + }, + { + "epoch": 11.88, + "eval_loss": Infinity, + "eval_runtime": 548.1438, + "eval_samples_per_second": 20.562, + "eval_steps_per_second": 2.57, + "eval_wer": 0.21120146243066062, + "step": 68700 + }, + { + "epoch": 11.9, + "eval_loss": Infinity, + "eval_runtime": 545.8375, + "eval_samples_per_second": 20.649, + "eval_steps_per_second": 2.581, + "eval_wer": 0.212399142713061, + "step": 68800 + }, + { + "epoch": 11.92, + "eval_loss": Infinity, + "eval_runtime": 559.1437, + "eval_samples_per_second": 20.158, + "eval_steps_per_second": 2.52, + "eval_wer": 0.21138006387628172, + "step": 68900 + }, + { + "epoch": 11.93, + "learning_rate": 6.177780354864895e-05, + "loss": 0.0523, + "step": 69000 + }, + { + "epoch": 11.93, + "eval_loss": Infinity, + "eval_runtime": 547.1977, + "eval_samples_per_second": 20.598, + "eval_steps_per_second": 2.575, + "eval_wer": 0.21378593040847202, + "step": 69000 + }, + { + "epoch": 11.95, + "eval_loss": Infinity, + "eval_runtime": 546.6331, + "eval_samples_per_second": 20.619, + "eval_steps_per_second": 2.578, + "eval_wer": 0.2135232812237351, + "step": 69100 + }, + { + "epoch": 11.97, + "eval_loss": Infinity, + "eval_runtime": 546.1655, + "eval_samples_per_second": 20.637, + "eval_steps_per_second": 2.58, + "eval_wer": 0.21153765338712388, + "step": 69200 + }, + { + "epoch": 11.99, + "eval_loss": Infinity, + "eval_runtime": 546.7795, + "eval_samples_per_second": 20.613, + "eval_steps_per_second": 2.577, + "eval_wer": 0.21012985375693394, + "step": 69300 + }, + { + "epoch": 12.0, + "eval_loss": Infinity, + "eval_runtime": 546.9894, + "eval_samples_per_second": 20.606, + "eval_steps_per_second": 2.576, + "eval_wer": 0.21049756261556565, + "step": 69400 + }, + { + "epoch": 12.02, + "learning_rate": 6.003826974370868e-05, + "loss": 0.052, + "step": 69500 + }, + { + "epoch": 12.02, + "eval_loss": Infinity, + "eval_runtime": 546.4107, + "eval_samples_per_second": 20.627, + "eval_steps_per_second": 2.579, + "eval_wer": 0.21161119515885024, + "step": 69500 + }, + { + "epoch": 12.04, + "eval_loss": Infinity, + "eval_runtime": 547.49, + "eval_samples_per_second": 20.587, + "eval_steps_per_second": 2.574, + "eval_wer": 0.21267229786518743, + "step": 69600 + }, + { + "epoch": 12.05, + "eval_loss": Infinity, + "eval_runtime": 549.2968, + "eval_samples_per_second": 20.519, + "eval_steps_per_second": 2.565, + "eval_wer": 0.21150613548495545, + "step": 69700 + }, + { + "epoch": 12.07, + "eval_loss": Infinity, + "eval_runtime": 550.0198, + "eval_samples_per_second": 20.492, + "eval_steps_per_second": 2.562, + "eval_wer": 0.20942595394183897, + "step": 69800 + }, + { + "epoch": 12.09, + "eval_loss": Infinity, + "eval_runtime": 549.2856, + "eval_samples_per_second": 20.519, + "eval_steps_per_second": 2.565, + "eval_wer": 0.21057110438729199, + "step": 69900 + }, + { + "epoch": 12.11, + "learning_rate": 5.830569407398817e-05, + "loss": 0.0499, + "step": 70000 + }, + { + "epoch": 12.11, + "eval_loss": Infinity, + "eval_runtime": 547.589, + "eval_samples_per_second": 20.583, + "eval_steps_per_second": 2.573, + "eval_wer": 0.2110753908219869, + "step": 70000 + }, + { + "epoch": 12.12, + "eval_loss": Infinity, + "eval_runtime": 548.5834, + "eval_samples_per_second": 20.546, + "eval_steps_per_second": 2.568, + "eval_wer": 0.21128551016977642, + "step": 70100 + }, + { + "epoch": 12.14, + "eval_loss": Infinity, + "eval_runtime": 547.8589, + "eval_samples_per_second": 20.573, + "eval_steps_per_second": 2.572, + "eval_wer": 0.21247268448478737, + "step": 70200 + }, + { + "epoch": 12.16, + "eval_loss": Infinity, + "eval_runtime": 547.6862, + "eval_samples_per_second": 20.579, + "eval_steps_per_second": 2.573, + "eval_wer": 0.21007732391998654, + "step": 70300 + }, + { + "epoch": 12.18, + "eval_loss": Infinity, + "eval_runtime": 548.8788, + "eval_samples_per_second": 20.535, + "eval_steps_per_second": 2.567, + "eval_wer": 0.21147461758278702, + "step": 70400 + }, + { + "epoch": 12.19, + "learning_rate": 5.656616026904789e-05, + "loss": 0.0466, + "step": 70500 + }, + { + "epoch": 12.19, + "eval_loss": Infinity, + "eval_runtime": 547.2229, + "eval_samples_per_second": 20.597, + "eval_steps_per_second": 2.575, + "eval_wer": 0.2119053622457556, + "step": 70500 + }, + { + "epoch": 12.21, + "eval_loss": Infinity, + "eval_runtime": 545.9416, + "eval_samples_per_second": 20.645, + "eval_steps_per_second": 2.581, + "eval_wer": 0.21017187762649184, + "step": 70600 + }, + { + "epoch": 12.23, + "eval_loss": Infinity, + "eval_runtime": 546.221, + "eval_samples_per_second": 20.635, + "eval_steps_per_second": 2.58, + "eval_wer": 0.21210497562615566, + "step": 70700 + }, + { + "epoch": 12.24, + "eval_loss": Infinity, + "eval_runtime": 546.0324, + "eval_samples_per_second": 20.642, + "eval_steps_per_second": 2.58, + "eval_wer": 0.20912128088754411, + "step": 70800 + }, + { + "epoch": 12.26, + "eval_loss": Infinity, + "eval_runtime": 550.3946, + "eval_samples_per_second": 20.478, + "eval_steps_per_second": 2.56, + "eval_wer": 0.20918431669188098, + "step": 70900 + }, + { + "epoch": 12.28, + "learning_rate": 5.482662646410761e-05, + "loss": 0.0475, + "step": 71000 + }, + { + "epoch": 12.28, + "eval_loss": Infinity, + "eval_runtime": 550.7521, + "eval_samples_per_second": 20.465, + "eval_steps_per_second": 2.558, + "eval_wer": 0.21018238359388133, + "step": 71000 + }, + { + "epoch": 12.3, + "eval_loss": Infinity, + "eval_runtime": 549.8286, + "eval_samples_per_second": 20.499, + "eval_steps_per_second": 2.563, + "eval_wer": 0.20944696587661793, + "step": 71100 + }, + { + "epoch": 12.31, + "eval_loss": Infinity, + "eval_runtime": 550.14, + "eval_samples_per_second": 20.488, + "eval_steps_per_second": 2.561, + "eval_wer": 0.20863800638762817, + "step": 71200 + }, + { + "epoch": 12.33, + "eval_loss": Infinity, + "eval_runtime": 546.3515, + "eval_samples_per_second": 20.63, + "eval_steps_per_second": 2.579, + "eval_wer": 0.20678895612708018, + "step": 71300 + }, + { + "epoch": 12.35, + "eval_loss": Infinity, + "eval_runtime": 546.7793, + "eval_samples_per_second": 20.613, + "eval_steps_per_second": 2.577, + "eval_wer": 0.20771348125735417, + "step": 71400 + }, + { + "epoch": 12.37, + "learning_rate": 5.3087092659167335e-05, + "loss": 0.0433, + "step": 71500 + }, + { + "epoch": 12.37, + "eval_loss": Infinity, + "eval_runtime": 548.6341, + "eval_samples_per_second": 20.544, + "eval_steps_per_second": 2.568, + "eval_wer": 0.20904773911581778, + "step": 71500 + }, + { + "epoch": 12.38, + "eval_loss": Infinity, + "eval_runtime": 548.8543, + "eval_samples_per_second": 20.536, + "eval_steps_per_second": 2.567, + "eval_wer": 0.20905824508320725, + "step": 71600 + }, + { + "epoch": 12.4, + "eval_loss": Infinity, + "eval_runtime": 547.0279, + "eval_samples_per_second": 20.604, + "eval_steps_per_second": 2.576, + "eval_wer": 0.21201042191965036, + "step": 71700 + }, + { + "epoch": 12.42, + "eval_loss": Infinity, + "eval_runtime": 546.0371, + "eval_samples_per_second": 20.641, + "eval_steps_per_second": 2.58, + "eval_wer": 0.20892166750714405, + "step": 71800 + }, + { + "epoch": 12.44, + "eval_loss": Infinity, + "eval_runtime": 546.5248, + "eval_samples_per_second": 20.623, + "eval_steps_per_second": 2.578, + "eval_wer": 0.20953101361573373, + "step": 71900 + }, + { + "epoch": 12.45, + "learning_rate": 5.1347558854227064e-05, + "loss": 0.0457, + "step": 72000 + }, + { + "epoch": 12.45, + "eval_loss": Infinity, + "eval_runtime": 547.1024, + "eval_samples_per_second": 20.601, + "eval_steps_per_second": 2.575, + "eval_wer": 0.20903723314842831, + "step": 72000 + }, + { + "epoch": 12.47, + "eval_loss": Infinity, + "eval_runtime": 546.2064, + "eval_samples_per_second": 20.635, + "eval_steps_per_second": 2.58, + "eval_wer": 0.20880610186585982, + "step": 72100 + }, + { + "epoch": 12.49, + "eval_loss": Infinity, + "eval_runtime": 545.9585, + "eval_samples_per_second": 20.644, + "eval_steps_per_second": 2.581, + "eval_wer": 0.20800764834425953, + "step": 72200 + }, + { + "epoch": 12.5, + "eval_loss": Infinity, + "eval_runtime": 546.2479, + "eval_samples_per_second": 20.633, + "eval_steps_per_second": 2.579, + "eval_wer": 0.20662086064884855, + "step": 72300 + }, + { + "epoch": 12.52, + "eval_loss": Infinity, + "eval_runtime": 550.549, + "eval_samples_per_second": 20.472, + "eval_steps_per_second": 2.559, + "eval_wer": 0.20978315683308119, + "step": 72400 + }, + { + "epoch": 12.54, + "learning_rate": 4.961150411689667e-05, + "loss": 0.0446, + "step": 72500 + }, + { + "epoch": 12.54, + "eval_loss": Infinity, + "eval_runtime": 549.0154, + "eval_samples_per_second": 20.529, + "eval_steps_per_second": 2.566, + "eval_wer": 0.20758740964868044, + "step": 72500 + }, + { + "epoch": 12.56, + "eval_loss": Infinity, + "eval_runtime": 547.3815, + "eval_samples_per_second": 20.591, + "eval_steps_per_second": 2.574, + "eval_wer": 0.20679946209446967, + "step": 72600 + }, + { + "epoch": 12.57, + "eval_loss": Infinity, + "eval_runtime": 547.8075, + "eval_samples_per_second": 20.575, + "eval_steps_per_second": 2.572, + "eval_wer": 0.20801815431164902, + "step": 72700 + }, + { + "epoch": 12.59, + "eval_loss": Infinity, + "eval_runtime": 546.6072, + "eval_samples_per_second": 20.62, + "eval_steps_per_second": 2.578, + "eval_wer": 0.21288241721297696, + "step": 72800 + }, + { + "epoch": 12.61, + "eval_loss": Infinity, + "eval_runtime": 550.7128, + "eval_samples_per_second": 20.466, + "eval_steps_per_second": 2.559, + "eval_wer": 0.21161119515885024, + "step": 72900 + }, + { + "epoch": 12.63, + "learning_rate": 4.787197031195639e-05, + "loss": 0.0423, + "step": 73000 + }, + { + "epoch": 12.63, + "eval_loss": Infinity, + "eval_runtime": 547.9244, + "eval_samples_per_second": 20.57, + "eval_steps_per_second": 2.572, + "eval_wer": 0.210791729702471, + "step": 73000 + }, + { + "epoch": 12.64, + "eval_loss": Infinity, + "eval_runtime": 546.7393, + "eval_samples_per_second": 20.615, + "eval_steps_per_second": 2.577, + "eval_wer": 0.20828080349638595, + "step": 73100 + }, + { + "epoch": 12.66, + "eval_loss": Infinity, + "eval_runtime": 549.7708, + "eval_samples_per_second": 20.501, + "eval_steps_per_second": 2.563, + "eval_wer": 0.20792360060514373, + "step": 73200 + }, + { + "epoch": 12.68, + "eval_loss": Infinity, + "eval_runtime": 548.6428, + "eval_samples_per_second": 20.543, + "eval_steps_per_second": 2.568, + "eval_wer": 0.2072932425617751, + "step": 73300 + }, + { + "epoch": 12.69, + "eval_loss": Infinity, + "eval_runtime": 559.0002, + "eval_samples_per_second": 20.163, + "eval_steps_per_second": 2.521, + "eval_wer": 0.20738779626828038, + "step": 73400 + }, + { + "epoch": 12.71, + "learning_rate": 4.613243650701612e-05, + "loss": 0.0443, + "step": 73500 + }, + { + "epoch": 12.71, + "eval_loss": Infinity, + "eval_runtime": 545.8124, + "eval_samples_per_second": 20.65, + "eval_steps_per_second": 2.581, + "eval_wer": 0.20659984871406958, + "step": 73500 + }, + { + "epoch": 12.73, + "eval_loss": Infinity, + "eval_runtime": 549.5227, + "eval_samples_per_second": 20.511, + "eval_steps_per_second": 2.564, + "eval_wer": 0.2069570516053118, + "step": 73600 + }, + { + "epoch": 12.75, + "eval_loss": Infinity, + "eval_runtime": 547.0702, + "eval_samples_per_second": 20.602, + "eval_steps_per_second": 2.576, + "eval_wer": 0.20542318036644813, + "step": 73700 + }, + { + "epoch": 12.76, + "eval_loss": Infinity, + "eval_runtime": 548.2885, + "eval_samples_per_second": 20.557, + "eval_steps_per_second": 2.57, + "eval_wer": 0.20436207766011094, + "step": 73800 + }, + { + "epoch": 12.78, + "eval_loss": Infinity, + "eval_runtime": 548.5659, + "eval_samples_per_second": 20.546, + "eval_steps_per_second": 2.569, + "eval_wer": 0.20449865523617414, + "step": 73900 + }, + { + "epoch": 12.8, + "learning_rate": 4.439290270207584e-05, + "loss": 0.0431, + "step": 74000 + }, + { + "epoch": 12.8, + "eval_loss": Infinity, + "eval_runtime": 548.4023, + "eval_samples_per_second": 20.552, + "eval_steps_per_second": 2.569, + "eval_wer": 0.20554925197512186, + "step": 74000 + }, + { + "epoch": 12.82, + "eval_loss": Infinity, + "eval_runtime": 550.149, + "eval_samples_per_second": 20.487, + "eval_steps_per_second": 2.561, + "eval_wer": 0.205486216170785, + "step": 74100 + }, + { + "epoch": 12.83, + "eval_loss": Infinity, + "eval_runtime": 547.5824, + "eval_samples_per_second": 20.583, + "eval_steps_per_second": 2.573, + "eval_wer": 0.20856446461590183, + "step": 74200 + }, + { + "epoch": 12.85, + "eval_loss": Infinity, + "eval_runtime": 546.9058, + "eval_samples_per_second": 20.609, + "eval_steps_per_second": 2.576, + "eval_wer": 0.20840687510505967, + "step": 74300 + }, + { + "epoch": 12.87, + "eval_loss": Infinity, + "eval_runtime": 547.6274, + "eval_samples_per_second": 20.582, + "eval_steps_per_second": 2.573, + "eval_wer": 0.2061270801815431, + "step": 74400 + }, + { + "epoch": 12.88, + "learning_rate": 4.265336889713556e-05, + "loss": 0.045, + "step": 74500 + }, + { + "epoch": 12.88, + "eval_loss": Infinity, + "eval_runtime": 548.5153, + "eval_samples_per_second": 20.548, + "eval_steps_per_second": 2.569, + "eval_wer": 0.20694654563792234, + "step": 74500 + }, + { + "epoch": 12.9, + "eval_loss": Infinity, + "eval_runtime": 548.6672, + "eval_samples_per_second": 20.543, + "eval_steps_per_second": 2.568, + "eval_wer": 0.20734577239872248, + "step": 74600 + }, + { + "epoch": 12.92, + "eval_loss": Infinity, + "eval_runtime": 552.9233, + "eval_samples_per_second": 20.384, + "eval_steps_per_second": 2.548, + "eval_wer": 0.20574886535552195, + "step": 74700 + }, + { + "epoch": 12.94, + "eval_loss": Infinity, + "eval_runtime": 550.6342, + "eval_samples_per_second": 20.469, + "eval_steps_per_second": 2.559, + "eval_wer": 0.20813371995293325, + "step": 74800 + }, + { + "epoch": 12.95, + "eval_loss": Infinity, + "eval_runtime": 546.873, + "eval_samples_per_second": 20.61, + "eval_steps_per_second": 2.576, + "eval_wer": 0.205948478735922, + "step": 74900 + }, + { + "epoch": 12.97, + "learning_rate": 4.091731415980517e-05, + "loss": 0.0434, + "step": 75000 + }, + { + "epoch": 12.97, + "eval_loss": Infinity, + "eval_runtime": 547.6534, + "eval_samples_per_second": 20.581, + "eval_steps_per_second": 2.573, + "eval_wer": 0.20497142376870062, + "step": 75000 + }, + { + "epoch": 12.99, + "eval_loss": Infinity, + "eval_runtime": 547.905, + "eval_samples_per_second": 20.571, + "eval_steps_per_second": 2.572, + "eval_wer": 0.2041939821818793, + "step": 75100 + }, + { + "epoch": 13.01, + "eval_loss": Infinity, + "eval_runtime": 546.051, + "eval_samples_per_second": 20.641, + "eval_steps_per_second": 2.58, + "eval_wer": 0.20416246427971088, + "step": 75200 + }, + { + "epoch": 13.02, + "eval_loss": Infinity, + "eval_runtime": 548.0237, + "eval_samples_per_second": 20.567, + "eval_steps_per_second": 2.571, + "eval_wer": 0.20353210623634224, + "step": 75300 + }, + { + "epoch": 13.04, + "eval_loss": Infinity, + "eval_runtime": 547.0355, + "eval_samples_per_second": 20.604, + "eval_steps_per_second": 2.576, + "eval_wer": 0.20444612539922677, + "step": 75400 + }, + { + "epoch": 13.06, + "learning_rate": 3.9177780354864895e-05, + "loss": 0.0388, + "step": 75500 + }, + { + "epoch": 13.06, + "eval_loss": Infinity, + "eval_runtime": 547.6747, + "eval_samples_per_second": 20.58, + "eval_steps_per_second": 2.573, + "eval_wer": 0.2026285930408472, + "step": 75500 + }, + { + "epoch": 13.08, + "eval_loss": Infinity, + "eval_runtime": 549.5817, + "eval_samples_per_second": 20.508, + "eval_steps_per_second": 2.564, + "eval_wer": 0.20371070768196337, + "step": 75600 + }, + { + "epoch": 13.09, + "eval_loss": Infinity, + "eval_runtime": 549.0065, + "eval_samples_per_second": 20.53, + "eval_steps_per_second": 2.566, + "eval_wer": 0.20430954782316355, + "step": 75700 + }, + { + "epoch": 13.11, + "eval_loss": Infinity, + "eval_runtime": 547.8794, + "eval_samples_per_second": 20.572, + "eval_steps_per_second": 2.572, + "eval_wer": 0.20384728525802656, + "step": 75800 + }, + { + "epoch": 13.13, + "eval_loss": Infinity, + "eval_runtime": 548.5189, + "eval_samples_per_second": 20.548, + "eval_steps_per_second": 2.569, + "eval_wer": 0.20399436880147925, + "step": 75900 + }, + { + "epoch": 13.14, + "learning_rate": 3.743824654992462e-05, + "loss": 0.0391, + "step": 76000 + }, + { + "epoch": 13.14, + "eval_loss": Infinity, + "eval_runtime": 547.8529, + "eval_samples_per_second": 20.573, + "eval_steps_per_second": 2.572, + "eval_wer": 0.20545469826861656, + "step": 76000 + }, + { + "epoch": 13.16, + "eval_loss": Infinity, + "eval_runtime": 547.706, + "eval_samples_per_second": 20.579, + "eval_steps_per_second": 2.573, + "eval_wer": 0.2059064548663641, + "step": 76100 + }, + { + "epoch": 13.18, + "eval_loss": Infinity, + "eval_runtime": 546.7268, + "eval_samples_per_second": 20.615, + "eval_steps_per_second": 2.577, + "eval_wer": 0.20568582955118508, + "step": 76200 + }, + { + "epoch": 13.2, + "eval_loss": Infinity, + "eval_runtime": 545.8487, + "eval_samples_per_second": 20.649, + "eval_steps_per_second": 2.581, + "eval_wer": 0.20443561943183727, + "step": 76300 + }, + { + "epoch": 13.21, + "eval_loss": Infinity, + "eval_runtime": 546.5302, + "eval_samples_per_second": 20.623, + "eval_steps_per_second": 2.578, + "eval_wer": 0.20482434022524795, + "step": 76400 + }, + { + "epoch": 13.23, + "learning_rate": 3.569871274498434e-05, + "loss": 0.0416, + "step": 76500 + }, + { + "epoch": 13.23, + "eval_loss": Infinity, + "eval_runtime": 548.7117, + "eval_samples_per_second": 20.541, + "eval_steps_per_second": 2.568, + "eval_wer": 0.20413094637754245, + "step": 76500 + }, + { + "epoch": 13.25, + "eval_loss": Infinity, + "eval_runtime": 548.0591, + "eval_samples_per_second": 20.565, + "eval_steps_per_second": 2.571, + "eval_wer": 0.2031328794755421, + "step": 76600 + }, + { + "epoch": 13.27, + "eval_loss": Infinity, + "eval_runtime": 547.9137, + "eval_samples_per_second": 20.571, + "eval_steps_per_second": 2.572, + "eval_wer": 0.20347957639939485, + "step": 76700 + }, + { + "epoch": 13.28, + "eval_loss": Infinity, + "eval_runtime": 547.587, + "eval_samples_per_second": 20.583, + "eval_steps_per_second": 2.573, + "eval_wer": 0.2036476718776265, + "step": 76800 + }, + { + "epoch": 13.3, + "eval_loss": Infinity, + "eval_runtime": 547.4785, + "eval_samples_per_second": 20.587, + "eval_steps_per_second": 2.574, + "eval_wer": 0.20268112287779458, + "step": 76900 + }, + { + "epoch": 13.32, + "learning_rate": 3.395917894004407e-05, + "loss": 0.0387, + "step": 77000 + }, + { + "epoch": 13.32, + "eval_loss": Infinity, + "eval_runtime": 546.9031, + "eval_samples_per_second": 20.609, + "eval_steps_per_second": 2.576, + "eval_wer": 0.20260758110606825, + "step": 77000 + }, + { + "epoch": 13.33, + "eval_loss": Infinity, + "eval_runtime": 550.3877, + "eval_samples_per_second": 20.478, + "eval_steps_per_second": 2.56, + "eval_wer": 0.20273365271474197, + "step": 77100 + }, + { + "epoch": 13.35, + "eval_loss": Infinity, + "eval_runtime": 548.8206, + "eval_samples_per_second": 20.537, + "eval_steps_per_second": 2.567, + "eval_wer": 0.20204025886703647, + "step": 77200 + }, + { + "epoch": 13.37, + "eval_loss": Infinity, + "eval_runtime": 547.3966, + "eval_samples_per_second": 20.59, + "eval_steps_per_second": 2.574, + "eval_wer": 0.2015254664649521, + "step": 77300 + }, + { + "epoch": 13.39, + "eval_loss": Infinity, + "eval_runtime": 547.7422, + "eval_samples_per_second": 20.577, + "eval_steps_per_second": 2.572, + "eval_wer": 0.20210329467137333, + "step": 77400 + }, + { + "epoch": 13.4, + "learning_rate": 3.221964513510379e-05, + "loss": 0.0388, + "step": 77500 + }, + { + "epoch": 13.4, + "eval_loss": Infinity, + "eval_runtime": 548.8405, + "eval_samples_per_second": 20.536, + "eval_steps_per_second": 2.567, + "eval_wer": 0.20255505126912085, + "step": 77500 + }, + { + "epoch": 13.42, + "eval_loss": Infinity, + "eval_runtime": 547.5989, + "eval_samples_per_second": 20.583, + "eval_steps_per_second": 2.573, + "eval_wer": 0.20247100353000505, + "step": 77600 + }, + { + "epoch": 13.44, + "eval_loss": Infinity, + "eval_runtime": 549.3386, + "eval_samples_per_second": 20.517, + "eval_steps_per_second": 2.565, + "eval_wer": 0.20259707513867878, + "step": 77700 + }, + { + "epoch": 13.46, + "eval_loss": Infinity, + "eval_runtime": 548.9936, + "eval_samples_per_second": 20.53, + "eval_steps_per_second": 2.567, + "eval_wer": 0.20168305597579425, + "step": 77800 + }, + { + "epoch": 13.47, + "eval_loss": Infinity, + "eval_runtime": 547.7403, + "eval_samples_per_second": 20.577, + "eval_steps_per_second": 2.572, + "eval_wer": 0.20236594385611026, + "step": 77900 + }, + { + "epoch": 13.49, + "learning_rate": 3.0480111330163512e-05, + "loss": 0.0393, + "step": 78000 + }, + { + "epoch": 13.49, + "eval_loss": Infinity, + "eval_runtime": 546.9778, + "eval_samples_per_second": 20.606, + "eval_steps_per_second": 2.576, + "eval_wer": 0.20218734241048916, + "step": 78000 + }, + { + "epoch": 13.51, + "eval_loss": Infinity, + "eval_runtime": 547.4243, + "eval_samples_per_second": 20.589, + "eval_steps_per_second": 2.574, + "eval_wer": 0.2026706169104051, + "step": 78100 + }, + { + "epoch": 13.52, + "eval_loss": Infinity, + "eval_runtime": 547.4439, + "eval_samples_per_second": 20.588, + "eval_steps_per_second": 2.574, + "eval_wer": 0.20266011094301564, + "step": 78200 + }, + { + "epoch": 13.54, + "eval_loss": Infinity, + "eval_runtime": 548.5146, + "eval_samples_per_second": 20.548, + "eval_steps_per_second": 2.569, + "eval_wer": 0.20126281728021517, + "step": 78300 + }, + { + "epoch": 13.56, + "eval_loss": Infinity, + "eval_runtime": 548.6545, + "eval_samples_per_second": 20.543, + "eval_steps_per_second": 2.568, + "eval_wer": 0.201105227769373, + "step": 78400 + }, + { + "epoch": 13.58, + "learning_rate": 2.8744056592833116e-05, + "loss": 0.0389, + "step": 78500 + }, + { + "epoch": 13.58, + "eval_loss": Infinity, + "eval_runtime": 548.7215, + "eval_samples_per_second": 20.54, + "eval_steps_per_second": 2.568, + "eval_wer": 0.20085308455202555, + "step": 78500 + }, + { + "epoch": 13.59, + "eval_loss": Infinity, + "eval_runtime": 549.8062, + "eval_samples_per_second": 20.5, + "eval_steps_per_second": 2.563, + "eval_wer": 0.20089510842158345, + "step": 78600 + }, + { + "epoch": 13.61, + "eval_loss": Infinity, + "eval_runtime": 588.3973, + "eval_samples_per_second": 19.155, + "eval_steps_per_second": 2.395, + "eval_wer": 0.20059043536728863, + "step": 78700 + }, + { + "epoch": 13.63, + "eval_loss": Infinity, + "eval_runtime": 552.7964, + "eval_samples_per_second": 20.389, + "eval_steps_per_second": 2.549, + "eval_wer": 0.20140990082366783, + "step": 78800 + }, + { + "epoch": 13.65, + "eval_loss": Infinity, + "eval_runtime": 550.5531, + "eval_samples_per_second": 20.472, + "eval_steps_per_second": 2.559, + "eval_wer": 0.20086359051941502, + "step": 78900 + }, + { + "epoch": 13.66, + "learning_rate": 2.700452278789284e-05, + "loss": 0.0413, + "step": 79000 + }, + { + "epoch": 13.66, + "eval_loss": Infinity, + "eval_runtime": 549.8536, + "eval_samples_per_second": 20.498, + "eval_steps_per_second": 2.563, + "eval_wer": 0.20187216338880484, + "step": 79000 + }, + { + "epoch": 13.68, + "eval_loss": Infinity, + "eval_runtime": 550.6749, + "eval_samples_per_second": 20.468, + "eval_steps_per_second": 2.559, + "eval_wer": 0.20218734241048916, + "step": 79100 + }, + { + "epoch": 13.7, + "eval_loss": Infinity, + "eval_runtime": 551.1265, + "eval_samples_per_second": 20.451, + "eval_steps_per_second": 2.557, + "eval_wer": 0.20192469322575224, + "step": 79200 + }, + { + "epoch": 13.71, + "eval_loss": Infinity, + "eval_runtime": 548.06, + "eval_samples_per_second": 20.565, + "eval_steps_per_second": 2.571, + "eval_wer": 0.20288073625819467, + "step": 79300 + }, + { + "epoch": 13.73, + "eval_loss": Infinity, + "eval_runtime": 549.0029, + "eval_samples_per_second": 20.53, + "eval_steps_per_second": 2.566, + "eval_wer": 0.20201924693225753, + "step": 79400 + }, + { + "epoch": 13.75, + "learning_rate": 2.5264988982952567e-05, + "loss": 0.0384, + "step": 79500 + }, + { + "epoch": 13.75, + "eval_loss": Infinity, + "eval_runtime": 547.9777, + "eval_samples_per_second": 20.568, + "eval_steps_per_second": 2.571, + "eval_wer": 0.20127332324760464, + "step": 79500 + }, + { + "epoch": 13.77, + "eval_loss": Infinity, + "eval_runtime": 549.5908, + "eval_samples_per_second": 20.508, + "eval_steps_per_second": 2.564, + "eval_wer": 0.2008320726172466, + "step": 79600 + }, + { + "epoch": 13.78, + "eval_loss": Infinity, + "eval_runtime": 550.7209, + "eval_samples_per_second": 20.466, + "eval_steps_per_second": 2.558, + "eval_wer": 0.20131534711716254, + "step": 79700 + }, + { + "epoch": 13.8, + "eval_loss": Infinity, + "eval_runtime": 549.4461, + "eval_samples_per_second": 20.513, + "eval_steps_per_second": 2.564, + "eval_wer": 0.20072701294335182, + "step": 79800 + }, + { + "epoch": 13.82, + "eval_loss": Infinity, + "eval_runtime": 550.7003, + "eval_samples_per_second": 20.467, + "eval_steps_per_second": 2.559, + "eval_wer": 0.20068498907379392, + "step": 79900 + }, + { + "epoch": 13.84, + "learning_rate": 2.3525455178012292e-05, + "loss": 0.0366, + "step": 80000 + }, + { + "epoch": 13.84, + "eval_loss": Infinity, + "eval_runtime": 549.1719, + "eval_samples_per_second": 20.524, + "eval_steps_per_second": 2.566, + "eval_wer": 0.2013363590519415, + "step": 80000 + }, + { + "epoch": 13.85, + "eval_loss": Infinity, + "eval_runtime": 549.0216, + "eval_samples_per_second": 20.529, + "eval_steps_per_second": 2.566, + "eval_wer": 0.2008320726172466, + "step": 80100 + }, + { + "epoch": 13.87, + "eval_loss": Infinity, + "eval_runtime": 549.1895, + "eval_samples_per_second": 20.523, + "eval_steps_per_second": 2.566, + "eval_wer": 0.2003172802151622, + "step": 80200 + }, + { + "epoch": 13.89, + "eval_loss": Infinity, + "eval_runtime": 551.531, + "eval_samples_per_second": 20.436, + "eval_steps_per_second": 2.555, + "eval_wer": 0.1995818624978988, + "step": 80300 + }, + { + "epoch": 13.91, + "eval_loss": Infinity, + "eval_runtime": 551.0755, + "eval_samples_per_second": 20.453, + "eval_steps_per_second": 2.557, + "eval_wer": 0.19938224911749874, + "step": 80400 + }, + { + "epoch": 13.92, + "learning_rate": 2.1785921373072014e-05, + "loss": 0.0368, + "step": 80500 + }, + { + "epoch": 13.92, + "eval_loss": Infinity, + "eval_runtime": 550.0799, + "eval_samples_per_second": 20.49, + "eval_steps_per_second": 2.561, + "eval_wer": 0.20009665489998318, + "step": 80500 + }, + { + "epoch": 13.94, + "eval_loss": Infinity, + "eval_runtime": 548.5676, + "eval_samples_per_second": 20.546, + "eval_steps_per_second": 2.569, + "eval_wer": 0.19951882669356194, + "step": 80600 + }, + { + "epoch": 13.96, + "eval_loss": Infinity, + "eval_runtime": 547.3994, + "eval_samples_per_second": 20.59, + "eval_steps_per_second": 2.574, + "eval_wer": 0.20012817280215162, + "step": 80700 + }, + { + "epoch": 13.97, + "eval_loss": Infinity, + "eval_runtime": 547.7377, + "eval_samples_per_second": 20.577, + "eval_steps_per_second": 2.572, + "eval_wer": 0.19902504622625652, + "step": 80800 + }, + { + "epoch": 13.99, + "eval_loss": Infinity, + "eval_runtime": 547.4485, + "eval_samples_per_second": 20.588, + "eval_steps_per_second": 2.574, + "eval_wer": 0.20012817280215162, + "step": 80900 + }, + { + "epoch": 14.01, + "learning_rate": 2.0046387568131736e-05, + "loss": 0.0362, + "step": 81000 + }, + { + "epoch": 14.01, + "eval_loss": Infinity, + "eval_runtime": 549.1806, + "eval_samples_per_second": 20.523, + "eval_steps_per_second": 2.566, + "eval_wer": 0.19897251638930913, + "step": 81000 + }, + { + "epoch": 14.03, + "eval_loss": Infinity, + "eval_runtime": 550.171, + "eval_samples_per_second": 20.486, + "eval_steps_per_second": 2.561, + "eval_wer": 0.19812153303076147, + "step": 81100 + }, + { + "epoch": 14.04, + "eval_loss": Infinity, + "eval_runtime": 548.9202, + "eval_samples_per_second": 20.533, + "eval_steps_per_second": 2.567, + "eval_wer": 0.19864683140023534, + "step": 81200 + }, + { + "epoch": 14.06, + "eval_loss": Infinity, + "eval_runtime": 549.2666, + "eval_samples_per_second": 20.52, + "eval_steps_per_second": 2.565, + "eval_wer": 0.19794293158514037, + "step": 81300 + }, + { + "epoch": 14.08, + "eval_loss": Infinity, + "eval_runtime": 548.6556, + "eval_samples_per_second": 20.543, + "eval_steps_per_second": 2.568, + "eval_wer": 0.19731257354177173, + "step": 81400 + }, + { + "epoch": 14.1, + "learning_rate": 1.8306853763191462e-05, + "loss": 0.0353, + "step": 81500 + }, + { + "epoch": 14.1, + "eval_loss": Infinity, + "eval_runtime": 548.2556, + "eval_samples_per_second": 20.558, + "eval_steps_per_second": 2.57, + "eval_wer": 0.1979639435199193, + "step": 81500 + }, + { + "epoch": 14.11, + "eval_loss": Infinity, + "eval_runtime": 549.3102, + "eval_samples_per_second": 20.518, + "eval_steps_per_second": 2.565, + "eval_wer": 0.1986573373676248, + "step": 81600 + }, + { + "epoch": 14.13, + "eval_loss": Infinity, + "eval_runtime": 548.0325, + "eval_samples_per_second": 20.566, + "eval_steps_per_second": 2.571, + "eval_wer": 0.1978798957808035, + "step": 81700 + }, + { + "epoch": 14.15, + "eval_loss": Infinity, + "eval_runtime": 547.6151, + "eval_samples_per_second": 20.582, + "eval_steps_per_second": 2.573, + "eval_wer": 0.1972390317700454, + "step": 81800 + }, + { + "epoch": 14.16, + "eval_loss": Infinity, + "eval_runtime": 548.5829, + "eval_samples_per_second": 20.546, + "eval_steps_per_second": 2.568, + "eval_wer": 0.19802697932425617, + "step": 81900 + }, + { + "epoch": 14.18, + "learning_rate": 1.6567319958251187e-05, + "loss": 0.0344, + "step": 82000 + }, + { + "epoch": 14.18, + "eval_loss": Infinity, + "eval_runtime": 548.2811, + "eval_samples_per_second": 20.557, + "eval_steps_per_second": 2.57, + "eval_wer": 0.1977853420742982, + "step": 82000 + }, + { + "epoch": 14.2, + "eval_loss": Infinity, + "eval_runtime": 556.1898, + "eval_samples_per_second": 20.265, + "eval_steps_per_second": 2.533, + "eval_wer": 0.19866784333501428, + "step": 82100 + }, + { + "epoch": 14.22, + "eval_loss": Infinity, + "eval_runtime": 556.5263, + "eval_samples_per_second": 20.252, + "eval_steps_per_second": 2.532, + "eval_wer": 0.1974596570852244, + "step": 82200 + }, + { + "epoch": 14.23, + "eval_loss": Infinity, + "eval_runtime": 549.5075, + "eval_samples_per_second": 20.511, + "eval_steps_per_second": 2.564, + "eval_wer": 0.1975121869221718, + "step": 82300 + }, + { + "epoch": 14.25, + "eval_loss": Infinity, + "eval_runtime": 550.8891, + "eval_samples_per_second": 20.46, + "eval_steps_per_second": 2.558, + "eval_wer": 0.19743864515044546, + "step": 82400 + }, + { + "epoch": 14.27, + "learning_rate": 1.4827786153310911e-05, + "loss": 0.0348, + "step": 82500 + }, + { + "epoch": 14.27, + "eval_loss": Infinity, + "eval_runtime": 550.8558, + "eval_samples_per_second": 20.461, + "eval_steps_per_second": 2.558, + "eval_wer": 0.19743864515044546, + "step": 82500 + }, + { + "epoch": 14.29, + "eval_loss": Infinity, + "eval_runtime": 548.9923, + "eval_samples_per_second": 20.53, + "eval_steps_per_second": 2.567, + "eval_wer": 0.19740712724827703, + "step": 82600 + }, + { + "epoch": 14.3, + "eval_loss": Infinity, + "eval_runtime": 549.7751, + "eval_samples_per_second": 20.501, + "eval_steps_per_second": 2.563, + "eval_wer": 0.19762775256345605, + "step": 82700 + }, + { + "epoch": 14.32, + "eval_loss": Infinity, + "eval_runtime": 549.3637, + "eval_samples_per_second": 20.516, + "eval_steps_per_second": 2.565, + "eval_wer": 0.19734409144394016, + "step": 82800 + }, + { + "epoch": 14.34, + "eval_loss": Infinity, + "eval_runtime": 549.8173, + "eval_samples_per_second": 20.5, + "eval_steps_per_second": 2.563, + "eval_wer": 0.197428139183056, + "step": 82900 + }, + { + "epoch": 14.35, + "learning_rate": 1.3088252348370636e-05, + "loss": 0.0328, + "step": 83000 + }, + { + "epoch": 14.35, + "eval_loss": Infinity, + "eval_runtime": 548.4364, + "eval_samples_per_second": 20.551, + "eval_steps_per_second": 2.569, + "eval_wer": 0.19799546142208774, + "step": 83000 + }, + { + "epoch": 14.37, + "eval_loss": Infinity, + "eval_runtime": 548.2968, + "eval_samples_per_second": 20.556, + "eval_steps_per_second": 2.57, + "eval_wer": 0.1978798957808035, + "step": 83100 + }, + { + "epoch": 14.39, + "eval_loss": Infinity, + "eval_runtime": 548.7906, + "eval_samples_per_second": 20.538, + "eval_steps_per_second": 2.567, + "eval_wer": 0.197428139183056, + "step": 83200 + }, + { + "epoch": 14.41, + "eval_loss": Infinity, + "eval_runtime": 548.8022, + "eval_samples_per_second": 20.537, + "eval_steps_per_second": 2.567, + "eval_wer": 0.19744915111783493, + "step": 83300 + }, + { + "epoch": 14.42, + "eval_loss": Infinity, + "eval_runtime": 548.604, + "eval_samples_per_second": 20.545, + "eval_steps_per_second": 2.568, + "eval_wer": 0.19727054967221383, + "step": 83400 + }, + { + "epoch": 14.44, + "learning_rate": 1.135219761104024e-05, + "loss": 0.0351, + "step": 83500 + }, + { + "epoch": 14.44, + "eval_loss": Infinity, + "eval_runtime": 548.3355, + "eval_samples_per_second": 20.555, + "eval_steps_per_second": 2.57, + "eval_wer": 0.19730206757438226, + "step": 83500 + }, + { + "epoch": 14.46, + "eval_loss": Infinity, + "eval_runtime": 548.7268, + "eval_samples_per_second": 20.54, + "eval_steps_per_second": 2.568, + "eval_wer": 0.1972390317700454, + "step": 83600 + }, + { + "epoch": 14.48, + "eval_loss": Infinity, + "eval_runtime": 548.6096, + "eval_samples_per_second": 20.545, + "eval_steps_per_second": 2.568, + "eval_wer": 0.19758572869389812, + "step": 83700 + }, + { + "epoch": 14.49, + "eval_loss": Infinity, + "eval_runtime": 546.9624, + "eval_samples_per_second": 20.607, + "eval_steps_per_second": 2.576, + "eval_wer": 0.19687132291141368, + "step": 83800 + }, + { + "epoch": 14.51, + "eval_loss": Infinity, + "eval_runtime": 548.7393, + "eval_samples_per_second": 20.54, + "eval_steps_per_second": 2.568, + "eval_wer": 0.19694486468314001, + "step": 83900 + }, + { + "epoch": 14.53, + "learning_rate": 9.612663806099964e-06, + "loss": 0.0329, + "step": 84000 + }, + { + "epoch": 14.53, + "eval_loss": Infinity, + "eval_runtime": 548.6856, + "eval_samples_per_second": 20.542, + "eval_steps_per_second": 2.568, + "eval_wer": 0.1965351319549504, + "step": 84000 + }, + { + "epoch": 14.55, + "eval_loss": Infinity, + "eval_runtime": 560.2236, + "eval_samples_per_second": 20.119, + "eval_steps_per_second": 2.515, + "eval_wer": 0.19655614388972936, + "step": 84100 + }, + { + "epoch": 14.56, + "eval_loss": Infinity, + "eval_runtime": 548.2121, + "eval_samples_per_second": 20.56, + "eval_steps_per_second": 2.57, + "eval_wer": 0.1964090603462767, + "step": 84200 + }, + { + "epoch": 14.58, + "eval_loss": Infinity, + "eval_runtime": 548.7406, + "eval_samples_per_second": 20.54, + "eval_steps_per_second": 2.568, + "eval_wer": 0.19682929904185578, + "step": 84300 + }, + { + "epoch": 14.6, + "eval_loss": Infinity, + "eval_runtime": 549.4063, + "eval_samples_per_second": 20.515, + "eval_steps_per_second": 2.565, + "eval_wer": 0.1963985543788872, + "step": 84400 + }, + { + "epoch": 14.61, + "learning_rate": 7.876609068769568e-06, + "loss": 0.036, + "step": 84500 + }, + { + "epoch": 14.61, + "eval_loss": Infinity, + "eval_runtime": 549.2923, + "eval_samples_per_second": 20.519, + "eval_steps_per_second": 2.565, + "eval_wer": 0.1965456379223399, + "step": 84500 + }, + { + "epoch": 14.63, + "eval_loss": Infinity, + "eval_runtime": 547.7858, + "eval_samples_per_second": 20.576, + "eval_steps_per_second": 2.572, + "eval_wer": 0.19636703647671877, + "step": 84600 + }, + { + "epoch": 14.65, + "eval_loss": Infinity, + "eval_runtime": 548.7123, + "eval_samples_per_second": 20.541, + "eval_steps_per_second": 2.568, + "eval_wer": 0.19675575727012942, + "step": 84700 + }, + { + "epoch": 14.67, + "eval_loss": Infinity, + "eval_runtime": 549.2306, + "eval_samples_per_second": 20.521, + "eval_steps_per_second": 2.565, + "eval_wer": 0.19690284081358211, + "step": 84800 + }, + { + "epoch": 14.68, + "eval_loss": Infinity, + "eval_runtime": 548.8397, + "eval_samples_per_second": 20.536, + "eval_steps_per_second": 2.567, + "eval_wer": 0.19665069759623466, + "step": 84900 + }, + { + "epoch": 14.7, + "learning_rate": 6.1370752638292925e-06, + "loss": 0.0322, + "step": 85000 + }, + { + "epoch": 14.7, + "eval_loss": Infinity, + "eval_runtime": 548.3915, + "eval_samples_per_second": 20.553, + "eval_steps_per_second": 2.569, + "eval_wer": 0.19657715582450833, + "step": 85000 + }, + { + "epoch": 14.72, + "eval_loss": Infinity, + "eval_runtime": 547.5876, + "eval_samples_per_second": 20.583, + "eval_steps_per_second": 2.573, + "eval_wer": 0.19665069759623466, + "step": 85100 + }, + { + "epoch": 14.74, + "eval_loss": Infinity, + "eval_runtime": 548.4879, + "eval_samples_per_second": 20.549, + "eval_steps_per_second": 2.569, + "eval_wer": 0.1965456379223399, + "step": 85200 + }, + { + "epoch": 14.75, + "eval_loss": Infinity, + "eval_runtime": 549.2569, + "eval_samples_per_second": 20.52, + "eval_steps_per_second": 2.565, + "eval_wer": 0.1963985543788872, + "step": 85300 + }, + { + "epoch": 14.77, + "eval_loss": Infinity, + "eval_runtime": 548.644, + "eval_samples_per_second": 20.543, + "eval_steps_per_second": 2.568, + "eval_wer": 0.19644057824844513, + "step": 85400 + }, + { + "epoch": 14.79, + "learning_rate": 4.397541458889018e-06, + "loss": 0.0321, + "step": 85500 + }, + { + "epoch": 14.79, + "eval_loss": Infinity, + "eval_runtime": 547.1252, + "eval_samples_per_second": 20.6, + "eval_steps_per_second": 2.575, + "eval_wer": 0.1963565305093293, + "step": 85500 + }, + { + "epoch": 14.8, + "eval_loss": Infinity, + "eval_runtime": 551.1899, + "eval_samples_per_second": 20.448, + "eval_steps_per_second": 2.556, + "eval_wer": 0.1962094469658766, + "step": 85600 + }, + { + "epoch": 14.82, + "eval_loss": Infinity, + "eval_runtime": 564.4339, + "eval_samples_per_second": 19.969, + "eval_steps_per_second": 2.496, + "eval_wer": 0.19603084552025551, + "step": 85700 + }, + { + "epoch": 14.84, + "eval_loss": Infinity, + "eval_runtime": 555.5114, + "eval_samples_per_second": 20.289, + "eval_steps_per_second": 2.536, + "eval_wer": 0.1959467977811397, + "step": 85800 + }, + { + "epoch": 14.86, + "eval_loss": Infinity, + "eval_runtime": 551.0288, + "eval_samples_per_second": 20.454, + "eval_steps_per_second": 2.557, + "eval_wer": 0.19618843503109767, + "step": 85900 + }, + { + "epoch": 14.87, + "learning_rate": 2.6580076539487416e-06, + "loss": 0.0341, + "step": 86000 + }, + { + "epoch": 14.87, + "eval_loss": Infinity, + "eval_runtime": 552.5092, + "eval_samples_per_second": 20.4, + "eval_steps_per_second": 2.55, + "eval_wer": 0.19611489325937131, + "step": 86000 + }, + { + "epoch": 14.89, + "eval_loss": Infinity, + "eval_runtime": 551.7014, + "eval_samples_per_second": 20.43, + "eval_steps_per_second": 2.554, + "eval_wer": 0.19637754244410827, + "step": 86100 + }, + { + "epoch": 14.91, + "eval_loss": Infinity, + "eval_runtime": 551.3725, + "eval_samples_per_second": 20.442, + "eval_steps_per_second": 2.555, + "eval_wer": 0.19624096486804504, + "step": 86200 + }, + { + "epoch": 14.93, + "eval_loss": Infinity, + "eval_runtime": 551.3971, + "eval_samples_per_second": 20.441, + "eval_steps_per_second": 2.555, + "eval_wer": 0.19617792906370818, + "step": 86300 + }, + { + "epoch": 14.94, + "eval_loss": Infinity, + "eval_runtime": 548.852, + "eval_samples_per_second": 20.536, + "eval_steps_per_second": 2.567, + "eval_wer": 0.19632501260716087, + "step": 86400 + }, + { + "epoch": 14.96, + "learning_rate": 9.184738490084656e-07, + "loss": 0.0338, + "step": 86500 + }, + { + "epoch": 14.96, + "eval_loss": Infinity, + "eval_runtime": 549.3084, + "eval_samples_per_second": 20.519, + "eval_steps_per_second": 2.565, + "eval_wer": 0.19634602454193983, + "step": 86500 + }, + { + "epoch": 14.98, + "eval_loss": Infinity, + "eval_runtime": 548.1703, + "eval_samples_per_second": 20.561, + "eval_steps_per_second": 2.57, + "eval_wer": 0.19627248277021347, + "step": 86600 + }, + { + "epoch": 14.99, + "eval_loss": Infinity, + "eval_runtime": 548.1231, + "eval_samples_per_second": 20.563, + "eval_steps_per_second": 2.571, + "eval_wer": 0.19625147083543454, + "step": 86700 + }, + { + "epoch": 15.0, + "step": 86730, + "total_flos": 1.1589202082196755e+20, + "train_loss": 0.15599208657172234, + "train_runtime": 535995.9461, + "train_samples_per_second": 1.294, + "train_steps_per_second": 0.162 + } + ], + "max_steps": 86730, + "num_train_epochs": 15, + "total_flos": 1.1589202082196755e+20, + "trial_name": null, + "trial_params": null +}