{ "best_metric": null, "best_model_checkpoint": null, "epoch": 15.0, "global_step": 86730, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.02, "eval_loss": Infinity, "eval_runtime": 555.4159, "eval_samples_per_second": 20.293, "eval_steps_per_second": 2.537, "eval_wer": 1.0, "step": 100 }, { "epoch": 0.03, "eval_loss": Infinity, "eval_runtime": 545.0664, "eval_samples_per_second": 20.678, "eval_steps_per_second": 2.585, "eval_wer": 1.0, "step": 200 }, { "epoch": 0.05, "eval_loss": Infinity, "eval_runtime": 543.6935, "eval_samples_per_second": 20.73, "eval_steps_per_second": 2.592, "eval_wer": 0.999978988065221, "step": 300 }, { "epoch": 0.07, "eval_loss": Infinity, "eval_runtime": 546.0816, "eval_samples_per_second": 20.64, "eval_steps_per_second": 2.58, "eval_wer": 0.7648344259539418, "step": 400 }, { "epoch": 0.09, "learning_rate": 0.0002982, "loss": 3.8863, "step": 500 }, { "epoch": 0.09, "eval_loss": Infinity, "eval_runtime": 544.2871, "eval_samples_per_second": 20.708, "eval_steps_per_second": 2.589, "eval_wer": 0.6947386115313499, "step": 500 }, { "epoch": 0.1, "eval_loss": Infinity, "eval_runtime": 544.7171, "eval_samples_per_second": 20.691, "eval_steps_per_second": 2.587, "eval_wer": 0.6413262733232477, "step": 600 }, { "epoch": 0.12, "eval_loss": Infinity, "eval_runtime": 545.5744, "eval_samples_per_second": 20.659, "eval_steps_per_second": 2.583, "eval_wer": 0.5953521600268953, "step": 700 }, { "epoch": 0.14, "eval_loss": Infinity, "eval_runtime": 545.5238, "eval_samples_per_second": 20.661, "eval_steps_per_second": 2.583, "eval_wer": 0.619494873087914, "step": 800 }, { "epoch": 0.16, "eval_loss": Infinity, "eval_runtime": 544.0596, "eval_samples_per_second": 20.716, "eval_steps_per_second": 2.59, "eval_wer": 0.530624894940326, "step": 900 }, { "epoch": 0.17, "learning_rate": 0.0002982709033978893, "loss": 0.5864, "step": 1000 }, { "epoch": 0.17, "eval_loss": Infinity, "eval_runtime": 544.4141, "eval_samples_per_second": 20.703, "eval_steps_per_second": 2.588, "eval_wer": 0.5510379895780804, "step": 1000 }, { "epoch": 0.19, "eval_loss": Infinity, "eval_runtime": 549.751, "eval_samples_per_second": 20.502, "eval_steps_per_second": 2.563, "eval_wer": 0.5625105059673895, "step": 1100 }, { "epoch": 0.21, "eval_loss": Infinity, "eval_runtime": 543.401, "eval_samples_per_second": 20.742, "eval_steps_per_second": 2.593, "eval_wer": 0.5268742645822827, "step": 1200 }, { "epoch": 0.22, "eval_loss": Infinity, "eval_runtime": 543.2604, "eval_samples_per_second": 20.747, "eval_steps_per_second": 2.594, "eval_wer": 0.4834425953941839, "step": 1300 }, { "epoch": 0.24, "eval_loss": Infinity, "eval_runtime": 544.1865, "eval_samples_per_second": 20.712, "eval_steps_per_second": 2.589, "eval_wer": 0.4874138510674063, "step": 1400 }, { "epoch": 0.26, "learning_rate": 0.00029653136959294907, "loss": 0.4471, "step": 1500 }, { "epoch": 0.26, "eval_loss": Infinity, "eval_runtime": 543.1806, "eval_samples_per_second": 20.75, "eval_steps_per_second": 2.594, "eval_wer": 0.466559505799294, "step": 1500 }, { "epoch": 0.28, "eval_loss": Infinity, "eval_runtime": 543.9283, "eval_samples_per_second": 20.721, "eval_steps_per_second": 2.59, "eval_wer": 0.4632816439737771, "step": 1600 }, { "epoch": 0.29, "eval_loss": Infinity, "eval_runtime": 543.32, "eval_samples_per_second": 20.745, "eval_steps_per_second": 2.593, "eval_wer": 0.4523029080517734, "step": 1700 }, { "epoch": 0.31, "eval_loss": Infinity, "eval_runtime": 542.6473, "eval_samples_per_second": 20.77, "eval_steps_per_second": 2.597, "eval_wer": 0.45108421583459407, "step": 1800 }, { "epoch": 0.33, "eval_loss": Infinity, "eval_runtime": 544.9665, "eval_samples_per_second": 20.682, "eval_steps_per_second": 2.585, "eval_wer": 0.46307152462598755, "step": 1900 }, { "epoch": 0.35, "learning_rate": 0.00029479183578800877, "loss": 0.4075, "step": 2000 }, { "epoch": 0.35, "eval_loss": Infinity, "eval_runtime": 543.0548, "eval_samples_per_second": 20.755, "eval_steps_per_second": 2.595, "eval_wer": 0.4614641116153975, "step": 2000 }, { "epoch": 0.36, "eval_loss": Infinity, "eval_runtime": 543.3783, "eval_samples_per_second": 20.742, "eval_steps_per_second": 2.593, "eval_wer": 0.4452113800638763, "step": 2100 }, { "epoch": 0.38, "eval_loss": Infinity, "eval_runtime": 556.7449, "eval_samples_per_second": 20.244, "eval_steps_per_second": 2.531, "eval_wer": 0.438424525130274, "step": 2200 }, { "epoch": 0.4, "eval_loss": Infinity, "eval_runtime": 545.6186, "eval_samples_per_second": 20.657, "eval_steps_per_second": 2.582, "eval_wer": 0.4395381576735586, "step": 2300 }, { "epoch": 0.42, "eval_loss": Infinity, "eval_runtime": 548.6849, "eval_samples_per_second": 20.542, "eval_steps_per_second": 2.568, "eval_wer": 0.432898386283409, "step": 2400 }, { "epoch": 0.43, "learning_rate": 0.0002930523019830685, "loss": 0.3885, "step": 2500 }, { "epoch": 0.43, "eval_loss": Infinity, "eval_runtime": 543.661, "eval_samples_per_second": 20.732, "eval_steps_per_second": 2.592, "eval_wer": 0.42552319717599596, "step": 2500 }, { "epoch": 0.45, "eval_loss": Infinity, "eval_runtime": 544.3496, "eval_samples_per_second": 20.705, "eval_steps_per_second": 2.588, "eval_wer": 0.4184106572533199, "step": 2600 }, { "epoch": 0.47, "eval_loss": Infinity, "eval_runtime": 545.2818, "eval_samples_per_second": 20.67, "eval_steps_per_second": 2.584, "eval_wer": 0.42287569339384773, "step": 2700 }, { "epoch": 0.48, "eval_loss": Infinity, "eval_runtime": 543.2493, "eval_samples_per_second": 20.747, "eval_steps_per_second": 2.594, "eval_wer": 0.40858757774415866, "step": 2800 }, { "epoch": 0.5, "eval_loss": Infinity, "eval_runtime": 544.043, "eval_samples_per_second": 20.717, "eval_steps_per_second": 2.59, "eval_wer": 0.41017397881996975, "step": 2900 }, { "epoch": 0.52, "learning_rate": 0.0002913127681781282, "loss": 0.3744, "step": 3000 }, { "epoch": 0.52, "eval_loss": Infinity, "eval_runtime": 546.2103, "eval_samples_per_second": 20.635, "eval_steps_per_second": 2.58, "eval_wer": 0.3903597243234157, "step": 3000 }, { "epoch": 0.54, "eval_loss": Infinity, "eval_runtime": 545.1789, "eval_samples_per_second": 20.674, "eval_steps_per_second": 2.584, "eval_wer": 0.39412086064884855, "step": 3100 }, { "epoch": 0.55, "eval_loss": Infinity, "eval_runtime": 544.832, "eval_samples_per_second": 20.687, "eval_steps_per_second": 2.586, "eval_wer": 0.38530635400907715, "step": 3200 }, { "epoch": 0.57, "eval_loss": Infinity, "eval_runtime": 543.4333, "eval_samples_per_second": 20.74, "eval_steps_per_second": 2.593, "eval_wer": 0.38726046394351993, "step": 3300 }, { "epoch": 0.59, "eval_loss": Infinity, "eval_runtime": 546.7602, "eval_samples_per_second": 20.614, "eval_steps_per_second": 2.577, "eval_wer": 0.3931753235837956, "step": 3400 }, { "epoch": 0.61, "learning_rate": 0.00028957323437318796, "loss": 0.3538, "step": 3500 }, { "epoch": 0.61, "eval_loss": Infinity, "eval_runtime": 545.2677, "eval_samples_per_second": 20.671, "eval_steps_per_second": 2.584, "eval_wer": 0.38855269793242564, "step": 3500 }, { "epoch": 0.62, "eval_loss": Infinity, "eval_runtime": 542.3889, "eval_samples_per_second": 20.78, "eval_steps_per_second": 2.598, "eval_wer": 0.4128635064716759, "step": 3600 }, { "epoch": 0.64, "eval_loss": Infinity, "eval_runtime": 542.5923, "eval_samples_per_second": 20.773, "eval_steps_per_second": 2.597, "eval_wer": 0.3857370986720457, "step": 3700 }, { "epoch": 0.66, "eval_loss": Infinity, "eval_runtime": 543.4133, "eval_samples_per_second": 20.741, "eval_steps_per_second": 2.593, "eval_wer": 0.38266935619431836, "step": 3800 }, { "epoch": 0.67, "eval_loss": Infinity, "eval_runtime": 543.805, "eval_samples_per_second": 20.726, "eval_steps_per_second": 2.591, "eval_wer": 0.39107413010590014, "step": 3900 }, { "epoch": 0.69, "learning_rate": 0.0002878337005682477, "loss": 0.3577, "step": 4000 }, { "epoch": 0.69, "eval_loss": Infinity, "eval_runtime": 544.2518, "eval_samples_per_second": 20.709, "eval_steps_per_second": 2.589, "eval_wer": 0.4018427466801143, "step": 4000 }, { "epoch": 0.71, "eval_loss": Infinity, "eval_runtime": 541.8941, "eval_samples_per_second": 20.799, "eval_steps_per_second": 2.6, "eval_wer": 0.39127374348630023, "step": 4100 }, { "epoch": 0.73, "eval_loss": Infinity, "eval_runtime": 542.2205, "eval_samples_per_second": 20.787, "eval_steps_per_second": 2.599, "eval_wer": 0.3795175659774752, "step": 4200 }, { "epoch": 0.74, "eval_loss": Infinity, "eval_runtime": 540.8985, "eval_samples_per_second": 20.838, "eval_steps_per_second": 2.605, "eval_wer": 0.3949193141704488, "step": 4300 }, { "epoch": 0.76, "eval_loss": Infinity, "eval_runtime": 541.2726, "eval_samples_per_second": 20.823, "eval_steps_per_second": 2.603, "eval_wer": 0.38375147083543454, "step": 4400 }, { "epoch": 0.78, "learning_rate": 0.0002860941667633074, "loss": 0.349, "step": 4500 }, { "epoch": 0.78, "eval_loss": Infinity, "eval_runtime": 546.7973, "eval_samples_per_second": 20.613, "eval_steps_per_second": 2.577, "eval_wer": 0.37175365607665156, "step": 4500 }, { "epoch": 0.8, "eval_loss": Infinity, "eval_runtime": 543.3484, "eval_samples_per_second": 20.744, "eval_steps_per_second": 2.593, "eval_wer": 0.36440998487140697, "step": 4600 }, { "epoch": 0.81, "eval_loss": Infinity, "eval_runtime": 542.3944, "eval_samples_per_second": 20.78, "eval_steps_per_second": 2.598, "eval_wer": 0.3591780131114473, "step": 4700 }, { "epoch": 0.83, "eval_loss": Infinity, "eval_runtime": 543.0473, "eval_samples_per_second": 20.755, "eval_steps_per_second": 2.595, "eval_wer": 0.3694213313161876, "step": 4800 }, { "epoch": 0.85, "eval_loss": Infinity, "eval_runtime": 542.8039, "eval_samples_per_second": 20.764, "eval_steps_per_second": 2.596, "eval_wer": 0.36223524962178516, "step": 4900 }, { "epoch": 0.86, "learning_rate": 0.00028435463295836715, "loss": 0.327, "step": 5000 }, { "epoch": 0.86, "eval_loss": Infinity, "eval_runtime": 542.4774, "eval_samples_per_second": 20.777, "eval_steps_per_second": 2.597, "eval_wer": 0.359083459404942, "step": 5000 }, { "epoch": 0.88, "eval_loss": Infinity, "eval_runtime": 546.0865, "eval_samples_per_second": 20.64, "eval_steps_per_second": 2.58, "eval_wer": 0.37074508320726174, "step": 5100 }, { "epoch": 0.9, "eval_loss": Infinity, "eval_runtime": 543.8013, "eval_samples_per_second": 20.726, "eval_steps_per_second": 2.591, "eval_wer": 0.35611027063371997, "step": 5200 }, { "epoch": 0.92, "eval_loss": Infinity, "eval_runtime": 542.7376, "eval_samples_per_second": 20.767, "eval_steps_per_second": 2.596, "eval_wer": 0.3559421751554883, "step": 5300 }, { "epoch": 0.93, "eval_loss": Infinity, "eval_runtime": 541.9303, "eval_samples_per_second": 20.798, "eval_steps_per_second": 2.6, "eval_wer": 0.36291813750210117, "step": 5400 }, { "epoch": 0.95, "learning_rate": 0.00028261509915342685, "loss": 0.3328, "step": 5500 }, { "epoch": 0.95, "eval_loss": Infinity, "eval_runtime": 541.7032, "eval_samples_per_second": 20.807, "eval_steps_per_second": 2.601, "eval_wer": 0.35176080013447636, "step": 5500 }, { "epoch": 0.97, "eval_loss": Infinity, "eval_runtime": 542.8204, "eval_samples_per_second": 20.764, "eval_steps_per_second": 2.596, "eval_wer": 0.34550974953773744, "step": 5600 }, { "epoch": 0.99, "eval_loss": Infinity, "eval_runtime": 544.376, "eval_samples_per_second": 20.704, "eval_steps_per_second": 2.588, "eval_wer": 0.3792023869557909, "step": 5700 }, { "epoch": 1.0, "eval_loss": Infinity, "eval_runtime": 543.1296, "eval_samples_per_second": 20.752, "eval_steps_per_second": 2.594, "eval_wer": 0.35637291981845687, "step": 5800 }, { "epoch": 1.02, "eval_loss": Infinity, "eval_runtime": 542.0195, "eval_samples_per_second": 20.794, "eval_steps_per_second": 2.6, "eval_wer": 0.3562363422423937, "step": 5900 }, { "epoch": 1.04, "learning_rate": 0.0002808755653484866, "loss": 0.2984, "step": 6000 }, { "epoch": 1.04, "eval_loss": Infinity, "eval_runtime": 542.3963, "eval_samples_per_second": 20.78, "eval_steps_per_second": 2.598, "eval_wer": 0.34357665153807365, "step": 6000 }, { "epoch": 1.05, "eval_loss": Infinity, "eval_runtime": 542.7224, "eval_samples_per_second": 20.768, "eval_steps_per_second": 2.596, "eval_wer": 0.34884014120020174, "step": 6100 }, { "epoch": 1.07, "eval_loss": Infinity, "eval_runtime": 541.1971, "eval_samples_per_second": 20.826, "eval_steps_per_second": 2.603, "eval_wer": 0.3464973104723483, "step": 6200 }, { "epoch": 1.09, "eval_loss": Infinity, "eval_runtime": 542.2512, "eval_samples_per_second": 20.786, "eval_steps_per_second": 2.598, "eval_wer": 0.33660068919146074, "step": 6300 }, { "epoch": 1.11, "eval_loss": Infinity, "eval_runtime": 541.5435, "eval_samples_per_second": 20.813, "eval_steps_per_second": 2.602, "eval_wer": 0.3417906370818625, "step": 6400 }, { "epoch": 1.12, "learning_rate": 0.0002791360315435463, "loss": 0.2773, "step": 6500 }, { "epoch": 1.12, "eval_loss": Infinity, "eval_runtime": 543.2211, "eval_samples_per_second": 20.748, "eval_steps_per_second": 2.594, "eval_wer": 0.3393427466801143, "step": 6500 }, { "epoch": 1.14, "eval_loss": Infinity, "eval_runtime": 540.5493, "eval_samples_per_second": 20.851, "eval_steps_per_second": 2.607, "eval_wer": 0.34255757270129433, "step": 6600 }, { "epoch": 1.16, "eval_loss": Infinity, "eval_runtime": 545.9558, "eval_samples_per_second": 20.645, "eval_steps_per_second": 2.581, "eval_wer": 0.33338586317028074, "step": 6700 }, { "epoch": 1.18, "eval_loss": Infinity, "eval_runtime": 540.5178, "eval_samples_per_second": 20.852, "eval_steps_per_second": 2.607, "eval_wer": 0.3470121028744327, "step": 6800 }, { "epoch": 1.19, "eval_loss": Infinity, "eval_runtime": 541.1405, "eval_samples_per_second": 20.828, "eval_steps_per_second": 2.604, "eval_wer": 0.3309905026054799, "step": 6900 }, { "epoch": 1.21, "learning_rate": 0.00027739649773860604, "loss": 0.2777, "step": 7000 }, { "epoch": 1.21, "eval_loss": Infinity, "eval_runtime": 545.61, "eval_samples_per_second": 20.658, "eval_steps_per_second": 2.582, "eval_wer": 0.33262943351823837, "step": 7000 }, { "epoch": 1.23, "eval_loss": Infinity, "eval_runtime": 540.9626, "eval_samples_per_second": 20.835, "eval_steps_per_second": 2.605, "eval_wer": 0.3390695915279879, "step": 7100 }, { "epoch": 1.25, "eval_loss": Infinity, "eval_runtime": 541.732, "eval_samples_per_second": 20.805, "eval_steps_per_second": 2.601, "eval_wer": 0.345940494200706, "step": 7200 }, { "epoch": 1.26, "eval_loss": Infinity, "eval_runtime": 543.292, "eval_samples_per_second": 20.746, "eval_steps_per_second": 2.593, "eval_wer": 0.32880526138846866, "step": 7300 }, { "epoch": 1.28, "eval_loss": Infinity, "eval_runtime": 541.9911, "eval_samples_per_second": 20.796, "eval_steps_per_second": 2.6, "eval_wer": 0.3483883846024542, "step": 7400 }, { "epoch": 1.3, "learning_rate": 0.00027565696393366573, "loss": 0.2775, "step": 7500 }, { "epoch": 1.3, "eval_loss": Infinity, "eval_runtime": 542.1379, "eval_samples_per_second": 20.79, "eval_steps_per_second": 2.599, "eval_wer": 0.33937426458228276, "step": 7500 }, { "epoch": 1.31, "eval_loss": Infinity, "eval_runtime": 543.314, "eval_samples_per_second": 20.745, "eval_steps_per_second": 2.593, "eval_wer": 0.336253992267608, "step": 7600 }, { "epoch": 1.33, "eval_loss": Infinity, "eval_runtime": 543.9348, "eval_samples_per_second": 20.721, "eval_steps_per_second": 2.59, "eval_wer": 0.3464132627332325, "step": 7700 }, { "epoch": 1.35, "eval_loss": Infinity, "eval_runtime": 541.7191, "eval_samples_per_second": 20.806, "eval_steps_per_second": 2.601, "eval_wer": 0.3530110102538242, "step": 7800 }, { "epoch": 1.37, "eval_loss": Infinity, "eval_runtime": 543.1641, "eval_samples_per_second": 20.751, "eval_steps_per_second": 2.594, "eval_wer": 0.33844973945200874, "step": 7900 }, { "epoch": 1.38, "learning_rate": 0.0002739174301287255, "loss": 0.2833, "step": 8000 }, { "epoch": 1.38, "eval_loss": Infinity, "eval_runtime": 543.1917, "eval_samples_per_second": 20.75, "eval_steps_per_second": 2.594, "eval_wer": 0.3380925365607665, "step": 8000 }, { "epoch": 1.4, "eval_loss": Infinity, "eval_runtime": 541.3015, "eval_samples_per_second": 20.822, "eval_steps_per_second": 2.603, "eval_wer": 0.3407610522776937, "step": 8100 }, { "epoch": 1.42, "eval_loss": Infinity, "eval_runtime": 540.4975, "eval_samples_per_second": 20.853, "eval_steps_per_second": 2.607, "eval_wer": 0.33338586317028074, "step": 8200 }, { "epoch": 1.44, "eval_loss": Infinity, "eval_runtime": 541.3309, "eval_samples_per_second": 20.821, "eval_steps_per_second": 2.603, "eval_wer": 0.3391116153975458, "step": 8300 }, { "epoch": 1.45, "eval_loss": Infinity, "eval_runtime": 540.5391, "eval_samples_per_second": 20.851, "eval_steps_per_second": 2.607, "eval_wer": 0.330486216170785, "step": 8400 }, { "epoch": 1.47, "learning_rate": 0.00027217789632378523, "loss": 0.2793, "step": 8500 }, { "epoch": 1.47, "eval_loss": Infinity, "eval_runtime": 543.2054, "eval_samples_per_second": 20.749, "eval_steps_per_second": 2.594, "eval_wer": 0.3472222222222222, "step": 8500 }, { "epoch": 1.49, "eval_loss": Infinity, "eval_runtime": 542.7471, "eval_samples_per_second": 20.767, "eval_steps_per_second": 2.596, "eval_wer": 0.32446629685661454, "step": 8600 }, { "epoch": 1.5, "eval_loss": Infinity, "eval_runtime": 543.1292, "eval_samples_per_second": 20.752, "eval_steps_per_second": 2.594, "eval_wer": 0.3266095142040679, "step": 8700 }, { "epoch": 1.52, "eval_loss": Infinity, "eval_runtime": 554.6022, "eval_samples_per_second": 20.323, "eval_steps_per_second": 2.541, "eval_wer": 0.32360480753067744, "step": 8800 }, { "epoch": 1.54, "eval_loss": Infinity, "eval_runtime": 541.8471, "eval_samples_per_second": 20.801, "eval_steps_per_second": 2.6, "eval_wer": 0.32525424441082534, "step": 8900 }, { "epoch": 1.56, "learning_rate": 0.00027043836251884493, "loss": 0.2693, "step": 9000 }, { "epoch": 1.56, "eval_loss": Infinity, "eval_runtime": 541.1695, "eval_samples_per_second": 20.827, "eval_steps_per_second": 2.604, "eval_wer": 0.3280593377038158, "step": 9000 }, { "epoch": 1.57, "eval_loss": Infinity, "eval_runtime": 542.036, "eval_samples_per_second": 20.794, "eval_steps_per_second": 2.599, "eval_wer": 0.32761808707345774, "step": 9100 }, { "epoch": 1.59, "eval_loss": Infinity, "eval_runtime": 543.8181, "eval_samples_per_second": 20.726, "eval_steps_per_second": 2.591, "eval_wer": 0.34042486132123045, "step": 9200 }, { "epoch": 1.61, "eval_loss": Infinity, "eval_runtime": 545.4298, "eval_samples_per_second": 20.664, "eval_steps_per_second": 2.583, "eval_wer": 0.3477054967221382, "step": 9300 }, { "epoch": 1.63, "eval_loss": Infinity, "eval_runtime": 547.3255, "eval_samples_per_second": 20.593, "eval_steps_per_second": 2.574, "eval_wer": 0.32468692217179357, "step": 9400 }, { "epoch": 1.64, "learning_rate": 0.0002687023077815145, "loss": 0.2735, "step": 9500 }, { "epoch": 1.64, "eval_loss": Infinity, "eval_runtime": 546.7521, "eval_samples_per_second": 20.614, "eval_steps_per_second": 2.577, "eval_wer": 0.3282694570516053, "step": 9500 }, { "epoch": 1.66, "eval_loss": Infinity, "eval_runtime": 546.8572, "eval_samples_per_second": 20.61, "eval_steps_per_second": 2.577, "eval_wer": 0.32723987224743656, "step": 9600 }, { "epoch": 1.68, "eval_loss": Infinity, "eval_runtime": 542.4218, "eval_samples_per_second": 20.779, "eval_steps_per_second": 2.598, "eval_wer": 0.3346045553874601, "step": 9700 }, { "epoch": 1.69, "eval_loss": Infinity, "eval_runtime": 543.0577, "eval_samples_per_second": 20.755, "eval_steps_per_second": 2.595, "eval_wer": 0.34167507144057824, "step": 9800 }, { "epoch": 1.71, "eval_loss": Infinity, "eval_runtime": 543.4435, "eval_samples_per_second": 20.74, "eval_steps_per_second": 2.593, "eval_wer": 0.3227748361069087, "step": 9900 }, { "epoch": 1.73, "learning_rate": 0.0002669627739765743, "loss": 0.27, "step": 10000 }, { "epoch": 1.73, "eval_loss": Infinity, "eval_runtime": 543.9959, "eval_samples_per_second": 20.719, "eval_steps_per_second": 2.59, "eval_wer": 0.3264204067910573, "step": 10000 }, { "epoch": 1.75, "eval_loss": Infinity, "eval_runtime": 541.6787, "eval_samples_per_second": 20.808, "eval_steps_per_second": 2.601, "eval_wer": 0.3197281055639603, "step": 10100 }, { "epoch": 1.76, "eval_loss": Infinity, "eval_runtime": 544.3682, "eval_samples_per_second": 20.705, "eval_steps_per_second": 2.588, "eval_wer": 0.3207156664985712, "step": 10200 }, { "epoch": 1.78, "eval_loss": Infinity, "eval_runtime": 541.8579, "eval_samples_per_second": 20.801, "eval_steps_per_second": 2.6, "eval_wer": 0.3160510169776433, "step": 10300 }, { "epoch": 1.8, "eval_loss": Infinity, "eval_runtime": 542.4905, "eval_samples_per_second": 20.776, "eval_steps_per_second": 2.597, "eval_wer": 0.30929567994620943, "step": 10400 }, { "epoch": 1.82, "learning_rate": 0.00026522324017163397, "loss": 0.2632, "step": 10500 }, { "epoch": 1.82, "eval_loss": Infinity, "eval_runtime": 543.1131, "eval_samples_per_second": 20.753, "eval_steps_per_second": 2.594, "eval_wer": 0.32033745167255, "step": 10500 }, { "epoch": 1.83, "eval_loss": Infinity, "eval_runtime": 543.354, "eval_samples_per_second": 20.743, "eval_steps_per_second": 2.593, "eval_wer": 0.31596696923852746, "step": 10600 }, { "epoch": 1.85, "eval_loss": Infinity, "eval_runtime": 543.51, "eval_samples_per_second": 20.737, "eval_steps_per_second": 2.592, "eval_wer": 0.31722768532526474, "step": 10700 }, { "epoch": 1.87, "eval_loss": Infinity, "eval_runtime": 543.0833, "eval_samples_per_second": 20.754, "eval_steps_per_second": 2.594, "eval_wer": 0.3213040006723819, "step": 10800 }, { "epoch": 1.89, "eval_loss": Infinity, "eval_runtime": 545.9727, "eval_samples_per_second": 20.644, "eval_steps_per_second": 2.581, "eval_wer": 0.3135611027063372, "step": 10900 }, { "epoch": 1.9, "learning_rate": 0.0002634871854343036, "loss": 0.2615, "step": 11000 }, { "epoch": 1.9, "eval_loss": Infinity, "eval_runtime": 543.6394, "eval_samples_per_second": 20.732, "eval_steps_per_second": 2.592, "eval_wer": 0.31185913598924186, "step": 11000 }, { "epoch": 1.92, "eval_loss": Infinity, "eval_runtime": 546.0573, "eval_samples_per_second": 20.641, "eval_steps_per_second": 2.58, "eval_wer": 0.3111552361741469, "step": 11100 }, { "epoch": 1.94, "eval_loss": Infinity, "eval_runtime": 544.569, "eval_samples_per_second": 20.697, "eval_steps_per_second": 2.587, "eval_wer": 0.33042318036644813, "step": 11200 }, { "epoch": 1.95, "eval_loss": Infinity, "eval_runtime": 545.5464, "eval_samples_per_second": 20.66, "eval_steps_per_second": 2.583, "eval_wer": 0.31183812405446293, "step": 11300 }, { "epoch": 1.97, "eval_loss": Infinity, "eval_runtime": 543.6903, "eval_samples_per_second": 20.731, "eval_steps_per_second": 2.592, "eval_wer": 0.3163767019667171, "step": 11400 }, { "epoch": 1.99, "learning_rate": 0.0002617476516293633, "loss": 0.2665, "step": 11500 }, { "epoch": 1.99, "eval_loss": Infinity, "eval_runtime": 543.0226, "eval_samples_per_second": 20.756, "eval_steps_per_second": 2.595, "eval_wer": 0.31048285426122035, "step": 11500 }, { "epoch": 2.01, "eval_loss": Infinity, "eval_runtime": 543.9768, "eval_samples_per_second": 20.72, "eval_steps_per_second": 2.59, "eval_wer": 0.29904185577407966, "step": 11600 }, { "epoch": 2.02, "eval_loss": Infinity, "eval_runtime": 544.806, "eval_samples_per_second": 20.688, "eval_steps_per_second": 2.586, "eval_wer": 0.3090855605984199, "step": 11700 }, { "epoch": 2.04, "eval_loss": Infinity, "eval_runtime": 541.7677, "eval_samples_per_second": 20.804, "eval_steps_per_second": 2.601, "eval_wer": 0.29954614220877457, "step": 11800 }, { "epoch": 2.06, "eval_loss": Infinity, "eval_runtime": 543.1744, "eval_samples_per_second": 20.75, "eval_steps_per_second": 2.594, "eval_wer": 0.30464153639267105, "step": 11900 }, { "epoch": 2.08, "learning_rate": 0.000260008117824423, "loss": 0.2272, "step": 12000 }, { "epoch": 2.08, "eval_loss": Infinity, "eval_runtime": 541.7916, "eval_samples_per_second": 20.803, "eval_steps_per_second": 2.601, "eval_wer": 0.31607202891242225, "step": 12000 }, { "epoch": 2.09, "eval_loss": Infinity, "eval_runtime": 544.0285, "eval_samples_per_second": 20.718, "eval_steps_per_second": 2.59, "eval_wer": 0.31450663977139015, "step": 12100 }, { "epoch": 2.11, "eval_loss": Infinity, "eval_runtime": 541.9109, "eval_samples_per_second": 20.799, "eval_steps_per_second": 2.6, "eval_wer": 0.3083816607833249, "step": 12200 }, { "epoch": 2.13, "eval_loss": Infinity, "eval_runtime": 541.3453, "eval_samples_per_second": 20.82, "eval_steps_per_second": 2.603, "eval_wer": 0.3082030593377038, "step": 12300 }, { "epoch": 2.14, "eval_loss": Infinity, "eval_runtime": 542.8224, "eval_samples_per_second": 20.764, "eval_steps_per_second": 2.596, "eval_wer": 0.3013531685997647, "step": 12400 }, { "epoch": 2.16, "learning_rate": 0.00025826858401948276, "loss": 0.2235, "step": 12500 }, { "epoch": 2.16, "eval_loss": Infinity, "eval_runtime": 544.2628, "eval_samples_per_second": 20.709, "eval_steps_per_second": 2.589, "eval_wer": 0.3140233652714742, "step": 12500 }, { "epoch": 2.18, "eval_loss": Infinity, "eval_runtime": 544.0918, "eval_samples_per_second": 20.715, "eval_steps_per_second": 2.59, "eval_wer": 0.30928517397882, "step": 12600 }, { "epoch": 2.2, "eval_loss": Infinity, "eval_runtime": 542.7651, "eval_samples_per_second": 20.766, "eval_steps_per_second": 2.596, "eval_wer": 0.3025403429147756, "step": 12700 }, { "epoch": 2.21, "eval_loss": Infinity, "eval_runtime": 543.9574, "eval_samples_per_second": 20.72, "eval_steps_per_second": 2.59, "eval_wer": 0.3109451168263574, "step": 12800 }, { "epoch": 2.23, "eval_loss": Infinity, "eval_runtime": 544.6133, "eval_samples_per_second": 20.695, "eval_steps_per_second": 2.587, "eval_wer": 0.29886325432845856, "step": 12900 }, { "epoch": 2.25, "learning_rate": 0.0002565290502145425, "loss": 0.2287, "step": 13000 }, { "epoch": 2.25, "eval_loss": Infinity, "eval_runtime": 542.6763, "eval_samples_per_second": 20.769, "eval_steps_per_second": 2.596, "eval_wer": 0.3071209446965877, "step": 13000 }, { "epoch": 2.27, "eval_loss": Infinity, "eval_runtime": 544.2325, "eval_samples_per_second": 20.71, "eval_steps_per_second": 2.589, "eval_wer": 0.31163851067406284, "step": 13100 }, { "epoch": 2.28, "eval_loss": Infinity, "eval_runtime": 544.5274, "eval_samples_per_second": 20.699, "eval_steps_per_second": 2.588, "eval_wer": 0.30776180870734576, "step": 13200 }, { "epoch": 2.3, "eval_loss": Infinity, "eval_runtime": 544.8554, "eval_samples_per_second": 20.686, "eval_steps_per_second": 2.586, "eval_wer": 0.30717347453353505, "step": 13300 }, { "epoch": 2.32, "eval_loss": Infinity, "eval_runtime": 544.5413, "eval_samples_per_second": 20.698, "eval_steps_per_second": 2.587, "eval_wer": 0.3042423096318709, "step": 13400 }, { "epoch": 2.33, "learning_rate": 0.00025479299547721205, "loss": 0.2343, "step": 13500 }, { "epoch": 2.33, "eval_loss": Infinity, "eval_runtime": 541.9379, "eval_samples_per_second": 20.798, "eval_steps_per_second": 2.6, "eval_wer": 0.2993675407631535, "step": 13500 }, { "epoch": 2.35, "eval_loss": Infinity, "eval_runtime": 544.0455, "eval_samples_per_second": 20.717, "eval_steps_per_second": 2.59, "eval_wer": 0.3025823667843335, "step": 13600 }, { "epoch": 2.37, "eval_loss": Infinity, "eval_runtime": 542.9108, "eval_samples_per_second": 20.76, "eval_steps_per_second": 2.595, "eval_wer": 0.307215498403093, "step": 13700 }, { "epoch": 2.39, "eval_loss": Infinity, "eval_runtime": 542.1131, "eval_samples_per_second": 20.791, "eval_steps_per_second": 2.599, "eval_wer": 0.31030425281559926, "step": 13800 }, { "epoch": 2.4, "eval_loss": Infinity, "eval_runtime": 543.103, "eval_samples_per_second": 20.753, "eval_steps_per_second": 2.594, "eval_wer": 0.3074781475878299, "step": 13900 }, { "epoch": 2.42, "learning_rate": 0.0002530534616722718, "loss": 0.2255, "step": 14000 }, { "epoch": 2.42, "eval_loss": Infinity, "eval_runtime": 541.4673, "eval_samples_per_second": 20.816, "eval_steps_per_second": 2.602, "eval_wer": 0.3033072785342074, "step": 14000 }, { "epoch": 2.44, "eval_loss": Infinity, "eval_runtime": 544.3551, "eval_samples_per_second": 20.705, "eval_steps_per_second": 2.588, "eval_wer": 0.301668347621449, "step": 14100 }, { "epoch": 2.46, "eval_loss": Infinity, "eval_runtime": 543.9092, "eval_samples_per_second": 20.722, "eval_steps_per_second": 2.591, "eval_wer": 0.3094742813918306, "step": 14200 }, { "epoch": 2.47, "eval_loss": Infinity, "eval_runtime": 543.9507, "eval_samples_per_second": 20.721, "eval_steps_per_second": 2.59, "eval_wer": 0.3030026054799126, "step": 14300 }, { "epoch": 2.49, "eval_loss": Infinity, "eval_runtime": 548.8025, "eval_samples_per_second": 20.537, "eval_steps_per_second": 2.567, "eval_wer": 0.29882123045890063, "step": 14400 }, { "epoch": 2.51, "learning_rate": 0.00025131392786733155, "loss": 0.2266, "step": 14500 }, { "epoch": 2.51, "eval_loss": Infinity, "eval_runtime": 542.8924, "eval_samples_per_second": 20.761, "eval_steps_per_second": 2.595, "eval_wer": 0.3069633551857455, "step": 14500 }, { "epoch": 2.53, "eval_loss": Infinity, "eval_runtime": 544.5732, "eval_samples_per_second": 20.697, "eval_steps_per_second": 2.587, "eval_wer": 0.29389393175323586, "step": 14600 }, { "epoch": 2.54, "eval_loss": Infinity, "eval_runtime": 548.0549, "eval_samples_per_second": 20.565, "eval_steps_per_second": 2.571, "eval_wer": 0.30245629517565975, "step": 14700 }, { "epoch": 2.56, "eval_loss": Infinity, "eval_runtime": 546.5456, "eval_samples_per_second": 20.622, "eval_steps_per_second": 2.578, "eval_wer": 0.305366448142545, "step": 14800 }, { "epoch": 2.58, "eval_loss": Infinity, "eval_runtime": 542.2527, "eval_samples_per_second": 20.786, "eval_steps_per_second": 2.598, "eval_wer": 0.30794041015296686, "step": 14900 }, { "epoch": 2.59, "learning_rate": 0.00024957439406239124, "loss": 0.2298, "step": 15000 }, { "epoch": 2.59, "eval_loss": Infinity, "eval_runtime": 541.872, "eval_samples_per_second": 20.8, "eval_steps_per_second": 2.6, "eval_wer": 0.2883362750042024, "step": 15000 }, { "epoch": 2.61, "eval_loss": Infinity, "eval_runtime": 542.3187, "eval_samples_per_second": 20.783, "eval_steps_per_second": 2.598, "eval_wer": 0.2941250630358043, "step": 15100 }, { "epoch": 2.63, "eval_loss": Infinity, "eval_runtime": 542.164, "eval_samples_per_second": 20.789, "eval_steps_per_second": 2.599, "eval_wer": 0.2994515885022693, "step": 15200 }, { "epoch": 2.65, "eval_loss": Infinity, "eval_runtime": 543.4743, "eval_samples_per_second": 20.739, "eval_steps_per_second": 2.593, "eval_wer": 0.3017523953605648, "step": 15300 }, { "epoch": 2.66, "eval_loss": Infinity, "eval_runtime": 544.8229, "eval_samples_per_second": 20.687, "eval_steps_per_second": 2.586, "eval_wer": 0.30269793242561777, "step": 15400 }, { "epoch": 2.68, "learning_rate": 0.000247834860257451, "loss": 0.2269, "step": 15500 }, { "epoch": 2.68, "eval_loss": Infinity, "eval_runtime": 541.6192, "eval_samples_per_second": 20.81, "eval_steps_per_second": 2.601, "eval_wer": 0.294051521264078, "step": 15500 }, { "epoch": 2.7, "eval_loss": Infinity, "eval_runtime": 543.4863, "eval_samples_per_second": 20.738, "eval_steps_per_second": 2.593, "eval_wer": 0.2966254832744999, "step": 15600 }, { "epoch": 2.72, "eval_loss": Infinity, "eval_runtime": 543.1533, "eval_samples_per_second": 20.751, "eval_steps_per_second": 2.594, "eval_wer": 0.29043746848209784, "step": 15700 }, { "epoch": 2.73, "eval_loss": Infinity, "eval_runtime": 545.1777, "eval_samples_per_second": 20.674, "eval_steps_per_second": 2.584, "eval_wer": 0.2978336695242898, "step": 15800 }, { "epoch": 2.75, "eval_loss": Infinity, "eval_runtime": 542.6934, "eval_samples_per_second": 20.769, "eval_steps_per_second": 2.596, "eval_wer": 0.28683392166750715, "step": 15900 }, { "epoch": 2.77, "learning_rate": 0.0002460988055201206, "loss": 0.2222, "step": 16000 }, { "epoch": 2.77, "eval_loss": Infinity, "eval_runtime": 541.9593, "eval_samples_per_second": 20.797, "eval_steps_per_second": 2.6, "eval_wer": 0.3007858463607329, "step": 16000 }, { "epoch": 2.78, "eval_loss": Infinity, "eval_runtime": 544.4119, "eval_samples_per_second": 20.703, "eval_steps_per_second": 2.588, "eval_wer": 0.2976235501765003, "step": 16100 }, { "epoch": 2.8, "eval_loss": Infinity, "eval_runtime": 542.8691, "eval_samples_per_second": 20.762, "eval_steps_per_second": 2.595, "eval_wer": 0.29393595562279373, "step": 16200 }, { "epoch": 2.82, "eval_loss": Infinity, "eval_runtime": 543.4284, "eval_samples_per_second": 20.741, "eval_steps_per_second": 2.593, "eval_wer": 0.2976970919482266, "step": 16300 }, { "epoch": 2.84, "eval_loss": Infinity, "eval_runtime": 540.9365, "eval_samples_per_second": 20.836, "eval_steps_per_second": 2.605, "eval_wer": 0.2913724995797613, "step": 16400 }, { "epoch": 2.85, "learning_rate": 0.0002443592717151803, "loss": 0.2336, "step": 16500 }, { "epoch": 2.85, "eval_loss": Infinity, "eval_runtime": 542.3035, "eval_samples_per_second": 20.784, "eval_steps_per_second": 2.598, "eval_wer": 0.2862981173306438, "step": 16500 }, { "epoch": 2.87, "eval_loss": Infinity, "eval_runtime": 540.4767, "eval_samples_per_second": 20.854, "eval_steps_per_second": 2.607, "eval_wer": 0.29223398890569846, "step": 16600 }, { "epoch": 2.89, "eval_loss": Infinity, "eval_runtime": 544.1303, "eval_samples_per_second": 20.714, "eval_steps_per_second": 2.589, "eval_wer": 0.29320053790553036, "step": 16700 }, { "epoch": 2.91, "eval_loss": Infinity, "eval_runtime": 544.5968, "eval_samples_per_second": 20.696, "eval_steps_per_second": 2.587, "eval_wer": 0.2959741132963523, "step": 16800 }, { "epoch": 2.92, "eval_loss": Infinity, "eval_runtime": 544.104, "eval_samples_per_second": 20.715, "eval_steps_per_second": 2.59, "eval_wer": 0.2904059505799294, "step": 16900 }, { "epoch": 2.94, "learning_rate": 0.00024261973791024004, "loss": 0.2275, "step": 17000 }, { "epoch": 2.94, "eval_loss": Infinity, "eval_runtime": 549.5031, "eval_samples_per_second": 20.511, "eval_steps_per_second": 2.564, "eval_wer": 0.29583753572028915, "step": 17000 }, { "epoch": 2.96, "eval_loss": Infinity, "eval_runtime": 550.5262, "eval_samples_per_second": 20.473, "eval_steps_per_second": 2.559, "eval_wer": 0.29877920658934276, "step": 17100 }, { "epoch": 2.97, "eval_loss": Infinity, "eval_runtime": 545.837, "eval_samples_per_second": 20.649, "eval_steps_per_second": 2.581, "eval_wer": 0.2908787191124559, "step": 17200 }, { "epoch": 2.99, "eval_loss": Infinity, "eval_runtime": 542.7983, "eval_samples_per_second": 20.765, "eval_steps_per_second": 2.596, "eval_wer": 0.30473609009917635, "step": 17300 }, { "epoch": 3.01, "eval_loss": Infinity, "eval_runtime": 542.8109, "eval_samples_per_second": 20.764, "eval_steps_per_second": 2.596, "eval_wer": 0.3058182047402925, "step": 17400 }, { "epoch": 3.03, "learning_rate": 0.00024088020410529976, "loss": 0.2208, "step": 17500 }, { "epoch": 3.03, "eval_loss": Infinity, "eval_runtime": 544.3135, "eval_samples_per_second": 20.707, "eval_steps_per_second": 2.589, "eval_wer": 0.2900172297865187, "step": 17500 }, { "epoch": 3.04, "eval_loss": Infinity, "eval_runtime": 544.1566, "eval_samples_per_second": 20.713, "eval_steps_per_second": 2.589, "eval_wer": 0.2941040511010254, "step": 17600 }, { "epoch": 3.06, "eval_loss": Infinity, "eval_runtime": 544.4905, "eval_samples_per_second": 20.7, "eval_steps_per_second": 2.588, "eval_wer": 0.28978609850395026, "step": 17700 }, { "epoch": 3.08, "eval_loss": Infinity, "eval_runtime": 542.4047, "eval_samples_per_second": 20.78, "eval_steps_per_second": 2.598, "eval_wer": 0.2869389813414019, "step": 17800 }, { "epoch": 3.1, "eval_loss": Infinity, "eval_runtime": 542.3956, "eval_samples_per_second": 20.78, "eval_steps_per_second": 2.598, "eval_wer": 0.3040847201210287, "step": 17900 }, { "epoch": 3.11, "learning_rate": 0.00023914067030035948, "loss": 0.192, "step": 18000 }, { "epoch": 3.11, "eval_loss": Infinity, "eval_runtime": 541.1082, "eval_samples_per_second": 20.829, "eval_steps_per_second": 2.604, "eval_wer": 0.29535426122037317, "step": 18000 }, { "epoch": 3.13, "eval_loss": Infinity, "eval_runtime": 543.6529, "eval_samples_per_second": 20.732, "eval_steps_per_second": 2.592, "eval_wer": 0.28465918641788535, "step": 18100 }, { "epoch": 3.15, "eval_loss": Infinity, "eval_runtime": 540.5467, "eval_samples_per_second": 20.851, "eval_steps_per_second": 2.607, "eval_wer": 0.2999873928391326, "step": 18200 }, { "epoch": 3.16, "eval_loss": Infinity, "eval_runtime": 541.4182, "eval_samples_per_second": 20.818, "eval_steps_per_second": 2.602, "eval_wer": 0.28889309127584467, "step": 18300 }, { "epoch": 3.18, "eval_loss": Infinity, "eval_runtime": 542.5022, "eval_samples_per_second": 20.776, "eval_steps_per_second": 2.597, "eval_wer": 0.2883677929063708, "step": 18400 }, { "epoch": 3.2, "learning_rate": 0.00023740113649541923, "loss": 0.1883, "step": 18500 }, { "epoch": 3.2, "eval_loss": Infinity, "eval_runtime": 544.1075, "eval_samples_per_second": 20.715, "eval_steps_per_second": 2.59, "eval_wer": 0.29573247604639435, "step": 18500 }, { "epoch": 3.22, "eval_loss": Infinity, "eval_runtime": 542.3164, "eval_samples_per_second": 20.783, "eval_steps_per_second": 2.598, "eval_wer": 0.28954446125399225, "step": 18600 }, { "epoch": 3.23, "eval_loss": Infinity, "eval_runtime": 543.3924, "eval_samples_per_second": 20.742, "eval_steps_per_second": 2.593, "eval_wer": 0.282978231635569, "step": 18700 }, { "epoch": 3.25, "eval_loss": Infinity, "eval_runtime": 542.6139, "eval_samples_per_second": 20.772, "eval_steps_per_second": 2.597, "eval_wer": 0.2868759455370651, "step": 18800 }, { "epoch": 3.27, "eval_loss": Infinity, "eval_runtime": 543.143, "eval_samples_per_second": 20.751, "eval_steps_per_second": 2.594, "eval_wer": 0.28079299041855776, "step": 18900 }, { "epoch": 3.29, "learning_rate": 0.00023566160269047892, "loss": 0.195, "step": 19000 }, { "epoch": 3.29, "eval_loss": Infinity, "eval_runtime": 542.4472, "eval_samples_per_second": 20.778, "eval_steps_per_second": 2.597, "eval_wer": 0.28243192133131617, "step": 19000 }, { "epoch": 3.3, "eval_loss": Infinity, "eval_runtime": 540.0992, "eval_samples_per_second": 20.868, "eval_steps_per_second": 2.609, "eval_wer": 0.29113086232980334, "step": 19100 }, { "epoch": 3.32, "eval_loss": Infinity, "eval_runtime": 542.3617, "eval_samples_per_second": 20.781, "eval_steps_per_second": 2.598, "eval_wer": 0.2887144898302236, "step": 19200 }, { "epoch": 3.34, "eval_loss": Infinity, "eval_runtime": 541.9599, "eval_samples_per_second": 20.797, "eval_steps_per_second": 2.6, "eval_wer": 0.28065641284249454, "step": 19300 }, { "epoch": 3.36, "eval_loss": Infinity, "eval_runtime": 544.4396, "eval_samples_per_second": 20.702, "eval_steps_per_second": 2.588, "eval_wer": 0.28173852748361067, "step": 19400 }, { "epoch": 3.37, "learning_rate": 0.00023392554795314855, "loss": 0.1917, "step": 19500 }, { "epoch": 3.37, "eval_loss": Infinity, "eval_runtime": 541.3966, "eval_samples_per_second": 20.818, "eval_steps_per_second": 2.603, "eval_wer": 0.29162464279710876, "step": 19500 }, { "epoch": 3.39, "eval_loss": Infinity, "eval_runtime": 541.7731, "eval_samples_per_second": 20.804, "eval_steps_per_second": 2.601, "eval_wer": 0.28613002185241215, "step": 19600 }, { "epoch": 3.41, "eval_loss": Infinity, "eval_runtime": 542.4733, "eval_samples_per_second": 20.777, "eval_steps_per_second": 2.597, "eval_wer": 0.2870545469826862, "step": 19700 }, { "epoch": 3.42, "eval_loss": Infinity, "eval_runtime": 541.7667, "eval_samples_per_second": 20.804, "eval_steps_per_second": 2.601, "eval_wer": 0.28756933938477053, "step": 19800 }, { "epoch": 3.44, "eval_loss": Infinity, "eval_runtime": 541.3431, "eval_samples_per_second": 20.82, "eval_steps_per_second": 2.603, "eval_wer": 0.28075096654899984, "step": 19900 }, { "epoch": 3.46, "learning_rate": 0.00023218601414820827, "loss": 0.1925, "step": 20000 }, { "epoch": 3.46, "eval_loss": Infinity, "eval_runtime": 541.8278, "eval_samples_per_second": 20.802, "eval_steps_per_second": 2.6, "eval_wer": 0.29112035636241385, "step": 20000 }, { "epoch": 3.48, "eval_loss": Infinity, "eval_runtime": 547.1285, "eval_samples_per_second": 20.6, "eval_steps_per_second": 2.575, "eval_wer": 0.2812237350815263, "step": 20100 }, { "epoch": 3.49, "eval_loss": Infinity, "eval_runtime": 541.0571, "eval_samples_per_second": 20.831, "eval_steps_per_second": 2.604, "eval_wer": 0.27968986384266264, "step": 20200 }, { "epoch": 3.51, "eval_loss": Infinity, "eval_runtime": 541.9172, "eval_samples_per_second": 20.798, "eval_steps_per_second": 2.6, "eval_wer": 0.282515969070432, "step": 20300 }, { "epoch": 3.53, "eval_loss": Infinity, "eval_runtime": 544.2103, "eval_samples_per_second": 20.711, "eval_steps_per_second": 2.589, "eval_wer": 0.2877479408303917, "step": 20400 }, { "epoch": 3.55, "learning_rate": 0.000230446480343268, "loss": 0.1952, "step": 20500 }, { "epoch": 3.55, "eval_loss": Infinity, "eval_runtime": 544.2822, "eval_samples_per_second": 20.708, "eval_steps_per_second": 2.589, "eval_wer": 0.2850058833417381, "step": 20500 }, { "epoch": 3.56, "eval_loss": Infinity, "eval_runtime": 540.3288, "eval_samples_per_second": 20.86, "eval_steps_per_second": 2.608, "eval_wer": 0.2826630526138847, "step": 20600 }, { "epoch": 3.58, "eval_loss": Infinity, "eval_runtime": 540.8405, "eval_samples_per_second": 20.84, "eval_steps_per_second": 2.605, "eval_wer": 0.2861195158850227, "step": 20700 }, { "epoch": 3.6, "eval_loss": Infinity, "eval_runtime": 543.3795, "eval_samples_per_second": 20.742, "eval_steps_per_second": 2.593, "eval_wer": 0.284344007396201, "step": 20800 }, { "epoch": 3.61, "eval_loss": Infinity, "eval_runtime": 542.5007, "eval_samples_per_second": 20.776, "eval_steps_per_second": 2.597, "eval_wer": 0.2957534879811733, "step": 20900 }, { "epoch": 3.63, "learning_rate": 0.00022870694653832769, "loss": 0.194, "step": 21000 }, { "epoch": 3.63, "eval_loss": Infinity, "eval_runtime": 541.5576, "eval_samples_per_second": 20.812, "eval_steps_per_second": 2.602, "eval_wer": 0.2867708858631703, "step": 21000 }, { "epoch": 3.65, "eval_loss": Infinity, "eval_runtime": 542.9935, "eval_samples_per_second": 20.757, "eval_steps_per_second": 2.595, "eval_wer": 0.2838082030593377, "step": 21100 }, { "epoch": 3.67, "eval_loss": Infinity, "eval_runtime": 541.3856, "eval_samples_per_second": 20.819, "eval_steps_per_second": 2.603, "eval_wer": 0.2771999495713565, "step": 21200 }, { "epoch": 3.68, "eval_loss": Infinity, "eval_runtime": 542.358, "eval_samples_per_second": 20.781, "eval_steps_per_second": 2.598, "eval_wer": 0.2796163220709363, "step": 21300 }, { "epoch": 3.7, "eval_loss": Infinity, "eval_runtime": 541.9323, "eval_samples_per_second": 20.798, "eval_steps_per_second": 2.6, "eval_wer": 0.27928013111447303, "step": 21400 }, { "epoch": 3.72, "learning_rate": 0.00022696741273338744, "loss": 0.1912, "step": 21500 }, { "epoch": 3.72, "eval_loss": Infinity, "eval_runtime": 542.4498, "eval_samples_per_second": 20.778, "eval_steps_per_second": 2.597, "eval_wer": 0.2811186754076315, "step": 21500 }, { "epoch": 3.74, "eval_loss": Infinity, "eval_runtime": 541.1622, "eval_samples_per_second": 20.827, "eval_steps_per_second": 2.604, "eval_wer": 0.27576063203899814, "step": 21600 }, { "epoch": 3.75, "eval_loss": Infinity, "eval_runtime": 544.4094, "eval_samples_per_second": 20.703, "eval_steps_per_second": 2.588, "eval_wer": 0.28317784501596904, "step": 21700 }, { "epoch": 3.77, "eval_loss": Infinity, "eval_runtime": 541.8456, "eval_samples_per_second": 20.801, "eval_steps_per_second": 2.6, "eval_wer": 0.2731131282568499, "step": 21800 }, { "epoch": 3.79, "eval_loss": Infinity, "eval_runtime": 541.5491, "eval_samples_per_second": 20.813, "eval_steps_per_second": 2.602, "eval_wer": 0.27668515716927217, "step": 21900 }, { "epoch": 3.8, "learning_rate": 0.00022522787892844716, "loss": 0.1966, "step": 22000 }, { "epoch": 3.8, "eval_loss": Infinity, "eval_runtime": 542.4841, "eval_samples_per_second": 20.777, "eval_steps_per_second": 2.597, "eval_wer": 0.27910152966885193, "step": 22000 }, { "epoch": 3.82, "eval_loss": Infinity, "eval_runtime": 545.5878, "eval_samples_per_second": 20.658, "eval_steps_per_second": 2.583, "eval_wer": 0.28655026054799126, "step": 22100 }, { "epoch": 3.84, "eval_loss": Infinity, "eval_runtime": 541.4456, "eval_samples_per_second": 20.816, "eval_steps_per_second": 2.602, "eval_wer": 0.28485879979828543, "step": 22200 }, { "epoch": 3.86, "eval_loss": Infinity, "eval_runtime": 541.8429, "eval_samples_per_second": 20.801, "eval_steps_per_second": 2.6, "eval_wer": 0.28729618423264414, "step": 22300 }, { "epoch": 3.87, "eval_loss": Infinity, "eval_runtime": 546.2903, "eval_samples_per_second": 20.632, "eval_steps_per_second": 2.579, "eval_wer": 0.28351403597243235, "step": 22400 }, { "epoch": 3.89, "learning_rate": 0.00022349182419111678, "loss": 0.1932, "step": 22500 }, { "epoch": 3.89, "eval_loss": Infinity, "eval_runtime": 544.9851, "eval_samples_per_second": 20.681, "eval_steps_per_second": 2.585, "eval_wer": 0.2781454866364095, "step": 22500 }, { "epoch": 3.91, "eval_loss": Infinity, "eval_runtime": 543.4194, "eval_samples_per_second": 20.741, "eval_steps_per_second": 2.593, "eval_wer": 0.27511976802824006, "step": 22600 }, { "epoch": 3.93, "eval_loss": Infinity, "eval_runtime": 542.5928, "eval_samples_per_second": 20.772, "eval_steps_per_second": 2.597, "eval_wer": 0.2871280887544125, "step": 22700 }, { "epoch": 3.94, "eval_loss": Infinity, "eval_runtime": 543.1769, "eval_samples_per_second": 20.75, "eval_steps_per_second": 2.594, "eval_wer": 0.2715162212136494, "step": 22800 }, { "epoch": 3.96, "eval_loss": Infinity, "eval_runtime": 542.7369, "eval_samples_per_second": 20.767, "eval_steps_per_second": 2.596, "eval_wer": 0.28232686165742144, "step": 22900 }, { "epoch": 3.98, "learning_rate": 0.00022175229038617648, "loss": 0.1928, "step": 23000 }, { "epoch": 3.98, "eval_loss": Infinity, "eval_runtime": 541.6129, "eval_samples_per_second": 20.81, "eval_steps_per_second": 2.601, "eval_wer": 0.28185409312489496, "step": 23000 }, { "epoch": 4.0, "eval_loss": Infinity, "eval_runtime": 541.322, "eval_samples_per_second": 20.821, "eval_steps_per_second": 2.603, "eval_wer": 0.27848167759287273, "step": 23100 }, { "epoch": 4.01, "eval_loss": Infinity, "eval_runtime": 543.2229, "eval_samples_per_second": 20.748, "eval_steps_per_second": 2.594, "eval_wer": 0.2746680114304925, "step": 23200 }, { "epoch": 4.03, "eval_loss": Infinity, "eval_runtime": 545.8357, "eval_samples_per_second": 20.649, "eval_steps_per_second": 2.581, "eval_wer": 0.27156875105059675, "step": 23300 }, { "epoch": 4.05, "eval_loss": Infinity, "eval_runtime": 543.6397, "eval_samples_per_second": 20.732, "eval_steps_per_second": 2.592, "eval_wer": 0.2673243402252479, "step": 23400 }, { "epoch": 4.06, "learning_rate": 0.0002200127565812362, "loss": 0.1651, "step": 23500 }, { "epoch": 4.06, "eval_loss": Infinity, "eval_runtime": 545.2541, "eval_samples_per_second": 20.671, "eval_steps_per_second": 2.584, "eval_wer": 0.2795637922339889, "step": 23500 }, { "epoch": 4.08, "eval_loss": Infinity, "eval_runtime": 541.1431, "eval_samples_per_second": 20.828, "eval_steps_per_second": 2.604, "eval_wer": 0.2786602790384939, "step": 23600 }, { "epoch": 4.1, "eval_loss": Infinity, "eval_runtime": 542.8901, "eval_samples_per_second": 20.761, "eval_steps_per_second": 2.595, "eval_wer": 0.2709488989746176, "step": 23700 }, { "epoch": 4.12, "eval_loss": Infinity, "eval_runtime": 541.6991, "eval_samples_per_second": 20.807, "eval_steps_per_second": 2.601, "eval_wer": 0.28349302403765336, "step": 23800 }, { "epoch": 4.13, "eval_loss": Infinity, "eval_runtime": 542.3686, "eval_samples_per_second": 20.781, "eval_steps_per_second": 2.598, "eval_wer": 0.27752563456043033, "step": 23900 }, { "epoch": 4.15, "learning_rate": 0.00021827322277629592, "loss": 0.1678, "step": 24000 }, { "epoch": 4.15, "eval_loss": Infinity, "eval_runtime": 543.089, "eval_samples_per_second": 20.754, "eval_steps_per_second": 2.594, "eval_wer": 0.27352286098503953, "step": 24000 }, { "epoch": 4.17, "eval_loss": Infinity, "eval_runtime": 545.6128, "eval_samples_per_second": 20.658, "eval_steps_per_second": 2.582, "eval_wer": 0.2738695579088922, "step": 24100 }, { "epoch": 4.19, "eval_loss": Infinity, "eval_runtime": 541.6932, "eval_samples_per_second": 20.807, "eval_steps_per_second": 2.601, "eval_wer": 0.2723041687678601, "step": 24200 }, { "epoch": 4.2, "eval_loss": Infinity, "eval_runtime": 543.1454, "eval_samples_per_second": 20.751, "eval_steps_per_second": 2.594, "eval_wer": 0.27206253151790216, "step": 24300 }, { "epoch": 4.22, "eval_loss": Infinity, "eval_runtime": 541.1009, "eval_samples_per_second": 20.83, "eval_steps_per_second": 2.604, "eval_wer": 0.2682698772903009, "step": 24400 }, { "epoch": 4.24, "learning_rate": 0.00021653716803896555, "loss": 0.1701, "step": 24500 }, { "epoch": 4.24, "eval_loss": Infinity, "eval_runtime": 547.7655, "eval_samples_per_second": 20.576, "eval_steps_per_second": 2.572, "eval_wer": 0.270539166246428, "step": 24500 }, { "epoch": 4.25, "eval_loss": Infinity, "eval_runtime": 546.8009, "eval_samples_per_second": 20.613, "eval_steps_per_second": 2.577, "eval_wer": 0.27438435031097663, "step": 24600 }, { "epoch": 4.27, "eval_loss": Infinity, "eval_runtime": 544.7395, "eval_samples_per_second": 20.691, "eval_steps_per_second": 2.587, "eval_wer": 0.2675029416708691, "step": 24700 }, { "epoch": 4.29, "eval_loss": Infinity, "eval_runtime": 541.3702, "eval_samples_per_second": 20.819, "eval_steps_per_second": 2.603, "eval_wer": 0.272125567322239, "step": 24800 }, { "epoch": 4.31, "eval_loss": Infinity, "eval_runtime": 541.2194, "eval_samples_per_second": 20.825, "eval_steps_per_second": 2.603, "eval_wer": 0.270055891746512, "step": 24900 }, { "epoch": 4.32, "learning_rate": 0.00021479763423402524, "loss": 0.1681, "step": 25000 }, { "epoch": 4.32, "eval_loss": Infinity, "eval_runtime": 543.6583, "eval_samples_per_second": 20.732, "eval_steps_per_second": 2.592, "eval_wer": 0.2697407127248277, "step": 25000 }, { "epoch": 4.34, "eval_loss": Infinity, "eval_runtime": 541.8047, "eval_samples_per_second": 20.803, "eval_steps_per_second": 2.601, "eval_wer": 0.26358421583459407, "step": 25100 }, { "epoch": 4.36, "eval_loss": Infinity, "eval_runtime": 542.7168, "eval_samples_per_second": 20.768, "eval_steps_per_second": 2.596, "eval_wer": 0.2710329467137334, "step": 25200 }, { "epoch": 4.38, "eval_loss": Infinity, "eval_runtime": 542.9637, "eval_samples_per_second": 20.758, "eval_steps_per_second": 2.595, "eval_wer": 0.2671982686165742, "step": 25300 }, { "epoch": 4.39, "eval_loss": Infinity, "eval_runtime": 544.2227, "eval_samples_per_second": 20.71, "eval_steps_per_second": 2.589, "eval_wer": 0.26634728525802653, "step": 25400 }, { "epoch": 4.41, "learning_rate": 0.00021306157949669486, "loss": 0.1686, "step": 25500 }, { "epoch": 4.41, "eval_loss": Infinity, "eval_runtime": 543.0802, "eval_samples_per_second": 20.754, "eval_steps_per_second": 2.594, "eval_wer": 0.2682173474533535, "step": 25500 }, { "epoch": 4.43, "eval_loss": Infinity, "eval_runtime": 542.2325, "eval_samples_per_second": 20.786, "eval_steps_per_second": 2.599, "eval_wer": 0.2665363926710371, "step": 25600 }, { "epoch": 4.44, "eval_loss": Infinity, "eval_runtime": 544.8929, "eval_samples_per_second": 20.685, "eval_steps_per_second": 2.586, "eval_wer": 0.2659480584972264, "step": 25700 }, { "epoch": 4.46, "eval_loss": Infinity, "eval_runtime": 544.4755, "eval_samples_per_second": 20.701, "eval_steps_per_second": 2.588, "eval_wer": 0.26376281728021517, "step": 25800 }, { "epoch": 4.48, "eval_loss": Infinity, "eval_runtime": 545.5151, "eval_samples_per_second": 20.661, "eval_steps_per_second": 2.583, "eval_wer": 0.2654437720625315, "step": 25900 }, { "epoch": 4.5, "learning_rate": 0.00021132204569175459, "loss": 0.1704, "step": 26000 }, { "epoch": 4.5, "eval_loss": Infinity, "eval_runtime": 544.8363, "eval_samples_per_second": 20.687, "eval_steps_per_second": 2.586, "eval_wer": 0.2693624978988065, "step": 26000 }, { "epoch": 4.51, "eval_loss": Infinity, "eval_runtime": 542.9637, "eval_samples_per_second": 20.758, "eval_steps_per_second": 2.595, "eval_wer": 0.2657379391494369, "step": 26100 }, { "epoch": 4.53, "eval_loss": Infinity, "eval_runtime": 542.0387, "eval_samples_per_second": 20.794, "eval_steps_per_second": 2.599, "eval_wer": 0.26736636409480585, "step": 26200 }, { "epoch": 4.55, "eval_loss": Infinity, "eval_runtime": 540.8149, "eval_samples_per_second": 20.841, "eval_steps_per_second": 2.605, "eval_wer": 0.27195747184400737, "step": 26300 }, { "epoch": 4.57, "eval_loss": Infinity, "eval_runtime": 543.2221, "eval_samples_per_second": 20.748, "eval_steps_per_second": 2.594, "eval_wer": 0.2743108085392503, "step": 26400 }, { "epoch": 4.58, "learning_rate": 0.00020958251188681434, "loss": 0.1646, "step": 26500 }, { "epoch": 4.58, "eval_loss": Infinity, "eval_runtime": 544.9463, "eval_samples_per_second": 20.683, "eval_steps_per_second": 2.586, "eval_wer": 0.27350184905026054, "step": 26500 }, { "epoch": 4.6, "eval_loss": Infinity, "eval_runtime": 544.3881, "eval_samples_per_second": 20.704, "eval_steps_per_second": 2.588, "eval_wer": 0.2658745167255001, "step": 26600 }, { "epoch": 4.62, "eval_loss": Infinity, "eval_runtime": 544.4068, "eval_samples_per_second": 20.703, "eval_steps_per_second": 2.588, "eval_wer": 0.26746091780131115, "step": 26700 }, { "epoch": 4.64, "eval_loss": Infinity, "eval_runtime": 543.2382, "eval_samples_per_second": 20.748, "eval_steps_per_second": 2.594, "eval_wer": 0.2743108085392503, "step": 26800 }, { "epoch": 4.65, "eval_loss": Infinity, "eval_runtime": 543.0733, "eval_samples_per_second": 20.754, "eval_steps_per_second": 2.594, "eval_wer": 0.2641725500084048, "step": 26900 }, { "epoch": 4.67, "learning_rate": 0.00020784297808187406, "loss": 0.1662, "step": 27000 }, { "epoch": 4.67, "eval_loss": Infinity, "eval_runtime": 542.9197, "eval_samples_per_second": 20.76, "eval_steps_per_second": 2.595, "eval_wer": 0.2652231467473525, "step": 27000 }, { "epoch": 4.69, "eval_loss": Infinity, "eval_runtime": 543.0343, "eval_samples_per_second": 20.756, "eval_steps_per_second": 2.595, "eval_wer": 0.26765002521432174, "step": 27100 }, { "epoch": 4.7, "eval_loss": Infinity, "eval_runtime": 543.1054, "eval_samples_per_second": 20.753, "eval_steps_per_second": 2.594, "eval_wer": 0.26988779626828036, "step": 27200 }, { "epoch": 4.72, "eval_loss": Infinity, "eval_runtime": 543.2158, "eval_samples_per_second": 20.749, "eval_steps_per_second": 2.594, "eval_wer": 0.26490796772566816, "step": 27300 }, { "epoch": 4.74, "eval_loss": Infinity, "eval_runtime": 542.913, "eval_samples_per_second": 20.76, "eval_steps_per_second": 2.595, "eval_wer": 0.26394141872583626, "step": 27400 }, { "epoch": 4.76, "learning_rate": 0.00020610344427693375, "loss": 0.1713, "step": 27500 }, { "epoch": 4.76, "eval_loss": Infinity, "eval_runtime": 543.0263, "eval_samples_per_second": 20.756, "eval_steps_per_second": 2.595, "eval_wer": 0.2634056143889729, "step": 27500 }, { "epoch": 4.77, "eval_loss": Infinity, "eval_runtime": 542.6947, "eval_samples_per_second": 20.769, "eval_steps_per_second": 2.596, "eval_wer": 0.26396243066061525, "step": 27600 }, { "epoch": 4.79, "eval_loss": Infinity, "eval_runtime": 553.6288, "eval_samples_per_second": 20.358, "eval_steps_per_second": 2.545, "eval_wer": 0.2604744494873088, "step": 27700 }, { "epoch": 4.81, "eval_loss": Infinity, "eval_runtime": 542.7462, "eval_samples_per_second": 20.767, "eval_steps_per_second": 2.596, "eval_wer": 0.25767986216170785, "step": 27800 }, { "epoch": 4.83, "eval_loss": Infinity, "eval_runtime": 543.1573, "eval_samples_per_second": 20.751, "eval_steps_per_second": 2.594, "eval_wer": 0.26473987224743656, "step": 27900 }, { "epoch": 4.84, "learning_rate": 0.00020436391047199347, "loss": 0.1674, "step": 28000 }, { "epoch": 4.84, "eval_loss": Infinity, "eval_runtime": 542.5497, "eval_samples_per_second": 20.774, "eval_steps_per_second": 2.597, "eval_wer": 0.2605164733568667, "step": 28000 }, { "epoch": 4.86, "eval_loss": Infinity, "eval_runtime": 542.4903, "eval_samples_per_second": 20.776, "eval_steps_per_second": 2.597, "eval_wer": 0.2551689359556228, "step": 28100 }, { "epoch": 4.88, "eval_loss": Infinity, "eval_runtime": 542.4923, "eval_samples_per_second": 20.776, "eval_steps_per_second": 2.597, "eval_wer": 0.2640254664649521, "step": 28200 }, { "epoch": 4.89, "eval_loss": Infinity, "eval_runtime": 543.3538, "eval_samples_per_second": 20.743, "eval_steps_per_second": 2.593, "eval_wer": 0.26158808203059336, "step": 28300 }, { "epoch": 4.91, "eval_loss": Infinity, "eval_runtime": 544.8688, "eval_samples_per_second": 20.686, "eval_steps_per_second": 2.586, "eval_wer": 0.2625021011934779, "step": 28400 }, { "epoch": 4.93, "learning_rate": 0.00020262437666705322, "loss": 0.1627, "step": 28500 }, { "epoch": 4.93, "eval_loss": Infinity, "eval_runtime": 545.1106, "eval_samples_per_second": 20.677, "eval_steps_per_second": 2.585, "eval_wer": 0.2595919482265927, "step": 28500 }, { "epoch": 4.95, "eval_loss": Infinity, "eval_runtime": 545.1809, "eval_samples_per_second": 20.674, "eval_steps_per_second": 2.584, "eval_wer": 0.2587724827702135, "step": 28600 }, { "epoch": 4.96, "eval_loss": Infinity, "eval_runtime": 543.2839, "eval_samples_per_second": 20.746, "eval_steps_per_second": 2.593, "eval_wer": 0.27188393007228107, "step": 28700 }, { "epoch": 4.98, "eval_loss": Infinity, "eval_runtime": 543.3434, "eval_samples_per_second": 20.744, "eval_steps_per_second": 2.593, "eval_wer": 0.26246007732391996, "step": 28800 }, { "epoch": 5.0, "eval_loss": Infinity, "eval_runtime": 544.0956, "eval_samples_per_second": 20.715, "eval_steps_per_second": 2.59, "eval_wer": 0.2631009413346781, "step": 28900 }, { "epoch": 5.02, "learning_rate": 0.00020088484286211295, "loss": 0.162, "step": 29000 }, { "epoch": 5.02, "eval_loss": Infinity, "eval_runtime": 543.4223, "eval_samples_per_second": 20.741, "eval_steps_per_second": 2.593, "eval_wer": 0.26189275508488824, "step": 29000 }, { "epoch": 5.03, "eval_loss": Infinity, "eval_runtime": 548.0793, "eval_samples_per_second": 20.565, "eval_steps_per_second": 2.571, "eval_wer": 0.25953941838964534, "step": 29100 }, { "epoch": 5.05, "eval_loss": Infinity, "eval_runtime": 548.6875, "eval_samples_per_second": 20.542, "eval_steps_per_second": 2.568, "eval_wer": 0.2667885358883846, "step": 29200 }, { "epoch": 5.07, "eval_loss": Infinity, "eval_runtime": 550.2049, "eval_samples_per_second": 20.485, "eval_steps_per_second": 2.561, "eval_wer": 0.26004370482434025, "step": 29300 }, { "epoch": 5.08, "eval_loss": Infinity, "eval_runtime": 542.8181, "eval_samples_per_second": 20.764, "eval_steps_per_second": 2.596, "eval_wer": 0.2608841822154984, "step": 29400 }, { "epoch": 5.1, "learning_rate": 0.00019914530905717264, "loss": 0.147, "step": 29500 }, { "epoch": 5.1, "eval_loss": Infinity, "eval_runtime": 543.4487, "eval_samples_per_second": 20.74, "eval_steps_per_second": 2.593, "eval_wer": 0.2654647839973105, "step": 29500 }, { "epoch": 5.12, "eval_loss": Infinity, "eval_runtime": 543.1438, "eval_samples_per_second": 20.751, "eval_steps_per_second": 2.594, "eval_wer": 0.2614515044545302, "step": 29600 }, { "epoch": 5.14, "eval_loss": Infinity, "eval_runtime": 547.647, "eval_samples_per_second": 20.581, "eval_steps_per_second": 2.573, "eval_wer": 0.26274373844343585, "step": 29700 }, { "epoch": 5.15, "eval_loss": Infinity, "eval_runtime": 544.3766, "eval_samples_per_second": 20.704, "eval_steps_per_second": 2.588, "eval_wer": 0.26189275508488824, "step": 29800 }, { "epoch": 5.17, "eval_loss": Infinity, "eval_runtime": 542.734, "eval_samples_per_second": 20.767, "eval_steps_per_second": 2.596, "eval_wer": 0.2622289460413515, "step": 29900 }, { "epoch": 5.19, "learning_rate": 0.0001974057752522324, "loss": 0.1441, "step": 30000 }, { "epoch": 5.19, "eval_loss": Infinity, "eval_runtime": 545.8282, "eval_samples_per_second": 20.649, "eval_steps_per_second": 2.581, "eval_wer": 0.25874096486804504, "step": 30000 }, { "epoch": 5.21, "eval_loss": Infinity, "eval_runtime": 542.7688, "eval_samples_per_second": 20.766, "eval_steps_per_second": 2.596, "eval_wer": 0.25953941838964534, "step": 30100 }, { "epoch": 5.22, "eval_loss": Infinity, "eval_runtime": 544.0516, "eval_samples_per_second": 20.717, "eval_steps_per_second": 2.59, "eval_wer": 0.2589090603462767, "step": 30200 }, { "epoch": 5.24, "eval_loss": Infinity, "eval_runtime": 541.9109, "eval_samples_per_second": 20.799, "eval_steps_per_second": 2.6, "eval_wer": 0.256912926542276, "step": 30300 }, { "epoch": 5.26, "eval_loss": Infinity, "eval_runtime": 542.1921, "eval_samples_per_second": 20.788, "eval_steps_per_second": 2.599, "eval_wer": 0.26571692721465795, "step": 30400 }, { "epoch": 5.27, "learning_rate": 0.0001956662414472921, "loss": 0.1446, "step": 30500 }, { "epoch": 5.27, "eval_loss": Infinity, "eval_runtime": 541.0843, "eval_samples_per_second": 20.83, "eval_steps_per_second": 2.604, "eval_wer": 0.2649499915952261, "step": 30500 }, { "epoch": 5.29, "eval_loss": Infinity, "eval_runtime": 542.2461, "eval_samples_per_second": 20.786, "eval_steps_per_second": 2.598, "eval_wer": 0.25893007228105563, "step": 30600 }, { "epoch": 5.31, "eval_loss": Infinity, "eval_runtime": 542.4141, "eval_samples_per_second": 20.779, "eval_steps_per_second": 2.598, "eval_wer": 0.255084888216507, "step": 30700 }, { "epoch": 5.33, "eval_loss": Infinity, "eval_runtime": 545.8125, "eval_samples_per_second": 20.65, "eval_steps_per_second": 2.581, "eval_wer": 0.2588565305093293, "step": 30800 }, { "epoch": 5.34, "eval_loss": Infinity, "eval_runtime": 542.3161, "eval_samples_per_second": 20.783, "eval_steps_per_second": 2.598, "eval_wer": 0.2544335182383594, "step": 30900 }, { "epoch": 5.36, "learning_rate": 0.00019392670764235183, "loss": 0.146, "step": 31000 }, { "epoch": 5.36, "eval_loss": Infinity, "eval_runtime": 543.7391, "eval_samples_per_second": 20.729, "eval_steps_per_second": 2.591, "eval_wer": 0.25232181879307447, "step": 31000 }, { "epoch": 5.38, "eval_loss": Infinity, "eval_runtime": 543.7175, "eval_samples_per_second": 20.73, "eval_steps_per_second": 2.591, "eval_wer": 0.2579845352160027, "step": 31100 }, { "epoch": 5.4, "eval_loss": Infinity, "eval_runtime": 545.4245, "eval_samples_per_second": 20.665, "eval_steps_per_second": 2.583, "eval_wer": 0.25971801983526643, "step": 31200 }, { "epoch": 5.41, "eval_loss": Infinity, "eval_runtime": 543.7184, "eval_samples_per_second": 20.729, "eval_steps_per_second": 2.591, "eval_wer": 0.2649499915952261, "step": 31300 }, { "epoch": 5.43, "eval_loss": Infinity, "eval_runtime": 544.3584, "eval_samples_per_second": 20.705, "eval_steps_per_second": 2.588, "eval_wer": 0.26140948058497226, "step": 31400 }, { "epoch": 5.45, "learning_rate": 0.00019218717383741156, "loss": 0.1512, "step": 31500 }, { "epoch": 5.45, "eval_loss": Infinity, "eval_runtime": 543.9248, "eval_samples_per_second": 20.722, "eval_steps_per_second": 2.59, "eval_wer": 0.2576588502269289, "step": 31500 }, { "epoch": 5.47, "eval_loss": Infinity, "eval_runtime": 543.2727, "eval_samples_per_second": 20.746, "eval_steps_per_second": 2.594, "eval_wer": 0.2623129937804673, "step": 31600 }, { "epoch": 5.48, "eval_loss": Infinity, "eval_runtime": 544.7565, "eval_samples_per_second": 20.69, "eval_steps_per_second": 2.586, "eval_wer": 0.25522146579257016, "step": 31700 }, { "epoch": 5.5, "eval_loss": Infinity, "eval_runtime": 542.465, "eval_samples_per_second": 20.777, "eval_steps_per_second": 2.597, "eval_wer": 0.2526264918473693, "step": 31800 }, { "epoch": 5.52, "eval_loss": Infinity, "eval_runtime": 541.8171, "eval_samples_per_second": 20.802, "eval_steps_per_second": 2.601, "eval_wer": 0.25689191460749705, "step": 31900 }, { "epoch": 5.53, "learning_rate": 0.0001904476400324713, "loss": 0.1489, "step": 32000 }, { "epoch": 5.53, "eval_loss": Infinity, "eval_runtime": 554.5484, "eval_samples_per_second": 20.325, "eval_steps_per_second": 2.541, "eval_wer": 0.2555681627164229, "step": 32000 }, { "epoch": 5.55, "eval_loss": Infinity, "eval_runtime": 541.0928, "eval_samples_per_second": 20.83, "eval_steps_per_second": 2.604, "eval_wer": 0.2576483442595394, "step": 32100 }, { "epoch": 5.57, "eval_loss": Infinity, "eval_runtime": 555.6973, "eval_samples_per_second": 20.283, "eval_steps_per_second": 2.536, "eval_wer": 0.2543389645318541, "step": 32200 }, { "epoch": 5.59, "eval_loss": Infinity, "eval_runtime": 541.7763, "eval_samples_per_second": 20.804, "eval_steps_per_second": 2.601, "eval_wer": 0.25343545133635903, "step": 32300 }, { "epoch": 5.6, "eval_loss": Infinity, "eval_runtime": 543.9041, "eval_samples_per_second": 20.722, "eval_steps_per_second": 2.591, "eval_wer": 0.25112413851067406, "step": 32400 }, { "epoch": 5.62, "learning_rate": 0.00018871158529514087, "loss": 0.1482, "step": 32500 }, { "epoch": 5.62, "eval_loss": Infinity, "eval_runtime": 542.0995, "eval_samples_per_second": 20.791, "eval_steps_per_second": 2.599, "eval_wer": 0.2581631366616238, "step": 32500 }, { "epoch": 5.64, "eval_loss": Infinity, "eval_runtime": 542.5978, "eval_samples_per_second": 20.772, "eval_steps_per_second": 2.597, "eval_wer": 0.2593923348461926, "step": 32600 }, { "epoch": 5.66, "eval_loss": Infinity, "eval_runtime": 542.1323, "eval_samples_per_second": 20.79, "eval_steps_per_second": 2.599, "eval_wer": 0.2545806017818121, "step": 32700 }, { "epoch": 5.67, "eval_loss": Infinity, "eval_runtime": 543.4344, "eval_samples_per_second": 20.74, "eval_steps_per_second": 2.593, "eval_wer": 0.24796184232644142, "step": 32800 }, { "epoch": 5.69, "eval_loss": Infinity, "eval_runtime": 543.5989, "eval_samples_per_second": 20.734, "eval_steps_per_second": 2.592, "eval_wer": 0.2610417717263406, "step": 32900 }, { "epoch": 5.71, "learning_rate": 0.00018697205149020062, "loss": 0.1379, "step": 33000 }, { "epoch": 5.71, "eval_loss": Infinity, "eval_runtime": 545.9938, "eval_samples_per_second": 20.643, "eval_steps_per_second": 2.581, "eval_wer": 0.2549798285426122, "step": 33000 }, { "epoch": 5.72, "eval_loss": Infinity, "eval_runtime": 542.7219, "eval_samples_per_second": 20.768, "eval_steps_per_second": 2.596, "eval_wer": 0.2584467977811397, "step": 33100 }, { "epoch": 5.74, "eval_loss": Infinity, "eval_runtime": 542.3547, "eval_samples_per_second": 20.782, "eval_steps_per_second": 2.598, "eval_wer": 0.2568603967053286, "step": 33200 }, { "epoch": 5.76, "eval_loss": Infinity, "eval_runtime": 542.4176, "eval_samples_per_second": 20.779, "eval_steps_per_second": 2.598, "eval_wer": 0.25814212472684483, "step": 33300 }, { "epoch": 5.78, "eval_loss": Infinity, "eval_runtime": 543.6528, "eval_samples_per_second": 20.732, "eval_steps_per_second": 2.592, "eval_wer": 0.26317448310640446, "step": 33400 }, { "epoch": 5.79, "learning_rate": 0.00018523599675287022, "loss": 0.1469, "step": 33500 }, { "epoch": 5.79, "eval_loss": Infinity, "eval_runtime": 543.1136, "eval_samples_per_second": 20.753, "eval_steps_per_second": 2.594, "eval_wer": 0.25725962346612874, "step": 33500 }, { "epoch": 5.81, "eval_loss": Infinity, "eval_runtime": 544.0134, "eval_samples_per_second": 20.718, "eval_steps_per_second": 2.59, "eval_wer": 0.25016809547823166, "step": 33600 }, { "epoch": 5.83, "eval_loss": Infinity, "eval_runtime": 544.855, "eval_samples_per_second": 20.686, "eval_steps_per_second": 2.586, "eval_wer": 0.25649268784669693, "step": 33700 }, { "epoch": 5.85, "eval_loss": Infinity, "eval_runtime": 545.0055, "eval_samples_per_second": 20.681, "eval_steps_per_second": 2.585, "eval_wer": 0.2574277189443604, "step": 33800 }, { "epoch": 5.86, "eval_loss": Infinity, "eval_runtime": 544.8939, "eval_samples_per_second": 20.685, "eval_steps_per_second": 2.586, "eval_wer": 0.25730164733568667, "step": 33900 }, { "epoch": 5.88, "learning_rate": 0.00018349646294792992, "loss": 0.1502, "step": 34000 }, { "epoch": 5.88, "eval_loss": Infinity, "eval_runtime": 542.1481, "eval_samples_per_second": 20.79, "eval_steps_per_second": 2.599, "eval_wer": 0.2602433182047403, "step": 34000 }, { "epoch": 5.9, "eval_loss": Infinity, "eval_runtime": 543.1924, "eval_samples_per_second": 20.75, "eval_steps_per_second": 2.594, "eval_wer": 0.24964279710875778, "step": 34100 }, { "epoch": 5.91, "eval_loss": Infinity, "eval_runtime": 544.5365, "eval_samples_per_second": 20.698, "eval_steps_per_second": 2.588, "eval_wer": 0.25418137502101196, "step": 34200 }, { "epoch": 5.93, "eval_loss": Infinity, "eval_runtime": 544.445, "eval_samples_per_second": 20.702, "eval_steps_per_second": 2.588, "eval_wer": 0.24754160363086233, "step": 34300 }, { "epoch": 5.95, "eval_loss": Infinity, "eval_runtime": 541.9528, "eval_samples_per_second": 20.797, "eval_steps_per_second": 2.6, "eval_wer": 0.24889687342410488, "step": 34400 }, { "epoch": 5.97, "learning_rate": 0.00018175692914298967, "loss": 0.1414, "step": 34500 }, { "epoch": 5.97, "eval_loss": Infinity, "eval_runtime": 546.9612, "eval_samples_per_second": 20.607, "eval_steps_per_second": 2.576, "eval_wer": 0.2520381576735586, "step": 34500 }, { "epoch": 5.98, "eval_loss": Infinity, "eval_runtime": 542.4137, "eval_samples_per_second": 20.779, "eval_steps_per_second": 2.598, "eval_wer": 0.248613212304589, "step": 34600 }, { "epoch": 6.0, "eval_loss": Infinity, "eval_runtime": 543.6113, "eval_samples_per_second": 20.734, "eval_steps_per_second": 2.592, "eval_wer": 0.2601592704656245, "step": 34700 }, { "epoch": 6.02, "eval_loss": Infinity, "eval_runtime": 544.1036, "eval_samples_per_second": 20.715, "eval_steps_per_second": 2.59, "eval_wer": 0.2517019667170953, "step": 34800 }, { "epoch": 6.04, "eval_loss": Infinity, "eval_runtime": 544.3655, "eval_samples_per_second": 20.705, "eval_steps_per_second": 2.588, "eval_wer": 0.2563771222054127, "step": 34900 }, { "epoch": 6.05, "learning_rate": 0.0001800173953380494, "loss": 0.1385, "step": 35000 }, { "epoch": 6.05, "eval_loss": Infinity, "eval_runtime": 545.9585, "eval_samples_per_second": 20.644, "eval_steps_per_second": 2.581, "eval_wer": 0.2500840477391158, "step": 35000 }, { "epoch": 6.07, "eval_loss": Infinity, "eval_runtime": 543.5683, "eval_samples_per_second": 20.735, "eval_steps_per_second": 2.592, "eval_wer": 0.24773071104387293, "step": 35100 }, { "epoch": 6.09, "eval_loss": Infinity, "eval_runtime": 543.8849, "eval_samples_per_second": 20.723, "eval_steps_per_second": 2.591, "eval_wer": 0.25002101193477894, "step": 35200 }, { "epoch": 6.11, "eval_loss": Infinity, "eval_runtime": 546.0856, "eval_samples_per_second": 20.64, "eval_steps_per_second": 2.58, "eval_wer": 0.2556627164229282, "step": 35300 }, { "epoch": 6.12, "eval_loss": Infinity, "eval_runtime": 545.6013, "eval_samples_per_second": 20.658, "eval_steps_per_second": 2.582, "eval_wer": 0.25199613380400065, "step": 35400 }, { "epoch": 6.14, "learning_rate": 0.000178281340600719, "loss": 0.1265, "step": 35500 }, { "epoch": 6.14, "eval_loss": Infinity, "eval_runtime": 544.0517, "eval_samples_per_second": 20.717, "eval_steps_per_second": 2.59, "eval_wer": 0.2567658429988233, "step": 35500 }, { "epoch": 6.16, "eval_loss": Infinity, "eval_runtime": 544.4823, "eval_samples_per_second": 20.7, "eval_steps_per_second": 2.588, "eval_wer": 0.24956925533703142, "step": 35600 }, { "epoch": 6.17, "eval_loss": Infinity, "eval_runtime": 544.9002, "eval_samples_per_second": 20.685, "eval_steps_per_second": 2.586, "eval_wer": 0.2563666162380232, "step": 35700 }, { "epoch": 6.19, "eval_loss": Infinity, "eval_runtime": 544.1075, "eval_samples_per_second": 20.715, "eval_steps_per_second": 2.59, "eval_wer": 0.2511871743150109, "step": 35800 }, { "epoch": 6.21, "eval_loss": Infinity, "eval_runtime": 542.1212, "eval_samples_per_second": 20.791, "eval_steps_per_second": 2.599, "eval_wer": 0.2511556564128425, "step": 35900 }, { "epoch": 6.23, "learning_rate": 0.0001765418067957787, "loss": 0.1267, "step": 36000 }, { "epoch": 6.23, "eval_loss": Infinity, "eval_runtime": 542.2556, "eval_samples_per_second": 20.785, "eval_steps_per_second": 2.598, "eval_wer": 0.2540237855101698, "step": 36000 }, { "epoch": 6.24, "eval_loss": Infinity, "eval_runtime": 555.6145, "eval_samples_per_second": 20.286, "eval_steps_per_second": 2.536, "eval_wer": 0.25, "step": 36100 }, { "epoch": 6.26, "eval_loss": Infinity, "eval_runtime": 545.544, "eval_samples_per_second": 20.66, "eval_steps_per_second": 2.583, "eval_wer": 0.25425491679273826, "step": 36200 }, { "epoch": 6.28, "eval_loss": Infinity, "eval_runtime": 544.7624, "eval_samples_per_second": 20.69, "eval_steps_per_second": 2.586, "eval_wer": 0.2606425449655404, "step": 36300 }, { "epoch": 6.3, "eval_loss": Infinity, "eval_runtime": 544.7203, "eval_samples_per_second": 20.691, "eval_steps_per_second": 2.587, "eval_wer": 0.2527630694234325, "step": 36400 }, { "epoch": 6.31, "learning_rate": 0.00017480227299083843, "loss": 0.1271, "step": 36500 }, { "epoch": 6.31, "eval_loss": Infinity, "eval_runtime": 545.2904, "eval_samples_per_second": 20.67, "eval_steps_per_second": 2.584, "eval_wer": 0.2536035468145907, "step": 36500 }, { "epoch": 6.33, "eval_loss": Infinity, "eval_runtime": 545.8896, "eval_samples_per_second": 20.647, "eval_steps_per_second": 2.581, "eval_wer": 0.2473209783156833, "step": 36600 }, { "epoch": 6.35, "eval_loss": Infinity, "eval_runtime": 546.4085, "eval_samples_per_second": 20.627, "eval_steps_per_second": 2.579, "eval_wer": 0.25052529836947385, "step": 36700 }, { "epoch": 6.36, "eval_loss": Infinity, "eval_runtime": 545.4805, "eval_samples_per_second": 20.663, "eval_steps_per_second": 2.583, "eval_wer": 0.25445453017313835, "step": 36800 }, { "epoch": 6.38, "eval_loss": Infinity, "eval_runtime": 545.6649, "eval_samples_per_second": 20.656, "eval_steps_per_second": 2.582, "eval_wer": 0.25120818624978986, "step": 36900 }, { "epoch": 6.4, "learning_rate": 0.00017306273918589818, "loss": 0.1269, "step": 37000 }, { "epoch": 6.4, "eval_loss": Infinity, "eval_runtime": 545.7146, "eval_samples_per_second": 20.654, "eval_steps_per_second": 2.582, "eval_wer": 0.25005252983694737, "step": 37000 }, { "epoch": 6.42, "eval_loss": Infinity, "eval_runtime": 545.1673, "eval_samples_per_second": 20.674, "eval_steps_per_second": 2.585, "eval_wer": 0.24807740796772568, "step": 37100 }, { "epoch": 6.43, "eval_loss": Infinity, "eval_runtime": 544.0697, "eval_samples_per_second": 20.716, "eval_steps_per_second": 2.59, "eval_wer": 0.245156749033451, "step": 37200 }, { "epoch": 6.45, "eval_loss": Infinity, "eval_runtime": 552.8142, "eval_samples_per_second": 20.388, "eval_steps_per_second": 2.549, "eval_wer": 0.2427088586317028, "step": 37300 }, { "epoch": 6.47, "eval_loss": Infinity, "eval_runtime": 579.5521, "eval_samples_per_second": 19.448, "eval_steps_per_second": 2.431, "eval_wer": 0.25326735585812743, "step": 37400 }, { "epoch": 6.49, "learning_rate": 0.0001713232053809579, "loss": 0.1304, "step": 37500 }, { "epoch": 6.49, "eval_loss": Infinity, "eval_runtime": 609.7099, "eval_samples_per_second": 18.486, "eval_steps_per_second": 2.311, "eval_wer": 0.25523197175995965, "step": 37500 }, { "epoch": 6.5, "eval_loss": Infinity, "eval_runtime": 611.8183, "eval_samples_per_second": 18.422, "eval_steps_per_second": 2.303, "eval_wer": 0.2482455034459573, "step": 37600 }, { "epoch": 6.52, "eval_loss": Infinity, "eval_runtime": 609.1706, "eval_samples_per_second": 18.502, "eval_steps_per_second": 2.313, "eval_wer": 0.24762565136997816, "step": 37700 }, { "epoch": 6.54, "eval_loss": Infinity, "eval_runtime": 610.1889, "eval_samples_per_second": 18.471, "eval_steps_per_second": 2.309, "eval_wer": 0.252994200706001, "step": 37800 }, { "epoch": 6.55, "eval_loss": Infinity, "eval_runtime": 608.2683, "eval_samples_per_second": 18.53, "eval_steps_per_second": 2.316, "eval_wer": 0.2427193645990923, "step": 37900 }, { "epoch": 6.57, "learning_rate": 0.00016958367157601762, "loss": 0.1259, "step": 38000 }, { "epoch": 6.57, "eval_loss": Infinity, "eval_runtime": 607.8109, "eval_samples_per_second": 18.544, "eval_steps_per_second": 2.318, "eval_wer": 0.244473861153135, "step": 38000 }, { "epoch": 6.59, "eval_loss": Infinity, "eval_runtime": 611.2735, "eval_samples_per_second": 18.439, "eval_steps_per_second": 2.305, "eval_wer": 0.24523029080517733, "step": 38100 }, { "epoch": 6.61, "eval_loss": Infinity, "eval_runtime": 611.2354, "eval_samples_per_second": 18.44, "eval_steps_per_second": 2.305, "eval_wer": 0.2509560430324424, "step": 38200 }, { "epoch": 6.62, "eval_loss": Infinity, "eval_runtime": 607.3737, "eval_samples_per_second": 18.557, "eval_steps_per_second": 2.32, "eval_wer": 0.24547192805513532, "step": 38300 }, { "epoch": 6.64, "eval_loss": Infinity, "eval_runtime": 557.5444, "eval_samples_per_second": 20.215, "eval_steps_per_second": 2.527, "eval_wer": 0.2478777945873256, "step": 38400 }, { "epoch": 6.66, "learning_rate": 0.00016784413777107732, "loss": 0.1244, "step": 38500 }, { "epoch": 6.66, "eval_loss": Infinity, "eval_runtime": 558.0795, "eval_samples_per_second": 20.196, "eval_steps_per_second": 2.525, "eval_wer": 0.25171247268448477, "step": 38500 }, { "epoch": 6.68, "eval_loss": Infinity, "eval_runtime": 551.4957, "eval_samples_per_second": 20.437, "eval_steps_per_second": 2.555, "eval_wer": 0.25004202386955793, "step": 38600 }, { "epoch": 6.69, "eval_loss": Infinity, "eval_runtime": 547.5154, "eval_samples_per_second": 20.586, "eval_steps_per_second": 2.573, "eval_wer": 0.24217305429483946, "step": 38700 }, { "epoch": 6.71, "eval_loss": Infinity, "eval_runtime": 551.8818, "eval_samples_per_second": 20.423, "eval_steps_per_second": 2.553, "eval_wer": 0.2515548831736426, "step": 38800 }, { "epoch": 6.73, "eval_loss": Infinity, "eval_runtime": 571.7971, "eval_samples_per_second": 19.712, "eval_steps_per_second": 2.464, "eval_wer": 0.24498865355521937, "step": 38900 }, { "epoch": 6.75, "learning_rate": 0.00016610460396613707, "loss": 0.1281, "step": 39000 }, { "epoch": 6.75, "eval_loss": Infinity, "eval_runtime": 559.2146, "eval_samples_per_second": 20.155, "eval_steps_per_second": 2.52, "eval_wer": 0.24629139351151455, "step": 39000 }, { "epoch": 6.76, "eval_loss": Infinity, "eval_runtime": 549.7387, "eval_samples_per_second": 20.502, "eval_steps_per_second": 2.563, "eval_wer": 0.24811943183728358, "step": 39100 }, { "epoch": 6.78, "eval_loss": Infinity, "eval_runtime": 546.7395, "eval_samples_per_second": 20.615, "eval_steps_per_second": 2.577, "eval_wer": 0.24802487813077828, "step": 39200 }, { "epoch": 6.8, "eval_loss": Infinity, "eval_runtime": 556.9541, "eval_samples_per_second": 20.237, "eval_steps_per_second": 2.53, "eval_wer": 0.24601823835938813, "step": 39300 }, { "epoch": 6.81, "eval_loss": Infinity, "eval_runtime": 546.1242, "eval_samples_per_second": 20.638, "eval_steps_per_second": 2.58, "eval_wer": 0.24889687342410488, "step": 39400 }, { "epoch": 6.83, "learning_rate": 0.00016436854922880666, "loss": 0.1287, "step": 39500 }, { "epoch": 6.83, "eval_loss": Infinity, "eval_runtime": 542.5205, "eval_samples_per_second": 20.775, "eval_steps_per_second": 2.597, "eval_wer": 0.24849764666330476, "step": 39500 }, { "epoch": 6.85, "eval_loss": Infinity, "eval_runtime": 542.3359, "eval_samples_per_second": 20.782, "eval_steps_per_second": 2.598, "eval_wer": 0.24547192805513532, "step": 39600 }, { "epoch": 6.87, "eval_loss": Infinity, "eval_runtime": 544.5258, "eval_samples_per_second": 20.699, "eval_steps_per_second": 2.588, "eval_wer": 0.2451042191965036, "step": 39700 }, { "epoch": 6.88, "eval_loss": Infinity, "eval_runtime": 544.0336, "eval_samples_per_second": 20.717, "eval_steps_per_second": 2.59, "eval_wer": 0.2473209783156833, "step": 39800 }, { "epoch": 6.9, "eval_loss": Infinity, "eval_runtime": 551.3211, "eval_samples_per_second": 20.444, "eval_steps_per_second": 2.556, "eval_wer": 0.25002101193477894, "step": 39900 }, { "epoch": 6.92, "learning_rate": 0.00016263249449147626, "loss": 0.1308, "step": 40000 }, { "epoch": 6.92, "eval_loss": Infinity, "eval_runtime": 554.882, "eval_samples_per_second": 20.312, "eval_steps_per_second": 2.539, "eval_wer": 0.2451042191965036, "step": 40000 }, { "epoch": 6.94, "eval_loss": Infinity, "eval_runtime": 542.0787, "eval_samples_per_second": 20.792, "eval_steps_per_second": 2.599, "eval_wer": 0.24064968902336528, "step": 40100 }, { "epoch": 6.95, "eval_loss": Infinity, "eval_runtime": 589.9942, "eval_samples_per_second": 19.104, "eval_steps_per_second": 2.388, "eval_wer": 0.23928391326273324, "step": 40200 }, { "epoch": 6.97, "eval_loss": Infinity, "eval_runtime": 542.3329, "eval_samples_per_second": 20.782, "eval_steps_per_second": 2.598, "eval_wer": 0.24142713061018659, "step": 40300 }, { "epoch": 6.99, "eval_loss": Infinity, "eval_runtime": 543.579, "eval_samples_per_second": 20.735, "eval_steps_per_second": 2.592, "eval_wer": 0.23991427130610188, "step": 40400 }, { "epoch": 7.0, "learning_rate": 0.00016089296068653598, "loss": 0.1189, "step": 40500 }, { "epoch": 7.0, "eval_loss": Infinity, "eval_runtime": 546.472, "eval_samples_per_second": 20.625, "eval_steps_per_second": 2.578, "eval_wer": 0.2381912926542276, "step": 40500 }, { "epoch": 7.02, "eval_loss": Infinity, "eval_runtime": 554.1607, "eval_samples_per_second": 20.339, "eval_steps_per_second": 2.543, "eval_wer": 0.2400298369473861, "step": 40600 }, { "epoch": 7.04, "eval_loss": Infinity, "eval_runtime": 550.4036, "eval_samples_per_second": 20.478, "eval_steps_per_second": 2.56, "eval_wer": 0.24198394688182887, "step": 40700 }, { "epoch": 7.06, "eval_loss": Infinity, "eval_runtime": 544.257, "eval_samples_per_second": 20.709, "eval_steps_per_second": 2.589, "eval_wer": 0.24069171289292318, "step": 40800 }, { "epoch": 7.07, "eval_loss": Infinity, "eval_runtime": 552.2615, "eval_samples_per_second": 20.409, "eval_steps_per_second": 2.551, "eval_wer": 0.24138510674062869, "step": 40900 }, { "epoch": 7.09, "learning_rate": 0.0001591534268815957, "loss": 0.1132, "step": 41000 }, { "epoch": 7.09, "eval_loss": Infinity, "eval_runtime": 544.7913, "eval_samples_per_second": 20.689, "eval_steps_per_second": 2.586, "eval_wer": 0.24250924525130274, "step": 41000 }, { "epoch": 7.11, "eval_loss": Infinity, "eval_runtime": 549.0429, "eval_samples_per_second": 20.528, "eval_steps_per_second": 2.566, "eval_wer": 0.2376870062195327, "step": 41100 }, { "epoch": 7.13, "eval_loss": Infinity, "eval_runtime": 549.5056, "eval_samples_per_second": 20.511, "eval_steps_per_second": 2.564, "eval_wer": 0.23895822827365945, "step": 41200 }, { "epoch": 7.14, "eval_loss": Infinity, "eval_runtime": 551.038, "eval_samples_per_second": 20.454, "eval_steps_per_second": 2.557, "eval_wer": 0.23946251470835433, "step": 41300 }, { "epoch": 7.16, "eval_loss": Infinity, "eval_runtime": 551.6556, "eval_samples_per_second": 20.431, "eval_steps_per_second": 2.554, "eval_wer": 0.24171079172970247, "step": 41400 }, { "epoch": 7.18, "learning_rate": 0.00015741389307665545, "loss": 0.1058, "step": 41500 }, { "epoch": 7.18, "eval_loss": Infinity, "eval_runtime": 551.1685, "eval_samples_per_second": 20.449, "eval_steps_per_second": 2.556, "eval_wer": 0.23923138342578584, "step": 41500 }, { "epoch": 7.19, "eval_loss": Infinity, "eval_runtime": 547.2412, "eval_samples_per_second": 20.596, "eval_steps_per_second": 2.575, "eval_wer": 0.23935745503445957, "step": 41600 }, { "epoch": 7.21, "eval_loss": Infinity, "eval_runtime": 545.7997, "eval_samples_per_second": 20.65, "eval_steps_per_second": 2.582, "eval_wer": 0.23876912086064886, "step": 41700 }, { "epoch": 7.23, "eval_loss": Infinity, "eval_runtime": 544.9052, "eval_samples_per_second": 20.684, "eval_steps_per_second": 2.586, "eval_wer": 0.24115397545806017, "step": 41800 }, { "epoch": 7.25, "eval_loss": Infinity, "eval_runtime": 551.8822, "eval_samples_per_second": 20.423, "eval_steps_per_second": 2.553, "eval_wer": 0.24514624306606153, "step": 41900 }, { "epoch": 7.26, "learning_rate": 0.00015567435927171518, "loss": 0.1038, "step": 42000 }, { "epoch": 7.26, "eval_loss": Infinity, "eval_runtime": 544.2814, "eval_samples_per_second": 20.708, "eval_steps_per_second": 2.589, "eval_wer": 0.24196293494704993, "step": 42000 }, { "epoch": 7.28, "eval_loss": Infinity, "eval_runtime": 546.2453, "eval_samples_per_second": 20.634, "eval_steps_per_second": 2.579, "eval_wer": 0.23996680114304925, "step": 42100 }, { "epoch": 7.3, "eval_loss": Infinity, "eval_runtime": 542.654, "eval_samples_per_second": 20.77, "eval_steps_per_second": 2.596, "eval_wer": 0.24099638594721803, "step": 42200 }, { "epoch": 7.32, "eval_loss": Infinity, "eval_runtime": 545.7874, "eval_samples_per_second": 20.651, "eval_steps_per_second": 2.582, "eval_wer": 0.2377710539586485, "step": 42300 }, { "epoch": 7.33, "eval_loss": Infinity, "eval_runtime": 543.8176, "eval_samples_per_second": 20.726, "eval_steps_per_second": 2.591, "eval_wer": 0.24062867708858632, "step": 42400 }, { "epoch": 7.35, "learning_rate": 0.00015393830453438477, "loss": 0.1084, "step": 42500 }, { "epoch": 7.35, "eval_loss": Infinity, "eval_runtime": 542.352, "eval_samples_per_second": 20.782, "eval_steps_per_second": 2.598, "eval_wer": 0.23573289628508992, "step": 42500 }, { "epoch": 7.37, "eval_loss": Infinity, "eval_runtime": 543.3886, "eval_samples_per_second": 20.742, "eval_steps_per_second": 2.593, "eval_wer": 0.23681501092620608, "step": 42600 }, { "epoch": 7.38, "eval_loss": Infinity, "eval_runtime": 545.4438, "eval_samples_per_second": 20.664, "eval_steps_per_second": 2.583, "eval_wer": 0.23580643805681628, "step": 42700 }, { "epoch": 7.4, "eval_loss": Infinity, "eval_runtime": 545.4721, "eval_samples_per_second": 20.663, "eval_steps_per_second": 2.583, "eval_wer": 0.24020843839300723, "step": 42800 }, { "epoch": 7.42, "eval_loss": Infinity, "eval_runtime": 544.5151, "eval_samples_per_second": 20.699, "eval_steps_per_second": 2.588, "eval_wer": 0.23803370314338546, "step": 42900 }, { "epoch": 7.44, "learning_rate": 0.0001521987707294445, "loss": 0.1094, "step": 43000 }, { "epoch": 7.44, "eval_loss": Infinity, "eval_runtime": 545.5739, "eval_samples_per_second": 20.659, "eval_steps_per_second": 2.583, "eval_wer": 0.23912632375189108, "step": 43000 }, { "epoch": 7.45, "eval_loss": Infinity, "eval_runtime": 546.28, "eval_samples_per_second": 20.632, "eval_steps_per_second": 2.579, "eval_wer": 0.24224659606656582, "step": 43100 }, { "epoch": 7.47, "eval_loss": Infinity, "eval_runtime": 546.7274, "eval_samples_per_second": 20.615, "eval_steps_per_second": 2.577, "eval_wer": 0.23834888216506975, "step": 43200 }, { "epoch": 7.49, "eval_loss": Infinity, "eval_runtime": 546.5993, "eval_samples_per_second": 20.62, "eval_steps_per_second": 2.578, "eval_wer": 0.23654185577407968, "step": 43300 }, { "epoch": 7.51, "eval_loss": Infinity, "eval_runtime": 544.9504, "eval_samples_per_second": 20.683, "eval_steps_per_second": 2.586, "eval_wer": 0.2389372163388805, "step": 43400 }, { "epoch": 7.52, "learning_rate": 0.00015045923692450422, "loss": 0.1088, "step": 43500 }, { "epoch": 7.52, "eval_loss": Infinity, "eval_runtime": 545.8554, "eval_samples_per_second": 20.648, "eval_steps_per_second": 2.581, "eval_wer": 0.2359745335350479, "step": 43500 }, { "epoch": 7.54, "eval_loss": Infinity, "eval_runtime": 546.547, "eval_samples_per_second": 20.622, "eval_steps_per_second": 2.578, "eval_wer": 0.24074424272987058, "step": 43600 }, { "epoch": 7.56, "eval_loss": Infinity, "eval_runtime": 546.4586, "eval_samples_per_second": 20.626, "eval_steps_per_second": 2.578, "eval_wer": 0.23735081526306942, "step": 43700 }, { "epoch": 7.58, "eval_loss": Infinity, "eval_runtime": 545.2466, "eval_samples_per_second": 20.671, "eval_steps_per_second": 2.584, "eval_wer": 0.23444066229618424, "step": 43800 }, { "epoch": 7.59, "eval_loss": Infinity, "eval_runtime": 559.1801, "eval_samples_per_second": 20.156, "eval_steps_per_second": 2.52, "eval_wer": 0.23550176500252143, "step": 43900 }, { "epoch": 7.61, "learning_rate": 0.00014871970311956394, "loss": 0.1082, "step": 44000 }, { "epoch": 7.61, "eval_loss": Infinity, "eval_runtime": 544.6369, "eval_samples_per_second": 20.695, "eval_steps_per_second": 2.587, "eval_wer": 0.23964111615397546, "step": 44000 }, { "epoch": 7.63, "eval_loss": Infinity, "eval_runtime": 546.7779, "eval_samples_per_second": 20.613, "eval_steps_per_second": 2.577, "eval_wer": 0.2347348293830896, "step": 44100 }, { "epoch": 7.64, "eval_loss": Infinity, "eval_runtime": 544.3794, "eval_samples_per_second": 20.704, "eval_steps_per_second": 2.588, "eval_wer": 0.2344091443940158, "step": 44200 }, { "epoch": 7.66, "eval_loss": Infinity, "eval_runtime": 545.2672, "eval_samples_per_second": 20.671, "eval_steps_per_second": 2.584, "eval_wer": 0.2359745335350479, "step": 44300 }, { "epoch": 7.68, "eval_loss": Infinity, "eval_runtime": 546.2821, "eval_samples_per_second": 20.632, "eval_steps_per_second": 2.579, "eval_wer": 0.24059715918641789, "step": 44400 }, { "epoch": 7.7, "learning_rate": 0.00014698364838223354, "loss": 0.1101, "step": 44500 }, { "epoch": 7.7, "eval_loss": Infinity, "eval_runtime": 544.6729, "eval_samples_per_second": 20.693, "eval_steps_per_second": 2.587, "eval_wer": 0.23647881996974282, "step": 44500 }, { "epoch": 7.71, "eval_loss": Infinity, "eval_runtime": 545.37, "eval_samples_per_second": 20.667, "eval_steps_per_second": 2.584, "eval_wer": 0.2358799798285426, "step": 44600 }, { "epoch": 7.73, "eval_loss": Infinity, "eval_runtime": 546.597, "eval_samples_per_second": 20.62, "eval_steps_per_second": 2.578, "eval_wer": 0.24444234325096656, "step": 44700 }, { "epoch": 7.75, "eval_loss": Infinity, "eval_runtime": 547.5764, "eval_samples_per_second": 20.583, "eval_steps_per_second": 2.573, "eval_wer": 0.23757144057824844, "step": 44800 }, { "epoch": 7.77, "eval_loss": Infinity, "eval_runtime": 547.3757, "eval_samples_per_second": 20.591, "eval_steps_per_second": 2.574, "eval_wer": 0.2360270633719953, "step": 44900 }, { "epoch": 7.78, "learning_rate": 0.00014524411457729328, "loss": 0.1114, "step": 45000 }, { "epoch": 7.78, "eval_loss": Infinity, "eval_runtime": 547.5394, "eval_samples_per_second": 20.585, "eval_steps_per_second": 2.573, "eval_wer": 0.23577492015464785, "step": 45000 }, { "epoch": 7.8, "eval_loss": Infinity, "eval_runtime": 547.5618, "eval_samples_per_second": 20.584, "eval_steps_per_second": 2.573, "eval_wer": 0.23652084383930072, "step": 45100 }, { "epoch": 7.82, "eval_loss": Infinity, "eval_runtime": 547.0038, "eval_samples_per_second": 20.605, "eval_steps_per_second": 2.576, "eval_wer": 0.2381072449151118, "step": 45200 }, { "epoch": 7.83, "eval_loss": Infinity, "eval_runtime": 547.295, "eval_samples_per_second": 20.594, "eval_steps_per_second": 2.574, "eval_wer": 0.23496596066565809, "step": 45300 }, { "epoch": 7.85, "eval_loss": Infinity, "eval_runtime": 547.0451, "eval_samples_per_second": 20.603, "eval_steps_per_second": 2.576, "eval_wer": 0.23590099176332158, "step": 45400 }, { "epoch": 7.87, "learning_rate": 0.00014350458077235298, "loss": 0.1133, "step": 45500 }, { "epoch": 7.87, "eval_loss": Infinity, "eval_runtime": 545.0755, "eval_samples_per_second": 20.678, "eval_steps_per_second": 2.585, "eval_wer": 0.23681501092620608, "step": 45500 }, { "epoch": 7.89, "eval_loss": Infinity, "eval_runtime": 546.4556, "eval_samples_per_second": 20.626, "eval_steps_per_second": 2.578, "eval_wer": 0.24080727853420744, "step": 45600 }, { "epoch": 7.9, "eval_loss": Infinity, "eval_runtime": 543.2499, "eval_samples_per_second": 20.747, "eval_steps_per_second": 2.594, "eval_wer": 0.23743486300218525, "step": 45700 }, { "epoch": 7.92, "eval_loss": Infinity, "eval_runtime": 544.8106, "eval_samples_per_second": 20.688, "eval_steps_per_second": 2.586, "eval_wer": 0.23604807530677424, "step": 45800 }, { "epoch": 7.94, "eval_loss": Infinity, "eval_runtime": 543.3851, "eval_samples_per_second": 20.742, "eval_steps_per_second": 2.593, "eval_wer": 0.23178265254664648, "step": 45900 }, { "epoch": 7.96, "learning_rate": 0.00014176504696741273, "loss": 0.1058, "step": 46000 }, { "epoch": 7.96, "eval_loss": Infinity, "eval_runtime": 543.8967, "eval_samples_per_second": 20.723, "eval_steps_per_second": 2.591, "eval_wer": 0.23223440914439403, "step": 46000 }, { "epoch": 7.97, "eval_loss": Infinity, "eval_runtime": 544.0937, "eval_samples_per_second": 20.715, "eval_steps_per_second": 2.59, "eval_wer": 0.23738233316523785, "step": 46100 }, { "epoch": 7.99, "eval_loss": Infinity, "eval_runtime": 544.8297, "eval_samples_per_second": 20.687, "eval_steps_per_second": 2.586, "eval_wer": 0.23216086737266767, "step": 46200 }, { "epoch": 8.01, "eval_loss": Infinity, "eval_runtime": 544.7266, "eval_samples_per_second": 20.691, "eval_steps_per_second": 2.587, "eval_wer": 0.23605858127416374, "step": 46300 }, { "epoch": 8.02, "eval_loss": Infinity, "eval_runtime": 543.6144, "eval_samples_per_second": 20.733, "eval_steps_per_second": 2.592, "eval_wer": 0.2351970919482266, "step": 46400 }, { "epoch": 8.04, "learning_rate": 0.00014002551316247245, "loss": 0.1024, "step": 46500 }, { "epoch": 8.04, "eval_loss": Infinity, "eval_runtime": 544.0783, "eval_samples_per_second": 20.716, "eval_steps_per_second": 2.59, "eval_wer": 0.23300134476382586, "step": 46500 }, { "epoch": 8.06, "eval_loss": Infinity, "eval_runtime": 544.1678, "eval_samples_per_second": 20.712, "eval_steps_per_second": 2.589, "eval_wer": 0.23152000336190956, "step": 46600 }, { "epoch": 8.08, "eval_loss": Infinity, "eval_runtime": 547.7672, "eval_samples_per_second": 20.576, "eval_steps_per_second": 2.572, "eval_wer": 0.23152000336190956, "step": 46700 }, { "epoch": 8.09, "eval_loss": Infinity, "eval_runtime": 545.4647, "eval_samples_per_second": 20.663, "eval_steps_per_second": 2.583, "eval_wer": 0.23452471003530004, "step": 46800 }, { "epoch": 8.11, "eval_loss": Infinity, "eval_runtime": 544.6881, "eval_samples_per_second": 20.693, "eval_steps_per_second": 2.587, "eval_wer": 0.2372247436543957, "step": 46900 }, { "epoch": 8.13, "learning_rate": 0.00013828597935753217, "loss": 0.093, "step": 47000 }, { "epoch": 8.13, "eval_loss": Infinity, "eval_runtime": 542.6307, "eval_samples_per_second": 20.771, "eval_steps_per_second": 2.597, "eval_wer": 0.2356173306438057, "step": 47000 }, { "epoch": 8.15, "eval_loss": Infinity, "eval_runtime": 544.7932, "eval_samples_per_second": 20.689, "eval_steps_per_second": 2.586, "eval_wer": 0.2337577744158682, "step": 47100 }, { "epoch": 8.16, "eval_loss": Infinity, "eval_runtime": 545.3612, "eval_samples_per_second": 20.667, "eval_steps_per_second": 2.584, "eval_wer": 0.23032232307950917, "step": 47200 }, { "epoch": 8.18, "eval_loss": Infinity, "eval_runtime": 544.9025, "eval_samples_per_second": 20.684, "eval_steps_per_second": 2.586, "eval_wer": 0.23370524457892083, "step": 47300 }, { "epoch": 8.2, "eval_loss": Infinity, "eval_runtime": 542.8145, "eval_samples_per_second": 20.764, "eval_steps_per_second": 2.596, "eval_wer": 0.23327449991595225, "step": 47400 }, { "epoch": 8.22, "learning_rate": 0.0001365464455525919, "loss": 0.0907, "step": 47500 }, { "epoch": 8.22, "eval_loss": Infinity, "eval_runtime": 543.608, "eval_samples_per_second": 20.734, "eval_steps_per_second": 2.592, "eval_wer": 0.23349512523113128, "step": 47500 }, { "epoch": 8.23, "eval_loss": Infinity, "eval_runtime": 544.4985, "eval_samples_per_second": 20.7, "eval_steps_per_second": 2.588, "eval_wer": 0.2339048579593209, "step": 47600 }, { "epoch": 8.25, "eval_loss": Infinity, "eval_runtime": 557.8672, "eval_samples_per_second": 20.204, "eval_steps_per_second": 2.526, "eval_wer": 0.23124684820978317, "step": 47700 }, { "epoch": 8.27, "eval_loss": Infinity, "eval_runtime": 545.0667, "eval_samples_per_second": 20.678, "eval_steps_per_second": 2.585, "eval_wer": 0.23343208942679441, "step": 47800 }, { "epoch": 8.28, "eval_loss": Infinity, "eval_runtime": 544.2596, "eval_samples_per_second": 20.709, "eval_steps_per_second": 2.589, "eval_wer": 0.2310787527315515, "step": 47900 }, { "epoch": 8.3, "learning_rate": 0.0001348103908152615, "loss": 0.0909, "step": 48000 }, { "epoch": 8.3, "eval_loss": Infinity, "eval_runtime": 542.9121, "eval_samples_per_second": 20.76, "eval_steps_per_second": 2.595, "eval_wer": 0.23346360732896285, "step": 48000 }, { "epoch": 8.32, "eval_loss": Infinity, "eval_runtime": 545.1225, "eval_samples_per_second": 20.676, "eval_steps_per_second": 2.585, "eval_wer": 0.23476634728525803, "step": 48100 }, { "epoch": 8.34, "eval_loss": Infinity, "eval_runtime": 543.7866, "eval_samples_per_second": 20.727, "eval_steps_per_second": 2.591, "eval_wer": 0.22904059505799293, "step": 48200 }, { "epoch": 8.35, "eval_loss": Infinity, "eval_runtime": 544.9739, "eval_samples_per_second": 20.682, "eval_steps_per_second": 2.585, "eval_wer": 0.23550176500252143, "step": 48300 }, { "epoch": 8.37, "eval_loss": Infinity, "eval_runtime": 557.5362, "eval_samples_per_second": 20.216, "eval_steps_per_second": 2.527, "eval_wer": 0.2322869389813414, "step": 48400 }, { "epoch": 8.39, "learning_rate": 0.00013307085701032124, "loss": 0.0956, "step": 48500 }, { "epoch": 8.39, "eval_loss": Infinity, "eval_runtime": 542.6037, "eval_samples_per_second": 20.772, "eval_steps_per_second": 2.597, "eval_wer": 0.22925071440578249, "step": 48500 }, { "epoch": 8.41, "eval_loss": Infinity, "eval_runtime": 554.9667, "eval_samples_per_second": 20.309, "eval_steps_per_second": 2.539, "eval_wer": 0.22897755925365607, "step": 48600 }, { "epoch": 8.42, "eval_loss": Infinity, "eval_runtime": 545.2076, "eval_samples_per_second": 20.673, "eval_steps_per_second": 2.584, "eval_wer": 0.22791645654731887, "step": 48700 }, { "epoch": 8.44, "eval_loss": Infinity, "eval_runtime": 545.724, "eval_samples_per_second": 20.653, "eval_steps_per_second": 2.582, "eval_wer": 0.2311312825684989, "step": 48800 }, { "epoch": 8.46, "eval_loss": Infinity, "eval_runtime": 545.671, "eval_samples_per_second": 20.655, "eval_steps_per_second": 2.582, "eval_wer": 0.23051143049251976, "step": 48900 }, { "epoch": 8.47, "learning_rate": 0.00013133132320538094, "loss": 0.0923, "step": 49000 }, { "epoch": 8.47, "eval_loss": Infinity, "eval_runtime": 553.4158, "eval_samples_per_second": 20.366, "eval_steps_per_second": 2.546, "eval_wer": 0.2332114641116154, "step": 49000 }, { "epoch": 8.49, "eval_loss": Infinity, "eval_runtime": 547.8596, "eval_samples_per_second": 20.573, "eval_steps_per_second": 2.572, "eval_wer": 0.2293347621448983, "step": 49100 }, { "epoch": 8.51, "eval_loss": Infinity, "eval_runtime": 546.9612, "eval_samples_per_second": 20.607, "eval_steps_per_second": 2.576, "eval_wer": 0.2290090771558245, "step": 49200 }, { "epoch": 8.53, "eval_loss": Infinity, "eval_runtime": 545.7413, "eval_samples_per_second": 20.653, "eval_steps_per_second": 2.582, "eval_wer": 0.23329551185073122, "step": 49300 }, { "epoch": 8.54, "eval_loss": Infinity, "eval_runtime": 547.3327, "eval_samples_per_second": 20.593, "eval_steps_per_second": 2.574, "eval_wer": 0.23098419902504622, "step": 49400 }, { "epoch": 8.56, "learning_rate": 0.00012959178940044069, "loss": 0.0922, "step": 49500 }, { "epoch": 8.56, "eval_loss": Infinity, "eval_runtime": 549.3327, "eval_samples_per_second": 20.518, "eval_steps_per_second": 2.565, "eval_wer": 0.2294293158514036, "step": 49500 }, { "epoch": 8.58, "eval_loss": Infinity, "eval_runtime": 547.2867, "eval_samples_per_second": 20.594, "eval_steps_per_second": 2.575, "eval_wer": 0.22784291477559254, "step": 49600 }, { "epoch": 8.6, "eval_loss": Infinity, "eval_runtime": 545.8501, "eval_samples_per_second": 20.649, "eval_steps_per_second": 2.581, "eval_wer": 0.23023827534039334, "step": 49700 }, { "epoch": 8.61, "eval_loss": Infinity, "eval_runtime": 553.5261, "eval_samples_per_second": 20.362, "eval_steps_per_second": 2.545, "eval_wer": 0.23106824676416204, "step": 49800 }, { "epoch": 8.63, "eval_loss": Infinity, "eval_runtime": 544.8885, "eval_samples_per_second": 20.685, "eval_steps_per_second": 2.586, "eval_wer": 0.22471213649352834, "step": 49900 }, { "epoch": 8.65, "learning_rate": 0.00012785225559550038, "loss": 0.0922, "step": 50000 }, { "epoch": 8.65, "eval_loss": Infinity, "eval_runtime": 544.5289, "eval_samples_per_second": 20.699, "eval_steps_per_second": 2.588, "eval_wer": 0.22955538746007734, "step": 50000 }, { "epoch": 8.66, "eval_loss": Infinity, "eval_runtime": 546.894, "eval_samples_per_second": 20.609, "eval_steps_per_second": 2.576, "eval_wer": 0.23000714405782485, "step": 50100 }, { "epoch": 8.68, "eval_loss": Infinity, "eval_runtime": 545.6073, "eval_samples_per_second": 20.658, "eval_steps_per_second": 2.582, "eval_wer": 0.2265191628845184, "step": 50200 }, { "epoch": 8.7, "eval_loss": Infinity, "eval_runtime": 545.5673, "eval_samples_per_second": 20.659, "eval_steps_per_second": 2.583, "eval_wer": 0.22610943015632878, "step": 50300 }, { "epoch": 8.72, "eval_loss": Infinity, "eval_runtime": 548.0111, "eval_samples_per_second": 20.567, "eval_steps_per_second": 2.571, "eval_wer": 0.22705496722138174, "step": 50400 }, { "epoch": 8.73, "learning_rate": 0.00012611272179056013, "loss": 0.0963, "step": 50500 }, { "epoch": 8.73, "eval_loss": Infinity, "eval_runtime": 545.7263, "eval_samples_per_second": 20.653, "eval_steps_per_second": 2.582, "eval_wer": 0.2270759791561607, "step": 50500 }, { "epoch": 8.75, "eval_loss": Infinity, "eval_runtime": 545.0461, "eval_samples_per_second": 20.679, "eval_steps_per_second": 2.585, "eval_wer": 0.22822112960161373, "step": 50600 }, { "epoch": 8.77, "eval_loss": Infinity, "eval_runtime": 544.416, "eval_samples_per_second": 20.703, "eval_steps_per_second": 2.588, "eval_wer": 0.2308581274163725, "step": 50700 }, { "epoch": 8.79, "eval_loss": Infinity, "eval_runtime": 544.2614, "eval_samples_per_second": 20.709, "eval_steps_per_second": 2.589, "eval_wer": 0.22995461422087746, "step": 50800 }, { "epoch": 8.8, "eval_loss": Infinity, "eval_runtime": 544.7154, "eval_samples_per_second": 20.692, "eval_steps_per_second": 2.587, "eval_wer": 0.23181417044881492, "step": 50900 }, { "epoch": 8.82, "learning_rate": 0.00012437318798561982, "loss": 0.0922, "step": 51000 }, { "epoch": 8.82, "eval_loss": Infinity, "eval_runtime": 556.1696, "eval_samples_per_second": 20.265, "eval_steps_per_second": 2.533, "eval_wer": 0.23071104387291982, "step": 51000 }, { "epoch": 8.84, "eval_loss": Infinity, "eval_runtime": 548.0972, "eval_samples_per_second": 20.564, "eval_steps_per_second": 2.571, "eval_wer": 0.22771684316691881, "step": 51100 }, { "epoch": 8.86, "eval_loss": Infinity, "eval_runtime": 548.2781, "eval_samples_per_second": 20.557, "eval_steps_per_second": 2.57, "eval_wer": 0.23090015128593042, "step": 51200 }, { "epoch": 8.87, "eval_loss": Infinity, "eval_runtime": 546.0918, "eval_samples_per_second": 20.639, "eval_steps_per_second": 2.58, "eval_wer": 0.22607791225416035, "step": 51300 }, { "epoch": 8.89, "eval_loss": Infinity, "eval_runtime": 547.4138, "eval_samples_per_second": 20.59, "eval_steps_per_second": 2.574, "eval_wer": 0.22970247100353, "step": 51400 }, { "epoch": 8.91, "learning_rate": 0.00012264061231589932, "loss": 0.0959, "step": 51500 }, { "epoch": 8.91, "eval_loss": Infinity, "eval_runtime": 547.932, "eval_samples_per_second": 20.57, "eval_steps_per_second": 2.571, "eval_wer": 0.22756975962346612, "step": 51500 }, { "epoch": 8.92, "eval_loss": Infinity, "eval_runtime": 549.2316, "eval_samples_per_second": 20.521, "eval_steps_per_second": 2.565, "eval_wer": 0.2244915111783493, "step": 51600 }, { "epoch": 8.94, "eval_loss": Infinity, "eval_runtime": 546.2517, "eval_samples_per_second": 20.633, "eval_steps_per_second": 2.579, "eval_wer": 0.22511136325432846, "step": 51700 }, { "epoch": 8.96, "eval_loss": Infinity, "eval_runtime": 547.2468, "eval_samples_per_second": 20.596, "eval_steps_per_second": 2.575, "eval_wer": 0.2243549336022861, "step": 51800 }, { "epoch": 8.98, "eval_loss": Infinity, "eval_runtime": 545.227, "eval_samples_per_second": 20.672, "eval_steps_per_second": 2.584, "eval_wer": 0.2264351151454026, "step": 51900 }, { "epoch": 8.99, "learning_rate": 0.00012090107851095906, "loss": 0.0936, "step": 52000 }, { "epoch": 8.99, "eval_loss": Infinity, "eval_runtime": 548.1848, "eval_samples_per_second": 20.561, "eval_steps_per_second": 2.57, "eval_wer": 0.22675029416708692, "step": 52000 }, { "epoch": 9.01, "eval_loss": Infinity, "eval_runtime": 546.0278, "eval_samples_per_second": 20.642, "eval_steps_per_second": 2.58, "eval_wer": 0.2266137165910237, "step": 52100 }, { "epoch": 9.03, "eval_loss": Infinity, "eval_runtime": 545.9251, "eval_samples_per_second": 20.646, "eval_steps_per_second": 2.581, "eval_wer": 0.22677130610186585, "step": 52200 }, { "epoch": 9.05, "eval_loss": Infinity, "eval_runtime": 544.7867, "eval_samples_per_second": 20.689, "eval_steps_per_second": 2.586, "eval_wer": 0.2291036308623298, "step": 52300 }, { "epoch": 9.06, "eval_loss": Infinity, "eval_runtime": 543.6097, "eval_samples_per_second": 20.734, "eval_steps_per_second": 2.592, "eval_wer": 0.22948184568835098, "step": 52400 }, { "epoch": 9.08, "learning_rate": 0.00011916154470601877, "loss": 0.0829, "step": 52500 }, { "epoch": 9.08, "eval_loss": Infinity, "eval_runtime": 545.0074, "eval_samples_per_second": 20.68, "eval_steps_per_second": 2.585, "eval_wer": 0.2251849050260548, "step": 52500 }, { "epoch": 9.1, "eval_loss": Infinity, "eval_runtime": 543.7151, "eval_samples_per_second": 20.73, "eval_steps_per_second": 2.591, "eval_wer": 0.22575222726508656, "step": 52600 }, { "epoch": 9.11, "eval_loss": Infinity, "eval_runtime": 544.2283, "eval_samples_per_second": 20.71, "eval_steps_per_second": 2.589, "eval_wer": 0.2293767860144562, "step": 52700 }, { "epoch": 9.13, "eval_loss": Infinity, "eval_runtime": 545.1003, "eval_samples_per_second": 20.677, "eval_steps_per_second": 2.585, "eval_wer": 0.22807404605816103, "step": 52800 }, { "epoch": 9.15, "eval_loss": Infinity, "eval_runtime": 546.4159, "eval_samples_per_second": 20.627, "eval_steps_per_second": 2.579, "eval_wer": 0.2287359220036981, "step": 52900 }, { "epoch": 9.17, "learning_rate": 0.0001174220109010785, "loss": 0.0759, "step": 53000 }, { "epoch": 9.17, "eval_loss": Infinity, "eval_runtime": 546.0093, "eval_samples_per_second": 20.643, "eval_steps_per_second": 2.581, "eval_wer": 0.22631954950411834, "step": 53000 }, { "epoch": 9.18, "eval_loss": Infinity, "eval_runtime": 553.224, "eval_samples_per_second": 20.373, "eval_steps_per_second": 2.547, "eval_wer": 0.2282736594385611, "step": 53100 }, { "epoch": 9.2, "eval_loss": Infinity, "eval_runtime": 549.148, "eval_samples_per_second": 20.525, "eval_steps_per_second": 2.566, "eval_wer": 0.22410279038493863, "step": 53200 }, { "epoch": 9.22, "eval_loss": Infinity, "eval_runtime": 545.6751, "eval_samples_per_second": 20.655, "eval_steps_per_second": 2.582, "eval_wer": 0.22418683812405446, "step": 53300 }, { "epoch": 9.24, "eval_loss": Infinity, "eval_runtime": 549.3438, "eval_samples_per_second": 20.517, "eval_steps_per_second": 2.565, "eval_wer": 0.224859220036981, "step": 53400 }, { "epoch": 9.25, "learning_rate": 0.0001156859561637481, "loss": 0.0775, "step": 53500 }, { "epoch": 9.25, "eval_loss": Infinity, "eval_runtime": 580.7095, "eval_samples_per_second": 19.409, "eval_steps_per_second": 2.426, "eval_wer": 0.22645612708018154, "step": 53500 }, { "epoch": 9.27, "eval_loss": Infinity, "eval_runtime": 580.879, "eval_samples_per_second": 19.403, "eval_steps_per_second": 2.426, "eval_wer": 0.22520591696083375, "step": 53600 }, { "epoch": 9.29, "eval_loss": Infinity, "eval_runtime": 548.8124, "eval_samples_per_second": 20.537, "eval_steps_per_second": 2.567, "eval_wer": 0.22562615565641284, "step": 53700 }, { "epoch": 9.3, "eval_loss": Infinity, "eval_runtime": 578.538, "eval_samples_per_second": 19.482, "eval_steps_per_second": 2.435, "eval_wer": 0.22503782148260212, "step": 53800 }, { "epoch": 9.32, "eval_loss": Infinity, "eval_runtime": 578.8587, "eval_samples_per_second": 19.471, "eval_steps_per_second": 2.434, "eval_wer": 0.2237981173306438, "step": 53900 }, { "epoch": 9.34, "learning_rate": 0.00011394642235880784, "loss": 0.0763, "step": 54000 }, { "epoch": 9.34, "eval_loss": Infinity, "eval_runtime": 547.6879, "eval_samples_per_second": 20.579, "eval_steps_per_second": 2.573, "eval_wer": 0.223251807026391, "step": 54000 }, { "epoch": 9.36, "eval_loss": Infinity, "eval_runtime": 576.5045, "eval_samples_per_second": 19.551, "eval_steps_per_second": 2.444, "eval_wer": 0.22266347285258026, "step": 54100 }, { "epoch": 9.37, "eval_loss": Infinity, "eval_runtime": 579.2016, "eval_samples_per_second": 19.46, "eval_steps_per_second": 2.433, "eval_wer": 0.22562615565641284, "step": 54200 }, { "epoch": 9.39, "eval_loss": Infinity, "eval_runtime": 546.2896, "eval_samples_per_second": 20.632, "eval_steps_per_second": 2.579, "eval_wer": 0.2248171961674231, "step": 54300 }, { "epoch": 9.41, "eval_loss": Infinity, "eval_runtime": 576.9166, "eval_samples_per_second": 19.537, "eval_steps_per_second": 2.442, "eval_wer": 0.22520591696083375, "step": 54400 }, { "epoch": 9.43, "learning_rate": 0.00011220688855386754, "loss": 0.0736, "step": 54500 }, { "epoch": 9.43, "eval_loss": Infinity, "eval_runtime": 552.0198, "eval_samples_per_second": 20.418, "eval_steps_per_second": 2.552, "eval_wer": 0.2253635064716759, "step": 54500 }, { "epoch": 9.44, "eval_loss": Infinity, "eval_runtime": 589.0127, "eval_samples_per_second": 19.135, "eval_steps_per_second": 2.392, "eval_wer": 0.2293767860144562, "step": 54600 }, { "epoch": 9.46, "eval_loss": Infinity, "eval_runtime": 599.9148, "eval_samples_per_second": 18.788, "eval_steps_per_second": 2.349, "eval_wer": 0.2285468145906875, "step": 54700 }, { "epoch": 9.48, "eval_loss": Infinity, "eval_runtime": 584.9159, "eval_samples_per_second": 19.269, "eval_steps_per_second": 2.409, "eval_wer": 0.22438645150445452, "step": 54800 }, { "epoch": 9.49, "eval_loss": Infinity, "eval_runtime": 579.4563, "eval_samples_per_second": 19.451, "eval_steps_per_second": 2.432, "eval_wer": 0.2259728525802656, "step": 54900 }, { "epoch": 9.51, "learning_rate": 0.00011046735474892728, "loss": 0.0787, "step": 55000 }, { "epoch": 9.51, "eval_loss": Infinity, "eval_runtime": 580.0188, "eval_samples_per_second": 19.432, "eval_steps_per_second": 2.429, "eval_wer": 0.22143427466801144, "step": 55000 }, { "epoch": 9.53, "eval_loss": Infinity, "eval_runtime": 592.0777, "eval_samples_per_second": 19.036, "eval_steps_per_second": 2.38, "eval_wer": 0.22351445621112792, "step": 55100 }, { "epoch": 9.55, "eval_loss": Infinity, "eval_runtime": 576.7489, "eval_samples_per_second": 19.542, "eval_steps_per_second": 2.443, "eval_wer": 0.22336737266767523, "step": 55200 }, { "epoch": 9.56, "eval_loss": Infinity, "eval_runtime": 579.5329, "eval_samples_per_second": 19.448, "eval_steps_per_second": 2.431, "eval_wer": 0.22437594553706505, "step": 55300 }, { "epoch": 9.58, "eval_loss": Infinity, "eval_runtime": 578.7168, "eval_samples_per_second": 19.476, "eval_steps_per_second": 2.435, "eval_wer": 0.22677130610186585, "step": 55400 }, { "epoch": 9.6, "learning_rate": 0.00010872782094398702, "loss": 0.078, "step": 55500 }, { "epoch": 9.6, "eval_loss": Infinity, "eval_runtime": 592.5376, "eval_samples_per_second": 19.022, "eval_steps_per_second": 2.378, "eval_wer": 0.22233778786350647, "step": 55500 }, { "epoch": 9.62, "eval_loss": Infinity, "eval_runtime": 579.5326, "eval_samples_per_second": 19.448, "eval_steps_per_second": 2.431, "eval_wer": 0.22266347285258026, "step": 55600 }, { "epoch": 9.63, "eval_loss": Infinity, "eval_runtime": 578.7638, "eval_samples_per_second": 19.474, "eval_steps_per_second": 2.434, "eval_wer": 0.22395570684148597, "step": 55700 }, { "epoch": 9.65, "eval_loss": Infinity, "eval_runtime": 554.6371, "eval_samples_per_second": 20.321, "eval_steps_per_second": 2.54, "eval_wer": 0.22456505295007564, "step": 55800 }, { "epoch": 9.67, "eval_loss": Infinity, "eval_runtime": 545.7119, "eval_samples_per_second": 20.654, "eval_steps_per_second": 2.582, "eval_wer": 0.2248697260043705, "step": 55900 }, { "epoch": 9.69, "learning_rate": 0.00010698828713904672, "loss": 0.0784, "step": 56000 }, { "epoch": 9.69, "eval_loss": Infinity, "eval_runtime": 545.3578, "eval_samples_per_second": 20.667, "eval_steps_per_second": 2.584, "eval_wer": 0.2238926710371491, "step": 56000 }, { "epoch": 9.7, "eval_loss": Infinity, "eval_runtime": 546.7066, "eval_samples_per_second": 20.616, "eval_steps_per_second": 2.577, "eval_wer": 0.2213502269288956, "step": 56100 }, { "epoch": 9.72, "eval_loss": Infinity, "eval_runtime": 545.4792, "eval_samples_per_second": 20.663, "eval_steps_per_second": 2.583, "eval_wer": 0.22418683812405446, "step": 56200 }, { "epoch": 9.74, "eval_loss": Infinity, "eval_runtime": 546.6115, "eval_samples_per_second": 20.62, "eval_steps_per_second": 2.578, "eval_wer": 0.2221381744831064, "step": 56300 }, { "epoch": 9.75, "eval_loss": Infinity, "eval_runtime": 549.1114, "eval_samples_per_second": 20.526, "eval_steps_per_second": 2.566, "eval_wer": 0.2241238023197176, "step": 56400 }, { "epoch": 9.77, "learning_rate": 0.00010524875333410646, "loss": 0.0771, "step": 56500 }, { "epoch": 9.77, "eval_loss": Infinity, "eval_runtime": 545.5876, "eval_samples_per_second": 20.658, "eval_steps_per_second": 2.583, "eval_wer": 0.2237981173306438, "step": 56500 }, { "epoch": 9.79, "eval_loss": Infinity, "eval_runtime": 543.6977, "eval_samples_per_second": 20.73, "eval_steps_per_second": 2.592, "eval_wer": 0.22221171625483274, "step": 56600 }, { "epoch": 9.81, "eval_loss": Infinity, "eval_runtime": 543.8359, "eval_samples_per_second": 20.725, "eval_steps_per_second": 2.591, "eval_wer": 0.2245755589174651, "step": 56700 }, { "epoch": 9.82, "eval_loss": Infinity, "eval_runtime": 543.7056, "eval_samples_per_second": 20.73, "eval_steps_per_second": 2.591, "eval_wer": 0.2232413010590015, "step": 56800 }, { "epoch": 9.84, "eval_loss": Infinity, "eval_runtime": 543.9681, "eval_samples_per_second": 20.72, "eval_steps_per_second": 2.59, "eval_wer": 0.22365103378719112, "step": 56900 }, { "epoch": 9.86, "learning_rate": 0.00010350921952916617, "loss": 0.076, "step": 57000 }, { "epoch": 9.86, "eval_loss": Infinity, "eval_runtime": 544.4231, "eval_samples_per_second": 20.703, "eval_steps_per_second": 2.588, "eval_wer": 0.22464910068919147, "step": 57000 }, { "epoch": 9.88, "eval_loss": Infinity, "eval_runtime": 544.6818, "eval_samples_per_second": 20.693, "eval_steps_per_second": 2.587, "eval_wer": 0.22017355858127416, "step": 57100 }, { "epoch": 9.89, "eval_loss": Infinity, "eval_runtime": 547.1699, "eval_samples_per_second": 20.599, "eval_steps_per_second": 2.575, "eval_wer": 0.2221801983526643, "step": 57200 }, { "epoch": 9.91, "eval_loss": Infinity, "eval_runtime": 546.1115, "eval_samples_per_second": 20.639, "eval_steps_per_second": 2.58, "eval_wer": 0.2243549336022861, "step": 57300 }, { "epoch": 9.93, "eval_loss": Infinity, "eval_runtime": 545.2721, "eval_samples_per_second": 20.67, "eval_steps_per_second": 2.584, "eval_wer": 0.22443898134140192, "step": 57400 }, { "epoch": 9.94, "learning_rate": 0.00010177316479183579, "loss": 0.0777, "step": 57500 }, { "epoch": 9.94, "eval_loss": Infinity, "eval_runtime": 545.5824, "eval_samples_per_second": 20.659, "eval_steps_per_second": 2.583, "eval_wer": 0.2209930240376534, "step": 57500 }, { "epoch": 9.96, "eval_loss": Infinity, "eval_runtime": 546.1798, "eval_samples_per_second": 20.636, "eval_steps_per_second": 2.58, "eval_wer": 0.218166918809884, "step": 57600 }, { "epoch": 9.98, "eval_loss": Infinity, "eval_runtime": 550.3082, "eval_samples_per_second": 20.481, "eval_steps_per_second": 2.56, "eval_wer": 0.2208039166246428, "step": 57700 }, { "epoch": 10.0, "eval_loss": Infinity, "eval_runtime": 548.1847, "eval_samples_per_second": 20.561, "eval_steps_per_second": 2.57, "eval_wer": 0.2210350479072113, "step": 57800 }, { "epoch": 10.01, "eval_loss": Infinity, "eval_runtime": 546.4203, "eval_samples_per_second": 20.627, "eval_steps_per_second": 2.579, "eval_wer": 0.22032064212472685, "step": 57900 }, { "epoch": 10.03, "learning_rate": 0.0001000336309868955, "loss": 0.0745, "step": 58000 }, { "epoch": 10.03, "eval_loss": Infinity, "eval_runtime": 545.6515, "eval_samples_per_second": 20.656, "eval_steps_per_second": 2.582, "eval_wer": 0.22211716254832745, "step": 58000 }, { "epoch": 10.05, "eval_loss": Infinity, "eval_runtime": 547.4513, "eval_samples_per_second": 20.588, "eval_steps_per_second": 2.574, "eval_wer": 0.22035216002689528, "step": 58100 }, { "epoch": 10.07, "eval_loss": Infinity, "eval_runtime": 548.349, "eval_samples_per_second": 20.554, "eval_steps_per_second": 2.57, "eval_wer": 0.22224323415700117, "step": 58200 }, { "epoch": 10.08, "eval_loss": Infinity, "eval_runtime": 548.8654, "eval_samples_per_second": 20.535, "eval_steps_per_second": 2.567, "eval_wer": 0.21902840813582114, "step": 58300 }, { "epoch": 10.1, "eval_loss": Infinity, "eval_runtime": 578.3959, "eval_samples_per_second": 19.487, "eval_steps_per_second": 2.436, "eval_wer": 0.22157085224407463, "step": 58400 }, { "epoch": 10.12, "learning_rate": 9.829409718195524e-05, "loss": 0.0656, "step": 58500 }, { "epoch": 10.12, "eval_loss": Infinity, "eval_runtime": 574.8445, "eval_samples_per_second": 19.607, "eval_steps_per_second": 2.451, "eval_wer": 0.2210875777441587, "step": 58500 }, { "epoch": 10.13, "eval_loss": Infinity, "eval_runtime": 548.4437, "eval_samples_per_second": 20.551, "eval_steps_per_second": 2.569, "eval_wer": 0.22125567322239031, "step": 58600 }, { "epoch": 10.15, "eval_loss": Infinity, "eval_runtime": 546.1949, "eval_samples_per_second": 20.635, "eval_steps_per_second": 2.58, "eval_wer": 0.22302067574382248, "step": 58700 }, { "epoch": 10.17, "eval_loss": Infinity, "eval_runtime": 544.4777, "eval_samples_per_second": 20.701, "eval_steps_per_second": 2.588, "eval_wer": 0.22341990250462263, "step": 58800 }, { "epoch": 10.19, "eval_loss": Infinity, "eval_runtime": 545.4451, "eval_samples_per_second": 20.664, "eval_steps_per_second": 2.583, "eval_wer": 0.22386115313498067, "step": 58900 }, { "epoch": 10.2, "learning_rate": 9.655456337701495e-05, "loss": 0.0688, "step": 59000 }, { "epoch": 10.2, "eval_loss": Infinity, "eval_runtime": 548.1142, "eval_samples_per_second": 20.563, "eval_steps_per_second": 2.571, "eval_wer": 0.22226424609178014, "step": 59000 }, { "epoch": 10.22, "eval_loss": Infinity, "eval_runtime": 547.69, "eval_samples_per_second": 20.579, "eval_steps_per_second": 2.573, "eval_wer": 0.217484030929568, "step": 59100 }, { "epoch": 10.24, "eval_loss": Infinity, "eval_runtime": 546.4205, "eval_samples_per_second": 20.627, "eval_steps_per_second": 2.579, "eval_wer": 0.21911245587493697, "step": 59200 }, { "epoch": 10.26, "eval_loss": Infinity, "eval_runtime": 547.1932, "eval_samples_per_second": 20.598, "eval_steps_per_second": 2.575, "eval_wer": 0.2226004370482434, "step": 59300 }, { "epoch": 10.27, "eval_loss": Infinity, "eval_runtime": 546.9117, "eval_samples_per_second": 20.608, "eval_steps_per_second": 2.576, "eval_wer": 0.21787275172297865, "step": 59400 }, { "epoch": 10.29, "learning_rate": 9.481502957207468e-05, "loss": 0.0633, "step": 59500 }, { "epoch": 10.29, "eval_loss": Infinity, "eval_runtime": 548.8254, "eval_samples_per_second": 20.537, "eval_steps_per_second": 2.567, "eval_wer": 0.2196902840813582, "step": 59500 }, { "epoch": 10.31, "eval_loss": Infinity, "eval_runtime": 546.9648, "eval_samples_per_second": 20.606, "eval_steps_per_second": 2.576, "eval_wer": 0.22122415532022188, "step": 59600 }, { "epoch": 10.33, "eval_loss": Infinity, "eval_runtime": 545.9902, "eval_samples_per_second": 20.643, "eval_steps_per_second": 2.581, "eval_wer": 0.21917549167927383, "step": 59700 }, { "epoch": 10.34, "eval_loss": Infinity, "eval_runtime": 546.727, "eval_samples_per_second": 20.615, "eval_steps_per_second": 2.577, "eval_wer": 0.21952218860312658, "step": 59800 }, { "epoch": 10.36, "eval_loss": Infinity, "eval_runtime": 547.09, "eval_samples_per_second": 20.602, "eval_steps_per_second": 2.575, "eval_wer": 0.21751554883173643, "step": 59900 }, { "epoch": 10.38, "learning_rate": 9.307549576713439e-05, "loss": 0.0646, "step": 60000 }, { "epoch": 10.38, "eval_loss": Infinity, "eval_runtime": 547.783, "eval_samples_per_second": 20.576, "eval_steps_per_second": 2.572, "eval_wer": 0.21554042696251471, "step": 60000 }, { "epoch": 10.39, "eval_loss": Infinity, "eval_runtime": 552.4006, "eval_samples_per_second": 20.404, "eval_steps_per_second": 2.551, "eval_wer": 0.21595015969070433, "step": 60100 }, { "epoch": 10.41, "eval_loss": Infinity, "eval_runtime": 546.4271, "eval_samples_per_second": 20.627, "eval_steps_per_second": 2.579, "eval_wer": 0.21806185913598924, "step": 60200 }, { "epoch": 10.43, "eval_loss": Infinity, "eval_runtime": 545.6537, "eval_samples_per_second": 20.656, "eval_steps_per_second": 2.582, "eval_wer": 0.21958522440746345, "step": 60300 }, { "epoch": 10.45, "eval_loss": Infinity, "eval_runtime": 546.0782, "eval_samples_per_second": 20.64, "eval_steps_per_second": 2.58, "eval_wer": 0.22041519583123215, "step": 60400 }, { "epoch": 10.46, "learning_rate": 9.133596196219412e-05, "loss": 0.0617, "step": 60500 }, { "epoch": 10.46, "eval_loss": Infinity, "eval_runtime": 549.3529, "eval_samples_per_second": 20.517, "eval_steps_per_second": 2.565, "eval_wer": 0.21913346780971593, "step": 60500 }, { "epoch": 10.48, "eval_loss": Infinity, "eval_runtime": 548.3, "eval_samples_per_second": 20.556, "eval_steps_per_second": 2.57, "eval_wer": 0.22019457051605312, "step": 60600 }, { "epoch": 10.5, "eval_loss": Infinity, "eval_runtime": 547.5552, "eval_samples_per_second": 20.584, "eval_steps_per_second": 2.573, "eval_wer": 0.22350395024373845, "step": 60700 }, { "epoch": 10.52, "eval_loss": Infinity, "eval_runtime": 546.6552, "eval_samples_per_second": 20.618, "eval_steps_per_second": 2.577, "eval_wer": 0.2166540595057993, "step": 60800 }, { "epoch": 10.53, "eval_loss": Infinity, "eval_runtime": 559.9166, "eval_samples_per_second": 20.13, "eval_steps_per_second": 2.516, "eval_wer": 0.2203416540595058, "step": 60900 }, { "epoch": 10.55, "learning_rate": 8.959642815725385e-05, "loss": 0.0662, "step": 61000 }, { "epoch": 10.55, "eval_loss": Infinity, "eval_runtime": 549.9016, "eval_samples_per_second": 20.496, "eval_steps_per_second": 2.562, "eval_wer": 0.21820894267944194, "step": 61000 }, { "epoch": 10.57, "eval_loss": Infinity, "eval_runtime": 549.326, "eval_samples_per_second": 20.518, "eval_steps_per_second": 2.565, "eval_wer": 0.21708480416876785, "step": 61100 }, { "epoch": 10.58, "eval_loss": Infinity, "eval_runtime": 550.9593, "eval_samples_per_second": 20.457, "eval_steps_per_second": 2.557, "eval_wer": 0.2189968902336527, "step": 61200 }, { "epoch": 10.6, "eval_loss": Infinity, "eval_runtime": 548.4716, "eval_samples_per_second": 20.55, "eval_steps_per_second": 2.569, "eval_wer": 0.22214868045049588, "step": 61300 }, { "epoch": 10.62, "eval_loss": Infinity, "eval_runtime": 549.5474, "eval_samples_per_second": 20.51, "eval_steps_per_second": 2.564, "eval_wer": 0.22244284753740123, "step": 61400 }, { "epoch": 10.64, "learning_rate": 8.785689435231357e-05, "loss": 0.0656, "step": 61500 }, { "epoch": 10.64, "eval_loss": Infinity, "eval_runtime": 549.7646, "eval_samples_per_second": 20.502, "eval_steps_per_second": 2.563, "eval_wer": 0.22150781643973777, "step": 61500 }, { "epoch": 10.65, "eval_loss": Infinity, "eval_runtime": 551.0007, "eval_samples_per_second": 20.456, "eval_steps_per_second": 2.557, "eval_wer": 0.21958522440746345, "step": 61600 }, { "epoch": 10.67, "eval_loss": Infinity, "eval_runtime": 551.2483, "eval_samples_per_second": 20.446, "eval_steps_per_second": 2.556, "eval_wer": 0.2200684989073794, "step": 61700 }, { "epoch": 10.69, "eval_loss": Infinity, "eval_runtime": 549.7815, "eval_samples_per_second": 20.501, "eval_steps_per_second": 2.563, "eval_wer": 0.21851361573373676, "step": 61800 }, { "epoch": 10.71, "eval_loss": Infinity, "eval_runtime": 553.4559, "eval_samples_per_second": 20.365, "eval_steps_per_second": 2.546, "eval_wer": 0.2173789712556732, "step": 61900 }, { "epoch": 10.72, "learning_rate": 8.612083961498317e-05, "loss": 0.0636, "step": 62000 }, { "epoch": 10.72, "eval_loss": Infinity, "eval_runtime": 547.7095, "eval_samples_per_second": 20.578, "eval_steps_per_second": 2.573, "eval_wer": 0.21892334846192638, "step": 62000 }, { "epoch": 10.74, "eval_loss": Infinity, "eval_runtime": 547.6345, "eval_samples_per_second": 20.581, "eval_steps_per_second": 2.573, "eval_wer": 0.2205202555051269, "step": 62100 }, { "epoch": 10.76, "eval_loss": Infinity, "eval_runtime": 546.4002, "eval_samples_per_second": 20.628, "eval_steps_per_second": 2.579, "eval_wer": 0.22041519583123215, "step": 62200 }, { "epoch": 10.77, "eval_loss": Infinity, "eval_runtime": 547.84, "eval_samples_per_second": 20.574, "eval_steps_per_second": 2.572, "eval_wer": 0.22165489998319046, "step": 62300 }, { "epoch": 10.79, "eval_loss": Infinity, "eval_runtime": 551.3251, "eval_samples_per_second": 20.443, "eval_steps_per_second": 2.556, "eval_wer": 0.21917549167927383, "step": 62400 }, { "epoch": 10.81, "learning_rate": 8.438826394526265e-05, "loss": 0.0626, "step": 62500 }, { "epoch": 10.81, "eval_loss": Infinity, "eval_runtime": 553.1486, "eval_samples_per_second": 20.376, "eval_steps_per_second": 2.547, "eval_wer": 0.21754706673390486, "step": 62500 }, { "epoch": 10.83, "eval_loss": Infinity, "eval_runtime": 551.2466, "eval_samples_per_second": 20.446, "eval_steps_per_second": 2.556, "eval_wer": 0.2192385274836107, "step": 62600 }, { "epoch": 10.84, "eval_loss": Infinity, "eval_runtime": 545.0806, "eval_samples_per_second": 20.678, "eval_steps_per_second": 2.585, "eval_wer": 0.21865019330979996, "step": 62700 }, { "epoch": 10.86, "eval_loss": Infinity, "eval_runtime": 545.5781, "eval_samples_per_second": 20.659, "eval_steps_per_second": 2.583, "eval_wer": 0.21712682803832578, "step": 62800 }, { "epoch": 10.88, "eval_loss": Infinity, "eval_runtime": 546.2445, "eval_samples_per_second": 20.634, "eval_steps_per_second": 2.579, "eval_wer": 0.2154563792233989, "step": 62900 }, { "epoch": 10.9, "learning_rate": 8.264873014032239e-05, "loss": 0.0641, "step": 63000 }, { "epoch": 10.9, "eval_loss": Infinity, "eval_runtime": 546.3019, "eval_samples_per_second": 20.631, "eval_steps_per_second": 2.579, "eval_wer": 0.21682215498403093, "step": 63000 }, { "epoch": 10.91, "eval_loss": Infinity, "eval_runtime": 546.5842, "eval_samples_per_second": 20.621, "eval_steps_per_second": 2.578, "eval_wer": 0.2183140023533367, "step": 63100 }, { "epoch": 10.93, "eval_loss": Infinity, "eval_runtime": 547.5037, "eval_samples_per_second": 20.586, "eval_steps_per_second": 2.573, "eval_wer": 0.2177151622121365, "step": 63200 }, { "epoch": 10.95, "eval_loss": Infinity, "eval_runtime": 546.2904, "eval_samples_per_second": 20.632, "eval_steps_per_second": 2.579, "eval_wer": 0.2180303412338208, "step": 63300 }, { "epoch": 10.97, "eval_loss": Infinity, "eval_runtime": 546.5707, "eval_samples_per_second": 20.621, "eval_steps_per_second": 2.578, "eval_wer": 0.21799882333165238, "step": 63400 }, { "epoch": 10.98, "learning_rate": 8.090919633538211e-05, "loss": 0.064, "step": 63500 }, { "epoch": 10.98, "eval_loss": Infinity, "eval_runtime": 544.7426, "eval_samples_per_second": 20.691, "eval_steps_per_second": 2.587, "eval_wer": 0.2185871575054631, "step": 63500 }, { "epoch": 11.0, "eval_loss": Infinity, "eval_runtime": 551.0764, "eval_samples_per_second": 20.453, "eval_steps_per_second": 2.557, "eval_wer": 0.21916498571188436, "step": 63600 }, { "epoch": 11.02, "eval_loss": Infinity, "eval_runtime": 548.7516, "eval_samples_per_second": 20.539, "eval_steps_per_second": 2.568, "eval_wer": 0.2194171289292318, "step": 63700 }, { "epoch": 11.03, "eval_loss": Infinity, "eval_runtime": 551.4195, "eval_samples_per_second": 20.44, "eval_steps_per_second": 2.555, "eval_wer": 0.21774668011430492, "step": 63800 }, { "epoch": 11.05, "eval_loss": Infinity, "eval_runtime": 552.4039, "eval_samples_per_second": 20.404, "eval_steps_per_second": 2.551, "eval_wer": 0.21732644141872584, "step": 63900 }, { "epoch": 11.07, "learning_rate": 7.916966253044183e-05, "loss": 0.0571, "step": 64000 }, { "epoch": 11.07, "eval_loss": Infinity, "eval_runtime": 552.3428, "eval_samples_per_second": 20.406, "eval_steps_per_second": 2.551, "eval_wer": 0.21994242729870567, "step": 64000 }, { "epoch": 11.09, "eval_loss": Infinity, "eval_runtime": 550.7081, "eval_samples_per_second": 20.466, "eval_steps_per_second": 2.559, "eval_wer": 0.2176626323751891, "step": 64100 }, { "epoch": 11.1, "eval_loss": Infinity, "eval_runtime": 549.2417, "eval_samples_per_second": 20.521, "eval_steps_per_second": 2.565, "eval_wer": 0.21783072785342075, "step": 64200 }, { "epoch": 11.12, "eval_loss": Infinity, "eval_runtime": 553.1807, "eval_samples_per_second": 20.375, "eval_steps_per_second": 2.547, "eval_wer": 0.21962724827702135, "step": 64300 }, { "epoch": 11.14, "eval_loss": Infinity, "eval_runtime": 548.6438, "eval_samples_per_second": 20.543, "eval_steps_per_second": 2.568, "eval_wer": 0.21541435535384099, "step": 64400 }, { "epoch": 11.16, "learning_rate": 7.743012872550157e-05, "loss": 0.0536, "step": 64500 }, { "epoch": 11.16, "eval_loss": Infinity, "eval_runtime": 551.8385, "eval_samples_per_second": 20.424, "eval_steps_per_second": 2.553, "eval_wer": 0.21403807362581947, "step": 64500 }, { "epoch": 11.17, "eval_loss": Infinity, "eval_runtime": 551.8565, "eval_samples_per_second": 20.424, "eval_steps_per_second": 2.553, "eval_wer": 0.21514120020171457, "step": 64600 }, { "epoch": 11.19, "eval_loss": Infinity, "eval_runtime": 551.0728, "eval_samples_per_second": 20.453, "eval_steps_per_second": 2.557, "eval_wer": 0.21558245083207261, "step": 64700 }, { "epoch": 11.21, "eval_loss": Infinity, "eval_runtime": 550.1479, "eval_samples_per_second": 20.487, "eval_steps_per_second": 2.561, "eval_wer": 0.21810388300554714, "step": 64800 }, { "epoch": 11.22, "eval_loss": Infinity, "eval_runtime": 556.5349, "eval_samples_per_second": 20.252, "eval_steps_per_second": 2.532, "eval_wer": 0.2173369473861153, "step": 64900 }, { "epoch": 11.24, "learning_rate": 7.569059492056128e-05, "loss": 0.0544, "step": 65000 }, { "epoch": 11.24, "eval_loss": Infinity, "eval_runtime": 554.5243, "eval_samples_per_second": 20.326, "eval_steps_per_second": 2.541, "eval_wer": 0.21618129097327282, "step": 65000 }, { "epoch": 11.26, "eval_loss": Infinity, "eval_runtime": 553.3737, "eval_samples_per_second": 20.368, "eval_steps_per_second": 2.546, "eval_wer": 0.2145738779626828, "step": 65100 }, { "epoch": 11.28, "eval_loss": Infinity, "eval_runtime": 553.6751, "eval_samples_per_second": 20.357, "eval_steps_per_second": 2.545, "eval_wer": 0.22014204067910573, "step": 65200 }, { "epoch": 11.29, "eval_loss": Infinity, "eval_runtime": 548.8824, "eval_samples_per_second": 20.534, "eval_steps_per_second": 2.567, "eval_wer": 0.21588712388636747, "step": 65300 }, { "epoch": 11.31, "eval_loss": Infinity, "eval_runtime": 554.3172, "eval_samples_per_second": 20.333, "eval_steps_per_second": 2.542, "eval_wer": 0.2159081358211464, "step": 65400 }, { "epoch": 11.33, "learning_rate": 7.395454018323089e-05, "loss": 0.0546, "step": 65500 }, { "epoch": 11.33, "eval_loss": Infinity, "eval_runtime": 548.0012, "eval_samples_per_second": 20.567, "eval_steps_per_second": 2.571, "eval_wer": 0.21578206421247267, "step": 65500 }, { "epoch": 11.35, "eval_loss": Infinity, "eval_runtime": 546.2415, "eval_samples_per_second": 20.634, "eval_steps_per_second": 2.579, "eval_wer": 0.21603420742982013, "step": 65600 }, { "epoch": 11.36, "eval_loss": Infinity, "eval_runtime": 549.3565, "eval_samples_per_second": 20.517, "eval_steps_per_second": 2.565, "eval_wer": 0.21724239367961, "step": 65700 }, { "epoch": 11.38, "eval_loss": Infinity, "eval_runtime": 547.895, "eval_samples_per_second": 20.571, "eval_steps_per_second": 2.572, "eval_wer": 0.21695873256009413, "step": 65800 }, { "epoch": 11.4, "eval_loss": Infinity, "eval_runtime": 549.1149, "eval_samples_per_second": 20.526, "eval_steps_per_second": 2.566, "eval_wer": 0.216097243234157, "step": 65900 }, { "epoch": 11.41, "learning_rate": 7.221500637829061e-05, "loss": 0.0545, "step": 66000 }, { "epoch": 11.41, "eval_loss": Infinity, "eval_runtime": 557.4232, "eval_samples_per_second": 20.22, "eval_steps_per_second": 2.528, "eval_wer": 0.21853462766851572, "step": 66000 }, { "epoch": 11.43, "eval_loss": Infinity, "eval_runtime": 551.3783, "eval_samples_per_second": 20.442, "eval_steps_per_second": 2.555, "eval_wer": 0.2169377206253152, "step": 66100 }, { "epoch": 11.45, "eval_loss": Infinity, "eval_runtime": 548.1583, "eval_samples_per_second": 20.562, "eval_steps_per_second": 2.57, "eval_wer": 0.21663304757102034, "step": 66200 }, { "epoch": 11.47, "eval_loss": Infinity, "eval_runtime": 549.1862, "eval_samples_per_second": 20.523, "eval_steps_per_second": 2.566, "eval_wer": 0.21433224071272483, "step": 66300 }, { "epoch": 11.48, "eval_loss": Infinity, "eval_runtime": 547.0477, "eval_samples_per_second": 20.603, "eval_steps_per_second": 2.576, "eval_wer": 0.2137964363758615, "step": 66400 }, { "epoch": 11.5, "learning_rate": 7.047547257335033e-05, "loss": 0.0539, "step": 66500 }, { "epoch": 11.5, "eval_loss": Infinity, "eval_runtime": 545.649, "eval_samples_per_second": 20.656, "eval_steps_per_second": 2.582, "eval_wer": 0.21467893763657758, "step": 66500 }, { "epoch": 11.52, "eval_loss": Infinity, "eval_runtime": 545.0721, "eval_samples_per_second": 20.678, "eval_steps_per_second": 2.585, "eval_wer": 0.2143532526475038, "step": 66600 }, { "epoch": 11.54, "eval_loss": Infinity, "eval_runtime": 546.699, "eval_samples_per_second": 20.616, "eval_steps_per_second": 2.577, "eval_wer": 0.21421667507144057, "step": 66700 }, { "epoch": 11.55, "eval_loss": Infinity, "eval_runtime": 547.5775, "eval_samples_per_second": 20.583, "eval_steps_per_second": 2.573, "eval_wer": 0.2140590855605984, "step": 66800 }, { "epoch": 11.57, "eval_loss": Infinity, "eval_runtime": 546.57, "eval_samples_per_second": 20.621, "eval_steps_per_second": 2.578, "eval_wer": 0.2135547991259035, "step": 66900 }, { "epoch": 11.59, "learning_rate": 6.873593876841007e-05, "loss": 0.0545, "step": 67000 }, { "epoch": 11.59, "eval_loss": Infinity, "eval_runtime": 546.0529, "eval_samples_per_second": 20.641, "eval_steps_per_second": 2.58, "eval_wer": 0.21575054631030424, "step": 67000 }, { "epoch": 11.6, "eval_loss": Infinity, "eval_runtime": 546.2996, "eval_samples_per_second": 20.632, "eval_steps_per_second": 2.579, "eval_wer": 0.21779920995125232, "step": 67100 }, { "epoch": 11.62, "eval_loss": Infinity, "eval_runtime": 546.7915, "eval_samples_per_second": 20.613, "eval_steps_per_second": 2.577, "eval_wer": 0.21658051773407294, "step": 67200 }, { "epoch": 11.64, "eval_loss": Infinity, "eval_runtime": 545.549, "eval_samples_per_second": 20.66, "eval_steps_per_second": 2.583, "eval_wer": 0.21400655572365104, "step": 67300 }, { "epoch": 11.66, "eval_loss": Infinity, "eval_runtime": 546.7529, "eval_samples_per_second": 20.614, "eval_steps_per_second": 2.577, "eval_wer": 0.21427971087577743, "step": 67400 }, { "epoch": 11.67, "learning_rate": 6.699640496346979e-05, "loss": 0.0538, "step": 67500 }, { "epoch": 11.67, "eval_loss": Infinity, "eval_runtime": 548.0068, "eval_samples_per_second": 20.567, "eval_steps_per_second": 2.571, "eval_wer": 0.21409060346276684, "step": 67500 }, { "epoch": 11.69, "eval_loss": Infinity, "eval_runtime": 545.7442, "eval_samples_per_second": 20.653, "eval_steps_per_second": 2.582, "eval_wer": 0.21662254160363087, "step": 67600 }, { "epoch": 11.71, "eval_loss": Infinity, "eval_runtime": 548.6181, "eval_samples_per_second": 20.544, "eval_steps_per_second": 2.568, "eval_wer": 0.21437426458228273, "step": 67700 }, { "epoch": 11.73, "eval_loss": Infinity, "eval_runtime": 544.7509, "eval_samples_per_second": 20.69, "eval_steps_per_second": 2.587, "eval_wer": 0.21205244578920826, "step": 67800 }, { "epoch": 11.74, "eval_loss": Infinity, "eval_runtime": 545.7434, "eval_samples_per_second": 20.653, "eval_steps_per_second": 2.582, "eval_wer": 0.21325012607160868, "step": 67900 }, { "epoch": 11.76, "learning_rate": 6.525687115852951e-05, "loss": 0.0529, "step": 68000 }, { "epoch": 11.76, "eval_loss": Infinity, "eval_runtime": 545.6556, "eval_samples_per_second": 20.656, "eval_steps_per_second": 2.582, "eval_wer": 0.2136073289628509, "step": 68000 }, { "epoch": 11.78, "eval_loss": Infinity, "eval_runtime": 545.981, "eval_samples_per_second": 20.644, "eval_steps_per_second": 2.581, "eval_wer": 0.21634938645150445, "step": 68100 }, { "epoch": 11.8, "eval_loss": Infinity, "eval_runtime": 544.2745, "eval_samples_per_second": 20.708, "eval_steps_per_second": 2.589, "eval_wer": 0.21389099008236678, "step": 68200 }, { "epoch": 11.81, "eval_loss": Infinity, "eval_runtime": 544.5409, "eval_samples_per_second": 20.698, "eval_steps_per_second": 2.588, "eval_wer": 0.21302950075642965, "step": 68300 }, { "epoch": 11.83, "eval_loss": Infinity, "eval_runtime": 546.1049, "eval_samples_per_second": 20.639, "eval_steps_per_second": 2.58, "eval_wer": 0.21082324760463944, "step": 68400 }, { "epoch": 11.85, "learning_rate": 6.351733735358923e-05, "loss": 0.0528, "step": 68500 }, { "epoch": 11.85, "eval_loss": Infinity, "eval_runtime": 546.5201, "eval_samples_per_second": 20.623, "eval_steps_per_second": 2.578, "eval_wer": 0.2115691712892923, "step": 68500 }, { "epoch": 11.86, "eval_loss": Infinity, "eval_runtime": 546.1767, "eval_samples_per_second": 20.636, "eval_steps_per_second": 2.58, "eval_wer": 0.21026643133299713, "step": 68600 }, { "epoch": 11.88, "eval_loss": Infinity, "eval_runtime": 548.1438, "eval_samples_per_second": 20.562, "eval_steps_per_second": 2.57, "eval_wer": 0.21120146243066062, "step": 68700 }, { "epoch": 11.9, "eval_loss": Infinity, "eval_runtime": 545.8375, "eval_samples_per_second": 20.649, "eval_steps_per_second": 2.581, "eval_wer": 0.212399142713061, "step": 68800 }, { "epoch": 11.92, "eval_loss": Infinity, "eval_runtime": 559.1437, "eval_samples_per_second": 20.158, "eval_steps_per_second": 2.52, "eval_wer": 0.21138006387628172, "step": 68900 }, { "epoch": 11.93, "learning_rate": 6.177780354864895e-05, "loss": 0.0523, "step": 69000 }, { "epoch": 11.93, "eval_loss": Infinity, "eval_runtime": 547.1977, "eval_samples_per_second": 20.598, "eval_steps_per_second": 2.575, "eval_wer": 0.21378593040847202, "step": 69000 }, { "epoch": 11.95, "eval_loss": Infinity, "eval_runtime": 546.6331, "eval_samples_per_second": 20.619, "eval_steps_per_second": 2.578, "eval_wer": 0.2135232812237351, "step": 69100 }, { "epoch": 11.97, "eval_loss": Infinity, "eval_runtime": 546.1655, "eval_samples_per_second": 20.637, "eval_steps_per_second": 2.58, "eval_wer": 0.21153765338712388, "step": 69200 }, { "epoch": 11.99, "eval_loss": Infinity, "eval_runtime": 546.7795, "eval_samples_per_second": 20.613, "eval_steps_per_second": 2.577, "eval_wer": 0.21012985375693394, "step": 69300 }, { "epoch": 12.0, "eval_loss": Infinity, "eval_runtime": 546.9894, "eval_samples_per_second": 20.606, "eval_steps_per_second": 2.576, "eval_wer": 0.21049756261556565, "step": 69400 }, { "epoch": 12.02, "learning_rate": 6.003826974370868e-05, "loss": 0.052, "step": 69500 }, { "epoch": 12.02, "eval_loss": Infinity, "eval_runtime": 546.4107, "eval_samples_per_second": 20.627, "eval_steps_per_second": 2.579, "eval_wer": 0.21161119515885024, "step": 69500 }, { "epoch": 12.04, "eval_loss": Infinity, "eval_runtime": 547.49, "eval_samples_per_second": 20.587, "eval_steps_per_second": 2.574, "eval_wer": 0.21267229786518743, "step": 69600 }, { "epoch": 12.05, "eval_loss": Infinity, "eval_runtime": 549.2968, "eval_samples_per_second": 20.519, "eval_steps_per_second": 2.565, "eval_wer": 0.21150613548495545, "step": 69700 }, { "epoch": 12.07, "eval_loss": Infinity, "eval_runtime": 550.0198, "eval_samples_per_second": 20.492, "eval_steps_per_second": 2.562, "eval_wer": 0.20942595394183897, "step": 69800 }, { "epoch": 12.09, "eval_loss": Infinity, "eval_runtime": 549.2856, "eval_samples_per_second": 20.519, "eval_steps_per_second": 2.565, "eval_wer": 0.21057110438729199, "step": 69900 }, { "epoch": 12.11, "learning_rate": 5.830569407398817e-05, "loss": 0.0499, "step": 70000 }, { "epoch": 12.11, "eval_loss": Infinity, "eval_runtime": 547.589, "eval_samples_per_second": 20.583, "eval_steps_per_second": 2.573, "eval_wer": 0.2110753908219869, "step": 70000 }, { "epoch": 12.12, "eval_loss": Infinity, "eval_runtime": 548.5834, "eval_samples_per_second": 20.546, "eval_steps_per_second": 2.568, "eval_wer": 0.21128551016977642, "step": 70100 }, { "epoch": 12.14, "eval_loss": Infinity, "eval_runtime": 547.8589, "eval_samples_per_second": 20.573, "eval_steps_per_second": 2.572, "eval_wer": 0.21247268448478737, "step": 70200 }, { "epoch": 12.16, "eval_loss": Infinity, "eval_runtime": 547.6862, "eval_samples_per_second": 20.579, "eval_steps_per_second": 2.573, "eval_wer": 0.21007732391998654, "step": 70300 }, { "epoch": 12.18, "eval_loss": Infinity, "eval_runtime": 548.8788, "eval_samples_per_second": 20.535, "eval_steps_per_second": 2.567, "eval_wer": 0.21147461758278702, "step": 70400 }, { "epoch": 12.19, "learning_rate": 5.656616026904789e-05, "loss": 0.0466, "step": 70500 }, { "epoch": 12.19, "eval_loss": Infinity, "eval_runtime": 547.2229, "eval_samples_per_second": 20.597, "eval_steps_per_second": 2.575, "eval_wer": 0.2119053622457556, "step": 70500 }, { "epoch": 12.21, "eval_loss": Infinity, "eval_runtime": 545.9416, "eval_samples_per_second": 20.645, "eval_steps_per_second": 2.581, "eval_wer": 0.21017187762649184, "step": 70600 }, { "epoch": 12.23, "eval_loss": Infinity, "eval_runtime": 546.221, "eval_samples_per_second": 20.635, "eval_steps_per_second": 2.58, "eval_wer": 0.21210497562615566, "step": 70700 }, { "epoch": 12.24, "eval_loss": Infinity, "eval_runtime": 546.0324, "eval_samples_per_second": 20.642, "eval_steps_per_second": 2.58, "eval_wer": 0.20912128088754411, "step": 70800 }, { "epoch": 12.26, "eval_loss": Infinity, "eval_runtime": 550.3946, "eval_samples_per_second": 20.478, "eval_steps_per_second": 2.56, "eval_wer": 0.20918431669188098, "step": 70900 }, { "epoch": 12.28, "learning_rate": 5.482662646410761e-05, "loss": 0.0475, "step": 71000 }, { "epoch": 12.28, "eval_loss": Infinity, "eval_runtime": 550.7521, "eval_samples_per_second": 20.465, "eval_steps_per_second": 2.558, "eval_wer": 0.21018238359388133, "step": 71000 }, { "epoch": 12.3, "eval_loss": Infinity, "eval_runtime": 549.8286, "eval_samples_per_second": 20.499, "eval_steps_per_second": 2.563, "eval_wer": 0.20944696587661793, "step": 71100 }, { "epoch": 12.31, "eval_loss": Infinity, "eval_runtime": 550.14, "eval_samples_per_second": 20.488, "eval_steps_per_second": 2.561, "eval_wer": 0.20863800638762817, "step": 71200 }, { "epoch": 12.33, "eval_loss": Infinity, "eval_runtime": 546.3515, "eval_samples_per_second": 20.63, "eval_steps_per_second": 2.579, "eval_wer": 0.20678895612708018, "step": 71300 }, { "epoch": 12.35, "eval_loss": Infinity, "eval_runtime": 546.7793, "eval_samples_per_second": 20.613, "eval_steps_per_second": 2.577, "eval_wer": 0.20771348125735417, "step": 71400 }, { "epoch": 12.37, "learning_rate": 5.3087092659167335e-05, "loss": 0.0433, "step": 71500 }, { "epoch": 12.37, "eval_loss": Infinity, "eval_runtime": 548.6341, "eval_samples_per_second": 20.544, "eval_steps_per_second": 2.568, "eval_wer": 0.20904773911581778, "step": 71500 }, { "epoch": 12.38, "eval_loss": Infinity, "eval_runtime": 548.8543, "eval_samples_per_second": 20.536, "eval_steps_per_second": 2.567, "eval_wer": 0.20905824508320725, "step": 71600 }, { "epoch": 12.4, "eval_loss": Infinity, "eval_runtime": 547.0279, "eval_samples_per_second": 20.604, "eval_steps_per_second": 2.576, "eval_wer": 0.21201042191965036, "step": 71700 }, { "epoch": 12.42, "eval_loss": Infinity, "eval_runtime": 546.0371, "eval_samples_per_second": 20.641, "eval_steps_per_second": 2.58, "eval_wer": 0.20892166750714405, "step": 71800 }, { "epoch": 12.44, "eval_loss": Infinity, "eval_runtime": 546.5248, "eval_samples_per_second": 20.623, "eval_steps_per_second": 2.578, "eval_wer": 0.20953101361573373, "step": 71900 }, { "epoch": 12.45, "learning_rate": 5.1347558854227064e-05, "loss": 0.0457, "step": 72000 }, { "epoch": 12.45, "eval_loss": Infinity, "eval_runtime": 547.1024, "eval_samples_per_second": 20.601, "eval_steps_per_second": 2.575, "eval_wer": 0.20903723314842831, "step": 72000 }, { "epoch": 12.47, "eval_loss": Infinity, "eval_runtime": 546.2064, "eval_samples_per_second": 20.635, "eval_steps_per_second": 2.58, "eval_wer": 0.20880610186585982, "step": 72100 }, { "epoch": 12.49, "eval_loss": Infinity, "eval_runtime": 545.9585, "eval_samples_per_second": 20.644, "eval_steps_per_second": 2.581, "eval_wer": 0.20800764834425953, "step": 72200 }, { "epoch": 12.5, "eval_loss": Infinity, "eval_runtime": 546.2479, "eval_samples_per_second": 20.633, "eval_steps_per_second": 2.579, "eval_wer": 0.20662086064884855, "step": 72300 }, { "epoch": 12.52, "eval_loss": Infinity, "eval_runtime": 550.549, "eval_samples_per_second": 20.472, "eval_steps_per_second": 2.559, "eval_wer": 0.20978315683308119, "step": 72400 }, { "epoch": 12.54, "learning_rate": 4.961150411689667e-05, "loss": 0.0446, "step": 72500 }, { "epoch": 12.54, "eval_loss": Infinity, "eval_runtime": 549.0154, "eval_samples_per_second": 20.529, "eval_steps_per_second": 2.566, "eval_wer": 0.20758740964868044, "step": 72500 }, { "epoch": 12.56, "eval_loss": Infinity, "eval_runtime": 547.3815, "eval_samples_per_second": 20.591, "eval_steps_per_second": 2.574, "eval_wer": 0.20679946209446967, "step": 72600 }, { "epoch": 12.57, "eval_loss": Infinity, "eval_runtime": 547.8075, "eval_samples_per_second": 20.575, "eval_steps_per_second": 2.572, "eval_wer": 0.20801815431164902, "step": 72700 }, { "epoch": 12.59, "eval_loss": Infinity, "eval_runtime": 546.6072, "eval_samples_per_second": 20.62, "eval_steps_per_second": 2.578, "eval_wer": 0.21288241721297696, "step": 72800 }, { "epoch": 12.61, "eval_loss": Infinity, "eval_runtime": 550.7128, "eval_samples_per_second": 20.466, "eval_steps_per_second": 2.559, "eval_wer": 0.21161119515885024, "step": 72900 }, { "epoch": 12.63, "learning_rate": 4.787197031195639e-05, "loss": 0.0423, "step": 73000 }, { "epoch": 12.63, "eval_loss": Infinity, "eval_runtime": 547.9244, "eval_samples_per_second": 20.57, "eval_steps_per_second": 2.572, "eval_wer": 0.210791729702471, "step": 73000 }, { "epoch": 12.64, "eval_loss": Infinity, "eval_runtime": 546.7393, "eval_samples_per_second": 20.615, "eval_steps_per_second": 2.577, "eval_wer": 0.20828080349638595, "step": 73100 }, { "epoch": 12.66, "eval_loss": Infinity, "eval_runtime": 549.7708, "eval_samples_per_second": 20.501, "eval_steps_per_second": 2.563, "eval_wer": 0.20792360060514373, "step": 73200 }, { "epoch": 12.68, "eval_loss": Infinity, "eval_runtime": 548.6428, "eval_samples_per_second": 20.543, "eval_steps_per_second": 2.568, "eval_wer": 0.2072932425617751, "step": 73300 }, { "epoch": 12.69, "eval_loss": Infinity, "eval_runtime": 559.0002, "eval_samples_per_second": 20.163, "eval_steps_per_second": 2.521, "eval_wer": 0.20738779626828038, "step": 73400 }, { "epoch": 12.71, "learning_rate": 4.613243650701612e-05, "loss": 0.0443, "step": 73500 }, { "epoch": 12.71, "eval_loss": Infinity, "eval_runtime": 545.8124, "eval_samples_per_second": 20.65, "eval_steps_per_second": 2.581, "eval_wer": 0.20659984871406958, "step": 73500 }, { "epoch": 12.73, "eval_loss": Infinity, "eval_runtime": 549.5227, "eval_samples_per_second": 20.511, "eval_steps_per_second": 2.564, "eval_wer": 0.2069570516053118, "step": 73600 }, { "epoch": 12.75, "eval_loss": Infinity, "eval_runtime": 547.0702, "eval_samples_per_second": 20.602, "eval_steps_per_second": 2.576, "eval_wer": 0.20542318036644813, "step": 73700 }, { "epoch": 12.76, "eval_loss": Infinity, "eval_runtime": 548.2885, "eval_samples_per_second": 20.557, "eval_steps_per_second": 2.57, "eval_wer": 0.20436207766011094, "step": 73800 }, { "epoch": 12.78, "eval_loss": Infinity, "eval_runtime": 548.5659, "eval_samples_per_second": 20.546, "eval_steps_per_second": 2.569, "eval_wer": 0.20449865523617414, "step": 73900 }, { "epoch": 12.8, "learning_rate": 4.439290270207584e-05, "loss": 0.0431, "step": 74000 }, { "epoch": 12.8, "eval_loss": Infinity, "eval_runtime": 548.4023, "eval_samples_per_second": 20.552, "eval_steps_per_second": 2.569, "eval_wer": 0.20554925197512186, "step": 74000 }, { "epoch": 12.82, "eval_loss": Infinity, "eval_runtime": 550.149, "eval_samples_per_second": 20.487, "eval_steps_per_second": 2.561, "eval_wer": 0.205486216170785, "step": 74100 }, { "epoch": 12.83, "eval_loss": Infinity, "eval_runtime": 547.5824, "eval_samples_per_second": 20.583, "eval_steps_per_second": 2.573, "eval_wer": 0.20856446461590183, "step": 74200 }, { "epoch": 12.85, "eval_loss": Infinity, "eval_runtime": 546.9058, "eval_samples_per_second": 20.609, "eval_steps_per_second": 2.576, "eval_wer": 0.20840687510505967, "step": 74300 }, { "epoch": 12.87, "eval_loss": Infinity, "eval_runtime": 547.6274, "eval_samples_per_second": 20.582, "eval_steps_per_second": 2.573, "eval_wer": 0.2061270801815431, "step": 74400 }, { "epoch": 12.88, "learning_rate": 4.265336889713556e-05, "loss": 0.045, "step": 74500 }, { "epoch": 12.88, "eval_loss": Infinity, "eval_runtime": 548.5153, "eval_samples_per_second": 20.548, "eval_steps_per_second": 2.569, "eval_wer": 0.20694654563792234, "step": 74500 }, { "epoch": 12.9, "eval_loss": Infinity, "eval_runtime": 548.6672, "eval_samples_per_second": 20.543, "eval_steps_per_second": 2.568, "eval_wer": 0.20734577239872248, "step": 74600 }, { "epoch": 12.92, "eval_loss": Infinity, "eval_runtime": 552.9233, "eval_samples_per_second": 20.384, "eval_steps_per_second": 2.548, "eval_wer": 0.20574886535552195, "step": 74700 }, { "epoch": 12.94, "eval_loss": Infinity, "eval_runtime": 550.6342, "eval_samples_per_second": 20.469, "eval_steps_per_second": 2.559, "eval_wer": 0.20813371995293325, "step": 74800 }, { "epoch": 12.95, "eval_loss": Infinity, "eval_runtime": 546.873, "eval_samples_per_second": 20.61, "eval_steps_per_second": 2.576, "eval_wer": 0.205948478735922, "step": 74900 }, { "epoch": 12.97, "learning_rate": 4.091731415980517e-05, "loss": 0.0434, "step": 75000 }, { "epoch": 12.97, "eval_loss": Infinity, "eval_runtime": 547.6534, "eval_samples_per_second": 20.581, "eval_steps_per_second": 2.573, "eval_wer": 0.20497142376870062, "step": 75000 }, { "epoch": 12.99, "eval_loss": Infinity, "eval_runtime": 547.905, "eval_samples_per_second": 20.571, "eval_steps_per_second": 2.572, "eval_wer": 0.2041939821818793, "step": 75100 }, { "epoch": 13.01, "eval_loss": Infinity, "eval_runtime": 546.051, "eval_samples_per_second": 20.641, "eval_steps_per_second": 2.58, "eval_wer": 0.20416246427971088, "step": 75200 }, { "epoch": 13.02, "eval_loss": Infinity, "eval_runtime": 548.0237, "eval_samples_per_second": 20.567, "eval_steps_per_second": 2.571, "eval_wer": 0.20353210623634224, "step": 75300 }, { "epoch": 13.04, "eval_loss": Infinity, "eval_runtime": 547.0355, "eval_samples_per_second": 20.604, "eval_steps_per_second": 2.576, "eval_wer": 0.20444612539922677, "step": 75400 }, { "epoch": 13.06, "learning_rate": 3.9177780354864895e-05, "loss": 0.0388, "step": 75500 }, { "epoch": 13.06, "eval_loss": Infinity, "eval_runtime": 547.6747, "eval_samples_per_second": 20.58, "eval_steps_per_second": 2.573, "eval_wer": 0.2026285930408472, "step": 75500 }, { "epoch": 13.08, "eval_loss": Infinity, "eval_runtime": 549.5817, "eval_samples_per_second": 20.508, "eval_steps_per_second": 2.564, "eval_wer": 0.20371070768196337, "step": 75600 }, { "epoch": 13.09, "eval_loss": Infinity, "eval_runtime": 549.0065, "eval_samples_per_second": 20.53, "eval_steps_per_second": 2.566, "eval_wer": 0.20430954782316355, "step": 75700 }, { "epoch": 13.11, "eval_loss": Infinity, "eval_runtime": 547.8794, "eval_samples_per_second": 20.572, "eval_steps_per_second": 2.572, "eval_wer": 0.20384728525802656, "step": 75800 }, { "epoch": 13.13, "eval_loss": Infinity, "eval_runtime": 548.5189, "eval_samples_per_second": 20.548, "eval_steps_per_second": 2.569, "eval_wer": 0.20399436880147925, "step": 75900 }, { "epoch": 13.14, "learning_rate": 3.743824654992462e-05, "loss": 0.0391, "step": 76000 }, { "epoch": 13.14, "eval_loss": Infinity, "eval_runtime": 547.8529, "eval_samples_per_second": 20.573, "eval_steps_per_second": 2.572, "eval_wer": 0.20545469826861656, "step": 76000 }, { "epoch": 13.16, "eval_loss": Infinity, "eval_runtime": 547.706, "eval_samples_per_second": 20.579, "eval_steps_per_second": 2.573, "eval_wer": 0.2059064548663641, "step": 76100 }, { "epoch": 13.18, "eval_loss": Infinity, "eval_runtime": 546.7268, "eval_samples_per_second": 20.615, "eval_steps_per_second": 2.577, "eval_wer": 0.20568582955118508, "step": 76200 }, { "epoch": 13.2, "eval_loss": Infinity, "eval_runtime": 545.8487, "eval_samples_per_second": 20.649, "eval_steps_per_second": 2.581, "eval_wer": 0.20443561943183727, "step": 76300 }, { "epoch": 13.21, "eval_loss": Infinity, "eval_runtime": 546.5302, "eval_samples_per_second": 20.623, "eval_steps_per_second": 2.578, "eval_wer": 0.20482434022524795, "step": 76400 }, { "epoch": 13.23, "learning_rate": 3.569871274498434e-05, "loss": 0.0416, "step": 76500 }, { "epoch": 13.23, "eval_loss": Infinity, "eval_runtime": 548.7117, "eval_samples_per_second": 20.541, "eval_steps_per_second": 2.568, "eval_wer": 0.20413094637754245, "step": 76500 }, { "epoch": 13.25, "eval_loss": Infinity, "eval_runtime": 548.0591, "eval_samples_per_second": 20.565, "eval_steps_per_second": 2.571, "eval_wer": 0.2031328794755421, "step": 76600 }, { "epoch": 13.27, "eval_loss": Infinity, "eval_runtime": 547.9137, "eval_samples_per_second": 20.571, "eval_steps_per_second": 2.572, "eval_wer": 0.20347957639939485, "step": 76700 }, { "epoch": 13.28, "eval_loss": Infinity, "eval_runtime": 547.587, "eval_samples_per_second": 20.583, "eval_steps_per_second": 2.573, "eval_wer": 0.2036476718776265, "step": 76800 }, { "epoch": 13.3, "eval_loss": Infinity, "eval_runtime": 547.4785, "eval_samples_per_second": 20.587, "eval_steps_per_second": 2.574, "eval_wer": 0.20268112287779458, "step": 76900 }, { "epoch": 13.32, "learning_rate": 3.395917894004407e-05, "loss": 0.0387, "step": 77000 }, { "epoch": 13.32, "eval_loss": Infinity, "eval_runtime": 546.9031, "eval_samples_per_second": 20.609, "eval_steps_per_second": 2.576, "eval_wer": 0.20260758110606825, "step": 77000 }, { "epoch": 13.33, "eval_loss": Infinity, "eval_runtime": 550.3877, "eval_samples_per_second": 20.478, "eval_steps_per_second": 2.56, "eval_wer": 0.20273365271474197, "step": 77100 }, { "epoch": 13.35, "eval_loss": Infinity, "eval_runtime": 548.8206, "eval_samples_per_second": 20.537, "eval_steps_per_second": 2.567, "eval_wer": 0.20204025886703647, "step": 77200 }, { "epoch": 13.37, "eval_loss": Infinity, "eval_runtime": 547.3966, "eval_samples_per_second": 20.59, "eval_steps_per_second": 2.574, "eval_wer": 0.2015254664649521, "step": 77300 }, { "epoch": 13.39, "eval_loss": Infinity, "eval_runtime": 547.7422, "eval_samples_per_second": 20.577, "eval_steps_per_second": 2.572, "eval_wer": 0.20210329467137333, "step": 77400 }, { "epoch": 13.4, "learning_rate": 3.221964513510379e-05, "loss": 0.0388, "step": 77500 }, { "epoch": 13.4, "eval_loss": Infinity, "eval_runtime": 548.8405, "eval_samples_per_second": 20.536, "eval_steps_per_second": 2.567, "eval_wer": 0.20255505126912085, "step": 77500 }, { "epoch": 13.42, "eval_loss": Infinity, "eval_runtime": 547.5989, "eval_samples_per_second": 20.583, "eval_steps_per_second": 2.573, "eval_wer": 0.20247100353000505, "step": 77600 }, { "epoch": 13.44, "eval_loss": Infinity, "eval_runtime": 549.3386, "eval_samples_per_second": 20.517, "eval_steps_per_second": 2.565, "eval_wer": 0.20259707513867878, "step": 77700 }, { "epoch": 13.46, "eval_loss": Infinity, "eval_runtime": 548.9936, "eval_samples_per_second": 20.53, "eval_steps_per_second": 2.567, "eval_wer": 0.20168305597579425, "step": 77800 }, { "epoch": 13.47, "eval_loss": Infinity, "eval_runtime": 547.7403, "eval_samples_per_second": 20.577, "eval_steps_per_second": 2.572, "eval_wer": 0.20236594385611026, "step": 77900 }, { "epoch": 13.49, "learning_rate": 3.0480111330163512e-05, "loss": 0.0393, "step": 78000 }, { "epoch": 13.49, "eval_loss": Infinity, "eval_runtime": 546.9778, "eval_samples_per_second": 20.606, "eval_steps_per_second": 2.576, "eval_wer": 0.20218734241048916, "step": 78000 }, { "epoch": 13.51, "eval_loss": Infinity, "eval_runtime": 547.4243, "eval_samples_per_second": 20.589, "eval_steps_per_second": 2.574, "eval_wer": 0.2026706169104051, "step": 78100 }, { "epoch": 13.52, "eval_loss": Infinity, "eval_runtime": 547.4439, "eval_samples_per_second": 20.588, "eval_steps_per_second": 2.574, "eval_wer": 0.20266011094301564, "step": 78200 }, { "epoch": 13.54, "eval_loss": Infinity, "eval_runtime": 548.5146, "eval_samples_per_second": 20.548, "eval_steps_per_second": 2.569, "eval_wer": 0.20126281728021517, "step": 78300 }, { "epoch": 13.56, "eval_loss": Infinity, "eval_runtime": 548.6545, "eval_samples_per_second": 20.543, "eval_steps_per_second": 2.568, "eval_wer": 0.201105227769373, "step": 78400 }, { "epoch": 13.58, "learning_rate": 2.8744056592833116e-05, "loss": 0.0389, "step": 78500 }, { "epoch": 13.58, "eval_loss": Infinity, "eval_runtime": 548.7215, "eval_samples_per_second": 20.54, "eval_steps_per_second": 2.568, "eval_wer": 0.20085308455202555, "step": 78500 }, { "epoch": 13.59, "eval_loss": Infinity, "eval_runtime": 549.8062, "eval_samples_per_second": 20.5, "eval_steps_per_second": 2.563, "eval_wer": 0.20089510842158345, "step": 78600 }, { "epoch": 13.61, "eval_loss": Infinity, "eval_runtime": 588.3973, "eval_samples_per_second": 19.155, "eval_steps_per_second": 2.395, "eval_wer": 0.20059043536728863, "step": 78700 }, { "epoch": 13.63, "eval_loss": Infinity, "eval_runtime": 552.7964, "eval_samples_per_second": 20.389, "eval_steps_per_second": 2.549, "eval_wer": 0.20140990082366783, "step": 78800 }, { "epoch": 13.65, "eval_loss": Infinity, "eval_runtime": 550.5531, "eval_samples_per_second": 20.472, "eval_steps_per_second": 2.559, "eval_wer": 0.20086359051941502, "step": 78900 }, { "epoch": 13.66, "learning_rate": 2.700452278789284e-05, "loss": 0.0413, "step": 79000 }, { "epoch": 13.66, "eval_loss": Infinity, "eval_runtime": 549.8536, "eval_samples_per_second": 20.498, "eval_steps_per_second": 2.563, "eval_wer": 0.20187216338880484, "step": 79000 }, { "epoch": 13.68, "eval_loss": Infinity, "eval_runtime": 550.6749, "eval_samples_per_second": 20.468, "eval_steps_per_second": 2.559, "eval_wer": 0.20218734241048916, "step": 79100 }, { "epoch": 13.7, "eval_loss": Infinity, "eval_runtime": 551.1265, "eval_samples_per_second": 20.451, "eval_steps_per_second": 2.557, "eval_wer": 0.20192469322575224, "step": 79200 }, { "epoch": 13.71, "eval_loss": Infinity, "eval_runtime": 548.06, "eval_samples_per_second": 20.565, "eval_steps_per_second": 2.571, "eval_wer": 0.20288073625819467, "step": 79300 }, { "epoch": 13.73, "eval_loss": Infinity, "eval_runtime": 549.0029, "eval_samples_per_second": 20.53, "eval_steps_per_second": 2.566, "eval_wer": 0.20201924693225753, "step": 79400 }, { "epoch": 13.75, "learning_rate": 2.5264988982952567e-05, "loss": 0.0384, "step": 79500 }, { "epoch": 13.75, "eval_loss": Infinity, "eval_runtime": 547.9777, "eval_samples_per_second": 20.568, "eval_steps_per_second": 2.571, "eval_wer": 0.20127332324760464, "step": 79500 }, { "epoch": 13.77, "eval_loss": Infinity, "eval_runtime": 549.5908, "eval_samples_per_second": 20.508, "eval_steps_per_second": 2.564, "eval_wer": 0.2008320726172466, "step": 79600 }, { "epoch": 13.78, "eval_loss": Infinity, "eval_runtime": 550.7209, "eval_samples_per_second": 20.466, "eval_steps_per_second": 2.558, "eval_wer": 0.20131534711716254, "step": 79700 }, { "epoch": 13.8, "eval_loss": Infinity, "eval_runtime": 549.4461, "eval_samples_per_second": 20.513, "eval_steps_per_second": 2.564, "eval_wer": 0.20072701294335182, "step": 79800 }, { "epoch": 13.82, "eval_loss": Infinity, "eval_runtime": 550.7003, "eval_samples_per_second": 20.467, "eval_steps_per_second": 2.559, "eval_wer": 0.20068498907379392, "step": 79900 }, { "epoch": 13.84, "learning_rate": 2.3525455178012292e-05, "loss": 0.0366, "step": 80000 }, { "epoch": 13.84, "eval_loss": Infinity, "eval_runtime": 549.1719, "eval_samples_per_second": 20.524, "eval_steps_per_second": 2.566, "eval_wer": 0.2013363590519415, "step": 80000 }, { "epoch": 13.85, "eval_loss": Infinity, "eval_runtime": 549.0216, "eval_samples_per_second": 20.529, "eval_steps_per_second": 2.566, "eval_wer": 0.2008320726172466, "step": 80100 }, { "epoch": 13.87, "eval_loss": Infinity, "eval_runtime": 549.1895, "eval_samples_per_second": 20.523, "eval_steps_per_second": 2.566, "eval_wer": 0.2003172802151622, "step": 80200 }, { "epoch": 13.89, "eval_loss": Infinity, "eval_runtime": 551.531, "eval_samples_per_second": 20.436, "eval_steps_per_second": 2.555, "eval_wer": 0.1995818624978988, "step": 80300 }, { "epoch": 13.91, "eval_loss": Infinity, "eval_runtime": 551.0755, "eval_samples_per_second": 20.453, "eval_steps_per_second": 2.557, "eval_wer": 0.19938224911749874, "step": 80400 }, { "epoch": 13.92, "learning_rate": 2.1785921373072014e-05, "loss": 0.0368, "step": 80500 }, { "epoch": 13.92, "eval_loss": Infinity, "eval_runtime": 550.0799, "eval_samples_per_second": 20.49, "eval_steps_per_second": 2.561, "eval_wer": 0.20009665489998318, "step": 80500 }, { "epoch": 13.94, "eval_loss": Infinity, "eval_runtime": 548.5676, "eval_samples_per_second": 20.546, "eval_steps_per_second": 2.569, "eval_wer": 0.19951882669356194, "step": 80600 }, { "epoch": 13.96, "eval_loss": Infinity, "eval_runtime": 547.3994, "eval_samples_per_second": 20.59, "eval_steps_per_second": 2.574, "eval_wer": 0.20012817280215162, "step": 80700 }, { "epoch": 13.97, "eval_loss": Infinity, "eval_runtime": 547.7377, "eval_samples_per_second": 20.577, "eval_steps_per_second": 2.572, "eval_wer": 0.19902504622625652, "step": 80800 }, { "epoch": 13.99, "eval_loss": Infinity, "eval_runtime": 547.4485, "eval_samples_per_second": 20.588, "eval_steps_per_second": 2.574, "eval_wer": 0.20012817280215162, "step": 80900 }, { "epoch": 14.01, "learning_rate": 2.0046387568131736e-05, "loss": 0.0362, "step": 81000 }, { "epoch": 14.01, "eval_loss": Infinity, "eval_runtime": 549.1806, "eval_samples_per_second": 20.523, "eval_steps_per_second": 2.566, "eval_wer": 0.19897251638930913, "step": 81000 }, { "epoch": 14.03, "eval_loss": Infinity, "eval_runtime": 550.171, "eval_samples_per_second": 20.486, "eval_steps_per_second": 2.561, "eval_wer": 0.19812153303076147, "step": 81100 }, { "epoch": 14.04, "eval_loss": Infinity, "eval_runtime": 548.9202, "eval_samples_per_second": 20.533, "eval_steps_per_second": 2.567, "eval_wer": 0.19864683140023534, "step": 81200 }, { "epoch": 14.06, "eval_loss": Infinity, "eval_runtime": 549.2666, "eval_samples_per_second": 20.52, "eval_steps_per_second": 2.565, "eval_wer": 0.19794293158514037, "step": 81300 }, { "epoch": 14.08, "eval_loss": Infinity, "eval_runtime": 548.6556, "eval_samples_per_second": 20.543, "eval_steps_per_second": 2.568, "eval_wer": 0.19731257354177173, "step": 81400 }, { "epoch": 14.1, "learning_rate": 1.8306853763191462e-05, "loss": 0.0353, "step": 81500 }, { "epoch": 14.1, "eval_loss": Infinity, "eval_runtime": 548.2556, "eval_samples_per_second": 20.558, "eval_steps_per_second": 2.57, "eval_wer": 0.1979639435199193, "step": 81500 }, { "epoch": 14.11, "eval_loss": Infinity, "eval_runtime": 549.3102, "eval_samples_per_second": 20.518, "eval_steps_per_second": 2.565, "eval_wer": 0.1986573373676248, "step": 81600 }, { "epoch": 14.13, "eval_loss": Infinity, "eval_runtime": 548.0325, "eval_samples_per_second": 20.566, "eval_steps_per_second": 2.571, "eval_wer": 0.1978798957808035, "step": 81700 }, { "epoch": 14.15, "eval_loss": Infinity, "eval_runtime": 547.6151, "eval_samples_per_second": 20.582, "eval_steps_per_second": 2.573, "eval_wer": 0.1972390317700454, "step": 81800 }, { "epoch": 14.16, "eval_loss": Infinity, "eval_runtime": 548.5829, "eval_samples_per_second": 20.546, "eval_steps_per_second": 2.568, "eval_wer": 0.19802697932425617, "step": 81900 }, { "epoch": 14.18, "learning_rate": 1.6567319958251187e-05, "loss": 0.0344, "step": 82000 }, { "epoch": 14.18, "eval_loss": Infinity, "eval_runtime": 548.2811, "eval_samples_per_second": 20.557, "eval_steps_per_second": 2.57, "eval_wer": 0.1977853420742982, "step": 82000 }, { "epoch": 14.2, "eval_loss": Infinity, "eval_runtime": 556.1898, "eval_samples_per_second": 20.265, "eval_steps_per_second": 2.533, "eval_wer": 0.19866784333501428, "step": 82100 }, { "epoch": 14.22, "eval_loss": Infinity, "eval_runtime": 556.5263, "eval_samples_per_second": 20.252, "eval_steps_per_second": 2.532, "eval_wer": 0.1974596570852244, "step": 82200 }, { "epoch": 14.23, "eval_loss": Infinity, "eval_runtime": 549.5075, "eval_samples_per_second": 20.511, "eval_steps_per_second": 2.564, "eval_wer": 0.1975121869221718, "step": 82300 }, { "epoch": 14.25, "eval_loss": Infinity, "eval_runtime": 550.8891, "eval_samples_per_second": 20.46, "eval_steps_per_second": 2.558, "eval_wer": 0.19743864515044546, "step": 82400 }, { "epoch": 14.27, "learning_rate": 1.4827786153310911e-05, "loss": 0.0348, "step": 82500 }, { "epoch": 14.27, "eval_loss": Infinity, "eval_runtime": 550.8558, "eval_samples_per_second": 20.461, "eval_steps_per_second": 2.558, "eval_wer": 0.19743864515044546, "step": 82500 }, { "epoch": 14.29, "eval_loss": Infinity, "eval_runtime": 548.9923, "eval_samples_per_second": 20.53, "eval_steps_per_second": 2.567, "eval_wer": 0.19740712724827703, "step": 82600 }, { "epoch": 14.3, "eval_loss": Infinity, "eval_runtime": 549.7751, "eval_samples_per_second": 20.501, "eval_steps_per_second": 2.563, "eval_wer": 0.19762775256345605, "step": 82700 }, { "epoch": 14.32, "eval_loss": Infinity, "eval_runtime": 549.3637, "eval_samples_per_second": 20.516, "eval_steps_per_second": 2.565, "eval_wer": 0.19734409144394016, "step": 82800 }, { "epoch": 14.34, "eval_loss": Infinity, "eval_runtime": 549.8173, "eval_samples_per_second": 20.5, "eval_steps_per_second": 2.563, "eval_wer": 0.197428139183056, "step": 82900 }, { "epoch": 14.35, "learning_rate": 1.3088252348370636e-05, "loss": 0.0328, "step": 83000 }, { "epoch": 14.35, "eval_loss": Infinity, "eval_runtime": 548.4364, "eval_samples_per_second": 20.551, "eval_steps_per_second": 2.569, "eval_wer": 0.19799546142208774, "step": 83000 }, { "epoch": 14.37, "eval_loss": Infinity, "eval_runtime": 548.2968, "eval_samples_per_second": 20.556, "eval_steps_per_second": 2.57, "eval_wer": 0.1978798957808035, "step": 83100 }, { "epoch": 14.39, "eval_loss": Infinity, "eval_runtime": 548.7906, "eval_samples_per_second": 20.538, "eval_steps_per_second": 2.567, "eval_wer": 0.197428139183056, "step": 83200 }, { "epoch": 14.41, "eval_loss": Infinity, "eval_runtime": 548.8022, "eval_samples_per_second": 20.537, "eval_steps_per_second": 2.567, "eval_wer": 0.19744915111783493, "step": 83300 }, { "epoch": 14.42, "eval_loss": Infinity, "eval_runtime": 548.604, "eval_samples_per_second": 20.545, "eval_steps_per_second": 2.568, "eval_wer": 0.19727054967221383, "step": 83400 }, { "epoch": 14.44, "learning_rate": 1.135219761104024e-05, "loss": 0.0351, "step": 83500 }, { "epoch": 14.44, "eval_loss": Infinity, "eval_runtime": 548.3355, "eval_samples_per_second": 20.555, "eval_steps_per_second": 2.57, "eval_wer": 0.19730206757438226, "step": 83500 }, { "epoch": 14.46, "eval_loss": Infinity, "eval_runtime": 548.7268, "eval_samples_per_second": 20.54, "eval_steps_per_second": 2.568, "eval_wer": 0.1972390317700454, "step": 83600 }, { "epoch": 14.48, "eval_loss": Infinity, "eval_runtime": 548.6096, "eval_samples_per_second": 20.545, "eval_steps_per_second": 2.568, "eval_wer": 0.19758572869389812, "step": 83700 }, { "epoch": 14.49, "eval_loss": Infinity, "eval_runtime": 546.9624, "eval_samples_per_second": 20.607, "eval_steps_per_second": 2.576, "eval_wer": 0.19687132291141368, "step": 83800 }, { "epoch": 14.51, "eval_loss": Infinity, "eval_runtime": 548.7393, "eval_samples_per_second": 20.54, "eval_steps_per_second": 2.568, "eval_wer": 0.19694486468314001, "step": 83900 }, { "epoch": 14.53, "learning_rate": 9.612663806099964e-06, "loss": 0.0329, "step": 84000 }, { "epoch": 14.53, "eval_loss": Infinity, "eval_runtime": 548.6856, "eval_samples_per_second": 20.542, "eval_steps_per_second": 2.568, "eval_wer": 0.1965351319549504, "step": 84000 }, { "epoch": 14.55, "eval_loss": Infinity, "eval_runtime": 560.2236, "eval_samples_per_second": 20.119, "eval_steps_per_second": 2.515, "eval_wer": 0.19655614388972936, "step": 84100 }, { "epoch": 14.56, "eval_loss": Infinity, "eval_runtime": 548.2121, "eval_samples_per_second": 20.56, "eval_steps_per_second": 2.57, "eval_wer": 0.1964090603462767, "step": 84200 }, { "epoch": 14.58, "eval_loss": Infinity, "eval_runtime": 548.7406, "eval_samples_per_second": 20.54, "eval_steps_per_second": 2.568, "eval_wer": 0.19682929904185578, "step": 84300 }, { "epoch": 14.6, "eval_loss": Infinity, "eval_runtime": 549.4063, "eval_samples_per_second": 20.515, "eval_steps_per_second": 2.565, "eval_wer": 0.1963985543788872, "step": 84400 }, { "epoch": 14.61, "learning_rate": 7.876609068769568e-06, "loss": 0.036, "step": 84500 }, { "epoch": 14.61, "eval_loss": Infinity, "eval_runtime": 549.2923, "eval_samples_per_second": 20.519, "eval_steps_per_second": 2.565, "eval_wer": 0.1965456379223399, "step": 84500 }, { "epoch": 14.63, "eval_loss": Infinity, "eval_runtime": 547.7858, "eval_samples_per_second": 20.576, "eval_steps_per_second": 2.572, "eval_wer": 0.19636703647671877, "step": 84600 }, { "epoch": 14.65, "eval_loss": Infinity, "eval_runtime": 548.7123, "eval_samples_per_second": 20.541, "eval_steps_per_second": 2.568, "eval_wer": 0.19675575727012942, "step": 84700 }, { "epoch": 14.67, "eval_loss": Infinity, "eval_runtime": 549.2306, "eval_samples_per_second": 20.521, "eval_steps_per_second": 2.565, "eval_wer": 0.19690284081358211, "step": 84800 }, { "epoch": 14.68, "eval_loss": Infinity, "eval_runtime": 548.8397, "eval_samples_per_second": 20.536, "eval_steps_per_second": 2.567, "eval_wer": 0.19665069759623466, "step": 84900 }, { "epoch": 14.7, "learning_rate": 6.1370752638292925e-06, "loss": 0.0322, "step": 85000 }, { "epoch": 14.7, "eval_loss": Infinity, "eval_runtime": 548.3915, "eval_samples_per_second": 20.553, "eval_steps_per_second": 2.569, "eval_wer": 0.19657715582450833, "step": 85000 }, { "epoch": 14.72, "eval_loss": Infinity, "eval_runtime": 547.5876, "eval_samples_per_second": 20.583, "eval_steps_per_second": 2.573, "eval_wer": 0.19665069759623466, "step": 85100 }, { "epoch": 14.74, "eval_loss": Infinity, "eval_runtime": 548.4879, "eval_samples_per_second": 20.549, "eval_steps_per_second": 2.569, "eval_wer": 0.1965456379223399, "step": 85200 }, { "epoch": 14.75, "eval_loss": Infinity, "eval_runtime": 549.2569, "eval_samples_per_second": 20.52, "eval_steps_per_second": 2.565, "eval_wer": 0.1963985543788872, "step": 85300 }, { "epoch": 14.77, "eval_loss": Infinity, "eval_runtime": 548.644, "eval_samples_per_second": 20.543, "eval_steps_per_second": 2.568, "eval_wer": 0.19644057824844513, "step": 85400 }, { "epoch": 14.79, "learning_rate": 4.397541458889018e-06, "loss": 0.0321, "step": 85500 }, { "epoch": 14.79, "eval_loss": Infinity, "eval_runtime": 547.1252, "eval_samples_per_second": 20.6, "eval_steps_per_second": 2.575, "eval_wer": 0.1963565305093293, "step": 85500 }, { "epoch": 14.8, "eval_loss": Infinity, "eval_runtime": 551.1899, "eval_samples_per_second": 20.448, "eval_steps_per_second": 2.556, "eval_wer": 0.1962094469658766, "step": 85600 }, { "epoch": 14.82, "eval_loss": Infinity, "eval_runtime": 564.4339, "eval_samples_per_second": 19.969, "eval_steps_per_second": 2.496, "eval_wer": 0.19603084552025551, "step": 85700 }, { "epoch": 14.84, "eval_loss": Infinity, "eval_runtime": 555.5114, "eval_samples_per_second": 20.289, "eval_steps_per_second": 2.536, "eval_wer": 0.1959467977811397, "step": 85800 }, { "epoch": 14.86, "eval_loss": Infinity, "eval_runtime": 551.0288, "eval_samples_per_second": 20.454, "eval_steps_per_second": 2.557, "eval_wer": 0.19618843503109767, "step": 85900 }, { "epoch": 14.87, "learning_rate": 2.6580076539487416e-06, "loss": 0.0341, "step": 86000 }, { "epoch": 14.87, "eval_loss": Infinity, "eval_runtime": 552.5092, "eval_samples_per_second": 20.4, "eval_steps_per_second": 2.55, "eval_wer": 0.19611489325937131, "step": 86000 }, { "epoch": 14.89, "eval_loss": Infinity, "eval_runtime": 551.7014, "eval_samples_per_second": 20.43, "eval_steps_per_second": 2.554, "eval_wer": 0.19637754244410827, "step": 86100 }, { "epoch": 14.91, "eval_loss": Infinity, "eval_runtime": 551.3725, "eval_samples_per_second": 20.442, "eval_steps_per_second": 2.555, "eval_wer": 0.19624096486804504, "step": 86200 }, { "epoch": 14.93, "eval_loss": Infinity, "eval_runtime": 551.3971, "eval_samples_per_second": 20.441, "eval_steps_per_second": 2.555, "eval_wer": 0.19617792906370818, "step": 86300 }, { "epoch": 14.94, "eval_loss": Infinity, "eval_runtime": 548.852, "eval_samples_per_second": 20.536, "eval_steps_per_second": 2.567, "eval_wer": 0.19632501260716087, "step": 86400 }, { "epoch": 14.96, "learning_rate": 9.184738490084656e-07, "loss": 0.0338, "step": 86500 }, { "epoch": 14.96, "eval_loss": Infinity, "eval_runtime": 549.3084, "eval_samples_per_second": 20.519, "eval_steps_per_second": 2.565, "eval_wer": 0.19634602454193983, "step": 86500 }, { "epoch": 14.98, "eval_loss": Infinity, "eval_runtime": 548.1703, "eval_samples_per_second": 20.561, "eval_steps_per_second": 2.57, "eval_wer": 0.19627248277021347, "step": 86600 }, { "epoch": 14.99, "eval_loss": Infinity, "eval_runtime": 548.1231, "eval_samples_per_second": 20.563, "eval_steps_per_second": 2.571, "eval_wer": 0.19625147083543454, "step": 86700 }, { "epoch": 15.0, "step": 86730, "total_flos": 1.1589202082196755e+20, "train_loss": 0.15599208657172234, "train_runtime": 535995.9461, "train_samples_per_second": 1.294, "train_steps_per_second": 0.162 } ], "max_steps": 86730, "num_train_epochs": 15, "total_flos": 1.1589202082196755e+20, "trial_name": null, "trial_params": null }