{ "best_metric": 18.48141795311607, "best_model_checkpoint": "whisper-base-nl-3/checkpoint-29000", "epoch": 3.5599857600569598, "global_step": 30000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 4.0000000000000003e-07, "loss": 1.3847, "step": 25 }, { "epoch": 0.0, "learning_rate": 9.000000000000001e-07, "loss": 1.4601, "step": 50 }, { "epoch": 0.0, "learning_rate": 1.4000000000000001e-06, "loss": 1.3556, "step": 75 }, { "epoch": 0.01, "learning_rate": 1.9000000000000002e-06, "loss": 1.1454, "step": 100 }, { "epoch": 0.01, "learning_rate": 2.4000000000000003e-06, "loss": 1.2552, "step": 125 }, { "epoch": 0.01, "learning_rate": 2.9e-06, "loss": 1.1695, "step": 150 }, { "epoch": 0.01, "learning_rate": 3.4000000000000005e-06, "loss": 0.9503, "step": 175 }, { "epoch": 0.01, "learning_rate": 3.900000000000001e-06, "loss": 0.9096, "step": 200 }, { "epoch": 0.01, "learning_rate": 4.4e-06, "loss": 0.8853, "step": 225 }, { "epoch": 0.02, "learning_rate": 4.9000000000000005e-06, "loss": 0.833, "step": 250 }, { "epoch": 0.02, "learning_rate": 5.400000000000001e-06, "loss": 0.8597, "step": 275 }, { "epoch": 0.02, "learning_rate": 5.9e-06, "loss": 0.8199, "step": 300 }, { "epoch": 0.02, "learning_rate": 6.4000000000000006e-06, "loss": 0.7158, "step": 325 }, { "epoch": 0.02, "learning_rate": 6.9e-06, "loss": 0.6896, "step": 350 }, { "epoch": 0.02, "learning_rate": 7.4e-06, "loss": 0.662, "step": 375 }, { "epoch": 0.03, "learning_rate": 7.9e-06, "loss": 0.8284, "step": 400 }, { "epoch": 0.03, "learning_rate": 8.400000000000001e-06, "loss": 0.6544, "step": 425 }, { "epoch": 0.03, "learning_rate": 8.900000000000001e-06, "loss": 0.7486, "step": 450 }, { "epoch": 0.03, "learning_rate": 9.4e-06, "loss": 0.5652, "step": 475 }, { "epoch": 0.03, "learning_rate": 9.9e-06, "loss": 0.6604, "step": 500 }, { "epoch": 0.03, "learning_rate": 9.994202898550725e-06, "loss": 0.7287, "step": 525 }, { "epoch": 0.04, "learning_rate": 9.986956521739132e-06, "loss": 0.6413, "step": 550 }, { "epoch": 0.04, "learning_rate": 9.979710144927537e-06, "loss": 0.6762, "step": 575 }, { "epoch": 0.04, "learning_rate": 9.972463768115943e-06, "loss": 0.6882, "step": 600 }, { "epoch": 0.04, "learning_rate": 9.965217391304348e-06, "loss": 0.7015, "step": 625 }, { "epoch": 0.04, "learning_rate": 9.957971014492755e-06, "loss": 0.6145, "step": 650 }, { "epoch": 0.04, "learning_rate": 9.95072463768116e-06, "loss": 0.6674, "step": 675 }, { "epoch": 0.05, "learning_rate": 9.943478260869565e-06, "loss": 0.5915, "step": 700 }, { "epoch": 0.05, "learning_rate": 9.936231884057972e-06, "loss": 0.6632, "step": 725 }, { "epoch": 0.05, "learning_rate": 9.928985507246378e-06, "loss": 0.6157, "step": 750 }, { "epoch": 0.05, "learning_rate": 9.921739130434783e-06, "loss": 0.7222, "step": 775 }, { "epoch": 0.05, "learning_rate": 9.91449275362319e-06, "loss": 0.6447, "step": 800 }, { "epoch": 0.05, "learning_rate": 9.907246376811595e-06, "loss": 0.6848, "step": 825 }, { "epoch": 0.06, "learning_rate": 9.9e-06, "loss": 0.6391, "step": 850 }, { "epoch": 0.06, "learning_rate": 9.892753623188407e-06, "loss": 0.6543, "step": 875 }, { "epoch": 0.06, "learning_rate": 9.885507246376812e-06, "loss": 0.5579, "step": 900 }, { "epoch": 0.06, "learning_rate": 9.878260869565218e-06, "loss": 0.5699, "step": 925 }, { "epoch": 0.06, "learning_rate": 9.871014492753625e-06, "loss": 0.5404, "step": 950 }, { "epoch": 0.06, "learning_rate": 9.86376811594203e-06, "loss": 0.6237, "step": 975 }, { "epoch": 0.06, "learning_rate": 9.856521739130435e-06, "loss": 0.5761, "step": 1000 }, { "epoch": 0.06, "eval_cer": 10.115352452161936, "eval_loss": 0.5675458908081055, "eval_runtime": 3220.6897, "eval_samples_per_second": 0.771, "eval_steps_per_second": 0.385, "eval_wer": 28.15323041738136, "step": 1000 }, { "epoch": 0.07, "learning_rate": 9.84927536231884e-06, "loss": 0.6175, "step": 1025 }, { "epoch": 0.07, "learning_rate": 9.842028985507247e-06, "loss": 0.6934, "step": 1050 }, { "epoch": 0.07, "learning_rate": 9.834782608695654e-06, "loss": 0.5818, "step": 1075 }, { "epoch": 0.07, "learning_rate": 9.827536231884059e-06, "loss": 0.6175, "step": 1100 }, { "epoch": 0.07, "learning_rate": 9.820289855072465e-06, "loss": 0.4952, "step": 1125 }, { "epoch": 0.07, "learning_rate": 9.81304347826087e-06, "loss": 0.6194, "step": 1150 }, { "epoch": 0.08, "learning_rate": 9.805797101449275e-06, "loss": 0.5897, "step": 1175 }, { "epoch": 0.08, "learning_rate": 9.798550724637682e-06, "loss": 0.5356, "step": 1200 }, { "epoch": 0.08, "learning_rate": 9.791304347826089e-06, "loss": 0.5805, "step": 1225 }, { "epoch": 0.08, "learning_rate": 9.784057971014494e-06, "loss": 0.5446, "step": 1250 }, { "epoch": 0.08, "learning_rate": 9.776811594202899e-06, "loss": 0.6734, "step": 1275 }, { "epoch": 0.08, "learning_rate": 9.769565217391305e-06, "loss": 0.5457, "step": 1300 }, { "epoch": 0.09, "learning_rate": 9.76231884057971e-06, "loss": 0.4686, "step": 1325 }, { "epoch": 0.09, "learning_rate": 9.755072463768117e-06, "loss": 0.5954, "step": 1350 }, { "epoch": 0.09, "learning_rate": 9.747826086956522e-06, "loss": 0.4973, "step": 1375 }, { "epoch": 0.09, "learning_rate": 9.740579710144929e-06, "loss": 0.5727, "step": 1400 }, { "epoch": 0.09, "learning_rate": 9.733333333333334e-06, "loss": 0.5767, "step": 1425 }, { "epoch": 0.09, "learning_rate": 9.726086956521739e-06, "loss": 0.4814, "step": 1450 }, { "epoch": 0.1, "learning_rate": 9.718840579710146e-06, "loss": 0.5544, "step": 1475 }, { "epoch": 0.1, "learning_rate": 9.71159420289855e-06, "loss": 0.5281, "step": 1500 }, { "epoch": 0.1, "learning_rate": 9.704347826086957e-06, "loss": 0.612, "step": 1525 }, { "epoch": 0.1, "learning_rate": 9.697101449275364e-06, "loss": 0.5293, "step": 1550 }, { "epoch": 0.1, "learning_rate": 9.689855072463769e-06, "loss": 0.5881, "step": 1575 }, { "epoch": 0.1, "learning_rate": 9.682608695652174e-06, "loss": 0.5571, "step": 1600 }, { "epoch": 0.11, "learning_rate": 9.67536231884058e-06, "loss": 0.429, "step": 1625 }, { "epoch": 0.11, "learning_rate": 9.668115942028986e-06, "loss": 0.4661, "step": 1650 }, { "epoch": 0.11, "learning_rate": 9.660869565217392e-06, "loss": 0.5181, "step": 1675 }, { "epoch": 0.11, "learning_rate": 9.653623188405797e-06, "loss": 0.5188, "step": 1700 }, { "epoch": 0.11, "learning_rate": 9.646376811594204e-06, "loss": 0.4881, "step": 1725 }, { "epoch": 0.11, "learning_rate": 9.639130434782609e-06, "loss": 0.6319, "step": 1750 }, { "epoch": 0.11, "learning_rate": 9.631884057971014e-06, "loss": 0.6, "step": 1775 }, { "epoch": 0.12, "learning_rate": 9.624637681159421e-06, "loss": 0.5251, "step": 1800 }, { "epoch": 0.12, "learning_rate": 9.617391304347828e-06, "loss": 0.4999, "step": 1825 }, { "epoch": 0.12, "learning_rate": 9.610144927536233e-06, "loss": 0.5612, "step": 1850 }, { "epoch": 0.12, "learning_rate": 9.60289855072464e-06, "loss": 0.456, "step": 1875 }, { "epoch": 0.12, "learning_rate": 9.595652173913044e-06, "loss": 0.5589, "step": 1900 }, { "epoch": 0.12, "learning_rate": 9.58840579710145e-06, "loss": 0.396, "step": 1925 }, { "epoch": 0.13, "learning_rate": 9.581159420289856e-06, "loss": 0.4713, "step": 1950 }, { "epoch": 0.13, "learning_rate": 9.573913043478261e-06, "loss": 0.5178, "step": 1975 }, { "epoch": 0.13, "learning_rate": 9.566666666666668e-06, "loss": 0.48, "step": 2000 }, { "epoch": 0.13, "eval_cer": 9.69108170593733, "eval_loss": 0.5239235162734985, "eval_runtime": 3297.9692, "eval_samples_per_second": 0.753, "eval_steps_per_second": 0.376, "eval_wer": 26.436439870402133, "step": 2000 }, { "epoch": 0.13, "learning_rate": 9.559420289855074e-06, "loss": 0.5154, "step": 2025 }, { "epoch": 0.13, "learning_rate": 9.55217391304348e-06, "loss": 0.5715, "step": 2050 }, { "epoch": 0.13, "learning_rate": 9.545217391304349e-06, "loss": 0.5522, "step": 2075 }, { "epoch": 0.14, "learning_rate": 9.537971014492754e-06, "loss": 0.5205, "step": 2100 }, { "epoch": 0.14, "learning_rate": 9.53072463768116e-06, "loss": 0.4494, "step": 2125 }, { "epoch": 0.14, "learning_rate": 9.523478260869566e-06, "loss": 0.5226, "step": 2150 }, { "epoch": 0.14, "learning_rate": 9.516231884057972e-06, "loss": 0.469, "step": 2175 }, { "epoch": 0.14, "learning_rate": 9.508985507246377e-06, "loss": 0.5067, "step": 2200 }, { "epoch": 0.14, "learning_rate": 9.501739130434784e-06, "loss": 0.5879, "step": 2225 }, { "epoch": 0.15, "learning_rate": 9.494492753623189e-06, "loss": 0.8063, "step": 2250 }, { "epoch": 0.15, "learning_rate": 9.487246376811596e-06, "loss": 0.5067, "step": 2275 }, { "epoch": 0.15, "learning_rate": 9.48e-06, "loss": 0.5124, "step": 2300 }, { "epoch": 0.15, "learning_rate": 9.472753623188406e-06, "loss": 0.4894, "step": 2325 }, { "epoch": 0.15, "learning_rate": 9.465507246376812e-06, "loss": 0.504, "step": 2350 }, { "epoch": 0.15, "learning_rate": 9.458260869565217e-06, "loss": 0.545, "step": 2375 }, { "epoch": 0.16, "learning_rate": 9.451014492753624e-06, "loss": 0.4962, "step": 2400 }, { "epoch": 0.16, "learning_rate": 9.44376811594203e-06, "loss": 0.4774, "step": 2425 }, { "epoch": 0.16, "learning_rate": 9.436521739130436e-06, "loss": 0.5429, "step": 2450 }, { "epoch": 0.16, "learning_rate": 9.42927536231884e-06, "loss": 0.445, "step": 2475 }, { "epoch": 0.16, "learning_rate": 9.422028985507246e-06, "loss": 0.4111, "step": 2500 }, { "epoch": 0.16, "learning_rate": 9.414782608695653e-06, "loss": 0.5188, "step": 2525 }, { "epoch": 0.17, "learning_rate": 9.40753623188406e-06, "loss": 0.4584, "step": 2550 }, { "epoch": 0.17, "learning_rate": 9.400289855072464e-06, "loss": 0.5017, "step": 2575 }, { "epoch": 0.17, "learning_rate": 9.393043478260871e-06, "loss": 0.593, "step": 2600 }, { "epoch": 0.17, "learning_rate": 9.385797101449276e-06, "loss": 0.5195, "step": 2625 }, { "epoch": 0.17, "learning_rate": 9.378550724637681e-06, "loss": 0.5083, "step": 2650 }, { "epoch": 0.17, "learning_rate": 9.371304347826088e-06, "loss": 0.5534, "step": 2675 }, { "epoch": 0.17, "learning_rate": 9.364057971014493e-06, "loss": 0.4893, "step": 2700 }, { "epoch": 0.18, "learning_rate": 9.3568115942029e-06, "loss": 0.4512, "step": 2725 }, { "epoch": 0.18, "learning_rate": 9.349565217391306e-06, "loss": 0.5876, "step": 2750 }, { "epoch": 0.18, "learning_rate": 9.342318840579711e-06, "loss": 0.4597, "step": 2775 }, { "epoch": 0.18, "learning_rate": 9.335072463768116e-06, "loss": 0.3634, "step": 2800 }, { "epoch": 0.18, "learning_rate": 9.327826086956523e-06, "loss": 0.4483, "step": 2825 }, { "epoch": 0.18, "learning_rate": 9.320579710144928e-06, "loss": 0.5484, "step": 2850 }, { "epoch": 0.19, "learning_rate": 9.313333333333335e-06, "loss": 0.4852, "step": 2875 }, { "epoch": 0.19, "learning_rate": 9.306086956521741e-06, "loss": 0.5576, "step": 2900 }, { "epoch": 0.19, "learning_rate": 9.298840579710146e-06, "loss": 0.5107, "step": 2925 }, { "epoch": 0.19, "learning_rate": 9.291594202898551e-06, "loss": 0.5286, "step": 2950 }, { "epoch": 0.19, "learning_rate": 9.284347826086956e-06, "loss": 0.5618, "step": 2975 }, { "epoch": 0.19, "learning_rate": 9.277101449275363e-06, "loss": 0.4094, "step": 3000 }, { "epoch": 0.19, "eval_cer": 9.153180185941267, "eval_loss": 0.49246901273727417, "eval_runtime": 3242.5657, "eval_samples_per_second": 0.765, "eval_steps_per_second": 0.383, "eval_wer": 24.835525061940157, "step": 3000 }, { "epoch": 0.2, "learning_rate": 9.26985507246377e-06, "loss": 0.5152, "step": 3025 }, { "epoch": 0.2, "learning_rate": 9.262608695652175e-06, "loss": 0.5572, "step": 3050 }, { "epoch": 0.2, "learning_rate": 9.255362318840581e-06, "loss": 0.4801, "step": 3075 }, { "epoch": 0.2, "learning_rate": 9.248115942028986e-06, "loss": 0.4005, "step": 3100 }, { "epoch": 0.2, "learning_rate": 9.240869565217391e-06, "loss": 0.4693, "step": 3125 }, { "epoch": 0.2, "learning_rate": 9.233623188405798e-06, "loss": 0.4487, "step": 3150 }, { "epoch": 0.21, "learning_rate": 9.226376811594203e-06, "loss": 0.4477, "step": 3175 }, { "epoch": 0.21, "learning_rate": 9.21913043478261e-06, "loss": 0.4, "step": 3200 }, { "epoch": 0.21, "learning_rate": 9.211884057971015e-06, "loss": 0.4358, "step": 3225 }, { "epoch": 0.21, "learning_rate": 9.204637681159421e-06, "loss": 0.4952, "step": 3250 }, { "epoch": 0.21, "learning_rate": 9.197391304347826e-06, "loss": 0.4526, "step": 3275 }, { "epoch": 0.21, "learning_rate": 9.190144927536233e-06, "loss": 0.3588, "step": 3300 }, { "epoch": 0.22, "learning_rate": 9.182898550724638e-06, "loss": 0.5127, "step": 3325 }, { "epoch": 0.22, "learning_rate": 9.175652173913045e-06, "loss": 0.6166, "step": 3350 }, { "epoch": 0.22, "learning_rate": 9.16840579710145e-06, "loss": 0.5032, "step": 3375 }, { "epoch": 0.22, "learning_rate": 9.161159420289855e-06, "loss": 0.5632, "step": 3400 }, { "epoch": 0.22, "learning_rate": 9.153913043478262e-06, "loss": 0.5268, "step": 3425 }, { "epoch": 0.22, "learning_rate": 9.146666666666667e-06, "loss": 0.4672, "step": 3450 }, { "epoch": 0.23, "learning_rate": 9.139420289855073e-06, "loss": 0.4342, "step": 3475 }, { "epoch": 0.23, "learning_rate": 9.13217391304348e-06, "loss": 0.4504, "step": 3500 }, { "epoch": 0.23, "learning_rate": 9.124927536231885e-06, "loss": 0.4076, "step": 3525 }, { "epoch": 0.23, "learning_rate": 9.11768115942029e-06, "loss": 0.5036, "step": 3550 }, { "epoch": 0.23, "learning_rate": 9.110434782608695e-06, "loss": 0.3835, "step": 3575 }, { "epoch": 0.23, "learning_rate": 9.103188405797102e-06, "loss": 0.3652, "step": 3600 }, { "epoch": 0.23, "learning_rate": 9.095942028985508e-06, "loss": 0.4231, "step": 3625 }, { "epoch": 0.24, "learning_rate": 9.088695652173913e-06, "loss": 0.4644, "step": 3650 }, { "epoch": 0.24, "learning_rate": 9.08144927536232e-06, "loss": 0.5602, "step": 3675 }, { "epoch": 0.24, "learning_rate": 9.074202898550725e-06, "loss": 0.4637, "step": 3700 }, { "epoch": 0.24, "learning_rate": 9.06695652173913e-06, "loss": 0.4324, "step": 3725 }, { "epoch": 0.24, "learning_rate": 9.059710144927537e-06, "loss": 0.446, "step": 3750 }, { "epoch": 0.24, "learning_rate": 9.052463768115944e-06, "loss": 0.5127, "step": 3775 }, { "epoch": 0.25, "learning_rate": 9.045217391304349e-06, "loss": 0.4453, "step": 3800 }, { "epoch": 0.25, "learning_rate": 9.037971014492755e-06, "loss": 0.4382, "step": 3825 }, { "epoch": 0.25, "learning_rate": 9.03072463768116e-06, "loss": 0.5816, "step": 3850 }, { "epoch": 0.25, "learning_rate": 9.023478260869565e-06, "loss": 0.397, "step": 3875 }, { "epoch": 0.25, "learning_rate": 9.016231884057972e-06, "loss": 0.4512, "step": 3900 }, { "epoch": 0.25, "learning_rate": 9.008985507246377e-06, "loss": 0.4541, "step": 3925 }, { "epoch": 0.26, "learning_rate": 9.001739130434784e-06, "loss": 0.3829, "step": 3950 }, { "epoch": 0.26, "learning_rate": 8.99449275362319e-06, "loss": 0.5275, "step": 3975 }, { "epoch": 0.26, "learning_rate": 8.987246376811595e-06, "loss": 0.4792, "step": 4000 }, { "epoch": 0.26, "eval_cer": 8.841433420237099, "eval_loss": 0.47019296884536743, "eval_runtime": 3179.8405, "eval_samples_per_second": 0.781, "eval_steps_per_second": 0.39, "eval_wer": 24.110539355822375, "step": 4000 }, { "epoch": 0.26, "learning_rate": 8.98e-06, "loss": 0.4638, "step": 4025 }, { "epoch": 0.26, "learning_rate": 8.972753623188405e-06, "loss": 0.5326, "step": 4050 }, { "epoch": 0.26, "learning_rate": 8.965507246376812e-06, "loss": 0.4799, "step": 4075 }, { "epoch": 0.27, "learning_rate": 8.958260869565219e-06, "loss": 0.4798, "step": 4100 }, { "epoch": 0.27, "learning_rate": 8.951014492753624e-06, "loss": 0.4938, "step": 4125 }, { "epoch": 0.27, "learning_rate": 8.94376811594203e-06, "loss": 0.4882, "step": 4150 }, { "epoch": 0.27, "learning_rate": 8.936521739130436e-06, "loss": 0.4136, "step": 4175 }, { "epoch": 0.27, "learning_rate": 8.92927536231884e-06, "loss": 0.5116, "step": 4200 }, { "epoch": 0.27, "learning_rate": 8.922028985507247e-06, "loss": 0.5381, "step": 4225 }, { "epoch": 0.28, "learning_rate": 8.914782608695652e-06, "loss": 0.3999, "step": 4250 }, { "epoch": 0.28, "learning_rate": 8.907536231884059e-06, "loss": 0.3925, "step": 4275 }, { "epoch": 0.28, "learning_rate": 8.900289855072464e-06, "loss": 0.469, "step": 4300 }, { "epoch": 0.28, "learning_rate": 8.89304347826087e-06, "loss": 0.4854, "step": 4325 }, { "epoch": 0.28, "learning_rate": 8.885797101449276e-06, "loss": 0.5086, "step": 4350 }, { "epoch": 0.28, "learning_rate": 8.878550724637682e-06, "loss": 0.4679, "step": 4375 }, { "epoch": 0.29, "learning_rate": 8.871594202898552e-06, "loss": 0.5175, "step": 4400 }, { "epoch": 0.29, "learning_rate": 8.864347826086957e-06, "loss": 0.4921, "step": 4425 }, { "epoch": 0.29, "learning_rate": 8.857101449275362e-06, "loss": 0.4375, "step": 4450 }, { "epoch": 0.29, "learning_rate": 8.849855072463769e-06, "loss": 0.6226, "step": 4475 }, { "epoch": 0.29, "learning_rate": 8.842608695652175e-06, "loss": 0.4383, "step": 4500 }, { "epoch": 0.29, "learning_rate": 8.83536231884058e-06, "loss": 0.4799, "step": 4525 }, { "epoch": 0.29, "learning_rate": 8.828115942028987e-06, "loss": 0.4063, "step": 4550 }, { "epoch": 0.3, "learning_rate": 8.820869565217392e-06, "loss": 0.4039, "step": 4575 }, { "epoch": 0.3, "learning_rate": 8.813623188405797e-06, "loss": 0.3688, "step": 4600 }, { "epoch": 0.3, "learning_rate": 8.806376811594204e-06, "loss": 0.4714, "step": 4625 }, { "epoch": 0.3, "learning_rate": 8.799130434782609e-06, "loss": 0.426, "step": 4650 }, { "epoch": 0.3, "learning_rate": 8.791884057971015e-06, "loss": 0.4623, "step": 4675 }, { "epoch": 0.3, "learning_rate": 8.784637681159422e-06, "loss": 0.4223, "step": 4700 }, { "epoch": 0.31, "learning_rate": 8.777391304347827e-06, "loss": 0.504, "step": 4725 }, { "epoch": 0.31, "learning_rate": 8.770144927536232e-06, "loss": 0.4396, "step": 4750 }, { "epoch": 0.31, "learning_rate": 8.762898550724639e-06, "loss": 0.4665, "step": 4775 }, { "epoch": 0.31, "learning_rate": 8.755652173913044e-06, "loss": 0.4356, "step": 4800 }, { "epoch": 0.31, "learning_rate": 8.74840579710145e-06, "loss": 0.4058, "step": 4825 }, { "epoch": 0.31, "learning_rate": 8.741159420289856e-06, "loss": 0.4825, "step": 4850 }, { "epoch": 0.32, "learning_rate": 8.733913043478262e-06, "loss": 0.5461, "step": 4875 }, { "epoch": 0.32, "learning_rate": 8.726666666666667e-06, "loss": 0.4718, "step": 4900 }, { "epoch": 0.32, "learning_rate": 8.719420289855072e-06, "loss": 0.5011, "step": 4925 }, { "epoch": 0.32, "learning_rate": 8.712173913043479e-06, "loss": 0.4281, "step": 4950 }, { "epoch": 0.32, "learning_rate": 8.704927536231886e-06, "loss": 0.5207, "step": 4975 }, { "epoch": 0.32, "learning_rate": 8.69768115942029e-06, "loss": 0.3444, "step": 5000 }, { "epoch": 0.32, "eval_cer": 8.853116237886763, "eval_loss": 0.45443984866142273, "eval_runtime": 3270.5063, "eval_samples_per_second": 0.759, "eval_steps_per_second": 0.379, "eval_wer": 23.901658090337335, "step": 5000 }, { "epoch": 0.33, "learning_rate": 8.690434782608697e-06, "loss": 0.4848, "step": 5025 }, { "epoch": 0.33, "learning_rate": 8.683188405797102e-06, "loss": 0.4012, "step": 5050 }, { "epoch": 0.33, "learning_rate": 8.675942028985507e-06, "loss": 0.3266, "step": 5075 }, { "epoch": 0.33, "learning_rate": 8.668695652173914e-06, "loss": 0.4751, "step": 5100 }, { "epoch": 0.33, "learning_rate": 8.661449275362319e-06, "loss": 0.5552, "step": 5125 }, { "epoch": 0.33, "learning_rate": 8.654202898550726e-06, "loss": 0.4079, "step": 5150 }, { "epoch": 0.34, "learning_rate": 8.64695652173913e-06, "loss": 0.4326, "step": 5175 }, { "epoch": 0.34, "learning_rate": 8.639710144927538e-06, "loss": 0.4591, "step": 5200 }, { "epoch": 0.34, "learning_rate": 8.632463768115943e-06, "loss": 0.3962, "step": 5225 }, { "epoch": 0.34, "learning_rate": 8.625217391304348e-06, "loss": 0.4825, "step": 5250 }, { "epoch": 0.34, "learning_rate": 8.617971014492754e-06, "loss": 0.4377, "step": 5275 }, { "epoch": 0.34, "learning_rate": 8.610724637681161e-06, "loss": 0.437, "step": 5300 }, { "epoch": 0.34, "learning_rate": 8.603478260869566e-06, "loss": 0.3836, "step": 5325 }, { "epoch": 0.35, "learning_rate": 8.596231884057971e-06, "loss": 0.4649, "step": 5350 }, { "epoch": 0.35, "learning_rate": 8.588985507246378e-06, "loss": 0.4631, "step": 5375 }, { "epoch": 0.35, "learning_rate": 8.581739130434783e-06, "loss": 0.5619, "step": 5400 }, { "epoch": 0.35, "learning_rate": 8.57449275362319e-06, "loss": 0.5031, "step": 5425 }, { "epoch": 0.35, "learning_rate": 8.567246376811596e-06, "loss": 0.3797, "step": 5450 }, { "epoch": 0.35, "learning_rate": 8.560000000000001e-06, "loss": 0.4993, "step": 5475 }, { "epoch": 0.36, "learning_rate": 8.552753623188406e-06, "loss": 0.4146, "step": 5500 }, { "epoch": 0.36, "learning_rate": 8.545507246376811e-06, "loss": 0.4524, "step": 5525 }, { "epoch": 0.36, "learning_rate": 8.538260869565218e-06, "loss": 0.4812, "step": 5550 }, { "epoch": 0.36, "learning_rate": 8.531014492753624e-06, "loss": 0.3781, "step": 5575 }, { "epoch": 0.36, "learning_rate": 8.52376811594203e-06, "loss": 0.4343, "step": 5600 }, { "epoch": 0.36, "learning_rate": 8.516521739130436e-06, "loss": 0.4226, "step": 5625 }, { "epoch": 0.37, "learning_rate": 8.509275362318841e-06, "loss": 0.4341, "step": 5650 }, { "epoch": 0.37, "learning_rate": 8.502028985507246e-06, "loss": 0.4008, "step": 5675 }, { "epoch": 0.37, "learning_rate": 8.494782608695653e-06, "loss": 0.4199, "step": 5700 }, { "epoch": 0.37, "learning_rate": 8.487536231884058e-06, "loss": 0.4822, "step": 5725 }, { "epoch": 0.37, "learning_rate": 8.480289855072465e-06, "loss": 0.3857, "step": 5750 }, { "epoch": 0.37, "learning_rate": 8.473043478260871e-06, "loss": 0.5646, "step": 5775 }, { "epoch": 0.38, "learning_rate": 8.465797101449276e-06, "loss": 0.3835, "step": 5800 }, { "epoch": 0.38, "learning_rate": 8.458550724637681e-06, "loss": 0.4856, "step": 5825 }, { "epoch": 0.38, "learning_rate": 8.451304347826088e-06, "loss": 0.4807, "step": 5850 }, { "epoch": 0.38, "learning_rate": 8.444057971014493e-06, "loss": 0.5281, "step": 5875 }, { "epoch": 0.38, "learning_rate": 8.4368115942029e-06, "loss": 0.4234, "step": 5900 }, { "epoch": 0.38, "learning_rate": 8.429565217391305e-06, "loss": 0.6375, "step": 5925 }, { "epoch": 0.39, "learning_rate": 8.422318840579711e-06, "loss": 0.4303, "step": 5950 }, { "epoch": 0.39, "learning_rate": 8.415072463768116e-06, "loss": 0.4196, "step": 5975 }, { "epoch": 0.39, "learning_rate": 8.407826086956521e-06, "loss": 0.3943, "step": 6000 }, { "epoch": 0.39, "eval_cer": 8.360224310098873, "eval_loss": 0.44455686211586, "eval_runtime": 3263.9495, "eval_samples_per_second": 0.76, "eval_steps_per_second": 0.38, "eval_wer": 22.735277301315037, "step": 6000 }, { "epoch": 0.39, "learning_rate": 8.400579710144928e-06, "loss": 0.4164, "step": 6025 }, { "epoch": 0.39, "learning_rate": 8.393333333333335e-06, "loss": 0.4818, "step": 6050 }, { "epoch": 0.39, "learning_rate": 8.38608695652174e-06, "loss": 0.5536, "step": 6075 }, { "epoch": 0.4, "learning_rate": 8.378840579710147e-06, "loss": 0.4731, "step": 6100 }, { "epoch": 0.4, "learning_rate": 8.371594202898552e-06, "loss": 0.4081, "step": 6125 }, { "epoch": 0.4, "learning_rate": 8.364347826086957e-06, "loss": 0.3741, "step": 6150 }, { "epoch": 0.4, "learning_rate": 8.357101449275363e-06, "loss": 0.4173, "step": 6175 }, { "epoch": 0.4, "learning_rate": 8.349855072463768e-06, "loss": 0.4954, "step": 6200 }, { "epoch": 0.4, "learning_rate": 8.342608695652175e-06, "loss": 0.461, "step": 6225 }, { "epoch": 0.4, "learning_rate": 8.33536231884058e-06, "loss": 0.4501, "step": 6250 }, { "epoch": 0.41, "learning_rate": 8.328115942028987e-06, "loss": 0.3652, "step": 6275 }, { "epoch": 0.41, "learning_rate": 8.320869565217392e-06, "loss": 0.4046, "step": 6300 }, { "epoch": 0.41, "learning_rate": 8.313623188405798e-06, "loss": 0.4184, "step": 6325 }, { "epoch": 0.41, "learning_rate": 8.306376811594203e-06, "loss": 0.4287, "step": 6350 }, { "epoch": 0.41, "learning_rate": 8.29913043478261e-06, "loss": 0.3938, "step": 6375 }, { "epoch": 0.41, "learning_rate": 8.291884057971015e-06, "loss": 0.4758, "step": 6400 }, { "epoch": 0.42, "learning_rate": 8.28463768115942e-06, "loss": 0.4716, "step": 6425 }, { "epoch": 0.42, "learning_rate": 8.277391304347827e-06, "loss": 0.3819, "step": 6450 }, { "epoch": 0.42, "learning_rate": 8.270144927536232e-06, "loss": 0.3889, "step": 6475 }, { "epoch": 0.42, "learning_rate": 8.262898550724639e-06, "loss": 0.4659, "step": 6500 }, { "epoch": 0.42, "learning_rate": 8.255652173913045e-06, "loss": 0.3274, "step": 6525 }, { "epoch": 0.42, "learning_rate": 8.24840579710145e-06, "loss": 0.4144, "step": 6550 }, { "epoch": 0.43, "learning_rate": 8.241159420289855e-06, "loss": 0.3875, "step": 6575 }, { "epoch": 0.43, "learning_rate": 8.23391304347826e-06, "loss": 0.452, "step": 6600 }, { "epoch": 0.43, "learning_rate": 8.226666666666667e-06, "loss": 0.4747, "step": 6625 }, { "epoch": 0.43, "learning_rate": 8.219420289855074e-06, "loss": 0.4448, "step": 6650 }, { "epoch": 0.43, "learning_rate": 8.212173913043479e-06, "loss": 0.5215, "step": 6675 }, { "epoch": 0.43, "learning_rate": 8.204927536231885e-06, "loss": 0.4261, "step": 6700 }, { "epoch": 0.44, "learning_rate": 8.19768115942029e-06, "loss": 0.4482, "step": 6725 }, { "epoch": 0.44, "learning_rate": 8.190434782608695e-06, "loss": 0.39, "step": 6750 }, { "epoch": 0.44, "learning_rate": 8.183188405797102e-06, "loss": 0.6096, "step": 6775 }, { "epoch": 0.44, "learning_rate": 8.175942028985507e-06, "loss": 0.3912, "step": 6800 }, { "epoch": 0.44, "learning_rate": 8.168695652173914e-06, "loss": 0.3141, "step": 6825 }, { "epoch": 0.44, "learning_rate": 8.16144927536232e-06, "loss": 0.3593, "step": 6850 }, { "epoch": 0.45, "learning_rate": 8.154202898550725e-06, "loss": 0.4331, "step": 6875 }, { "epoch": 0.45, "learning_rate": 8.14695652173913e-06, "loss": 0.4574, "step": 6900 }, { "epoch": 0.45, "learning_rate": 8.139710144927537e-06, "loss": 0.3546, "step": 6925 }, { "epoch": 0.45, "learning_rate": 8.132463768115942e-06, "loss": 0.3894, "step": 6950 }, { "epoch": 0.45, "learning_rate": 8.125217391304349e-06, "loss": 0.393, "step": 6975 }, { "epoch": 0.45, "learning_rate": 8.117971014492756e-06, "loss": 0.4925, "step": 7000 }, { "epoch": 0.45, "eval_cer": 8.3723990358601, "eval_loss": 0.4348393380641937, "eval_runtime": 3254.2457, "eval_samples_per_second": 0.763, "eval_steps_per_second": 0.381, "eval_wer": 22.178768820278254, "step": 7000 }, { "epoch": 0.46, "learning_rate": 8.11072463768116e-06, "loss": 0.3986, "step": 7025 }, { "epoch": 0.46, "learning_rate": 8.103478260869566e-06, "loss": 0.3943, "step": 7050 }, { "epoch": 0.46, "learning_rate": 8.09623188405797e-06, "loss": 0.4803, "step": 7075 }, { "epoch": 0.46, "learning_rate": 8.088985507246377e-06, "loss": 0.4128, "step": 7100 }, { "epoch": 0.46, "learning_rate": 8.081739130434784e-06, "loss": 0.5511, "step": 7125 }, { "epoch": 0.46, "learning_rate": 8.074492753623189e-06, "loss": 0.4377, "step": 7150 }, { "epoch": 0.46, "learning_rate": 8.067246376811596e-06, "loss": 0.453, "step": 7175 }, { "epoch": 0.47, "learning_rate": 8.06e-06, "loss": 0.4019, "step": 7200 }, { "epoch": 0.47, "learning_rate": 8.052753623188406e-06, "loss": 0.4934, "step": 7225 }, { "epoch": 0.47, "learning_rate": 8.045507246376812e-06, "loss": 0.3873, "step": 7250 }, { "epoch": 0.47, "learning_rate": 8.038260869565217e-06, "loss": 0.389, "step": 7275 }, { "epoch": 0.47, "learning_rate": 8.031014492753624e-06, "loss": 0.4086, "step": 7300 }, { "epoch": 0.47, "learning_rate": 8.02376811594203e-06, "loss": 0.3844, "step": 7325 }, { "epoch": 0.48, "learning_rate": 8.016521739130436e-06, "loss": 0.4577, "step": 7350 }, { "epoch": 0.48, "learning_rate": 8.009275362318841e-06, "loss": 0.383, "step": 7375 }, { "epoch": 0.48, "learning_rate": 8.002028985507248e-06, "loss": 0.5191, "step": 7400 }, { "epoch": 0.48, "learning_rate": 7.994782608695653e-06, "loss": 0.3293, "step": 7425 }, { "epoch": 0.48, "learning_rate": 7.98753623188406e-06, "loss": 0.4246, "step": 7450 }, { "epoch": 0.48, "learning_rate": 7.980289855072464e-06, "loss": 0.3811, "step": 7475 }, { "epoch": 0.49, "learning_rate": 7.97304347826087e-06, "loss": 0.3891, "step": 7500 }, { "epoch": 0.49, "learning_rate": 7.965797101449276e-06, "loss": 0.4367, "step": 7525 }, { "epoch": 0.49, "learning_rate": 7.958550724637681e-06, "loss": 0.4793, "step": 7550 }, { "epoch": 0.49, "learning_rate": 7.951304347826088e-06, "loss": 0.3993, "step": 7575 }, { "epoch": 0.49, "learning_rate": 7.944347826086957e-06, "loss": 0.3095, "step": 7600 }, { "epoch": 0.49, "learning_rate": 7.937101449275362e-06, "loss": 0.4002, "step": 7625 }, { "epoch": 0.5, "learning_rate": 7.929855072463769e-06, "loss": 0.4037, "step": 7650 }, { "epoch": 0.5, "learning_rate": 7.922608695652174e-06, "loss": 0.3694, "step": 7675 }, { "epoch": 0.5, "learning_rate": 7.91536231884058e-06, "loss": 0.3969, "step": 7700 }, { "epoch": 0.5, "learning_rate": 7.908115942028987e-06, "loss": 0.4404, "step": 7725 }, { "epoch": 0.5, "learning_rate": 7.900869565217392e-06, "loss": 0.4489, "step": 7750 }, { "epoch": 0.5, "learning_rate": 7.893623188405797e-06, "loss": 0.3542, "step": 7775 }, { "epoch": 0.51, "learning_rate": 7.886376811594204e-06, "loss": 0.4793, "step": 7800 }, { "epoch": 0.51, "learning_rate": 7.879130434782609e-06, "loss": 0.3876, "step": 7825 }, { "epoch": 0.51, "learning_rate": 7.871884057971016e-06, "loss": 0.3983, "step": 7850 }, { "epoch": 0.51, "learning_rate": 7.86463768115942e-06, "loss": 0.5017, "step": 7875 }, { "epoch": 0.51, "learning_rate": 7.857391304347827e-06, "loss": 0.3704, "step": 7900 }, { "epoch": 0.51, "learning_rate": 7.850144927536232e-06, "loss": 0.4443, "step": 7925 }, { "epoch": 0.51, "learning_rate": 7.842898550724637e-06, "loss": 0.3535, "step": 7950 }, { "epoch": 0.52, "learning_rate": 7.835652173913044e-06, "loss": 0.4255, "step": 7975 }, { "epoch": 0.52, "learning_rate": 7.828405797101451e-06, "loss": 0.4455, "step": 8000 }, { "epoch": 0.52, "eval_cer": 8.29885877318117, "eval_loss": 0.42695876955986023, "eval_runtime": 3202.8428, "eval_samples_per_second": 0.775, "eval_steps_per_second": 0.387, "eval_wer": 21.754907566228322, "step": 8000 }, { "epoch": 0.52, "learning_rate": 7.821159420289856e-06, "loss": 0.5201, "step": 8025 }, { "epoch": 0.52, "learning_rate": 7.813913043478263e-06, "loss": 0.4287, "step": 8050 }, { "epoch": 0.52, "learning_rate": 7.806666666666668e-06, "loss": 0.3597, "step": 8075 }, { "epoch": 0.52, "learning_rate": 7.799420289855073e-06, "loss": 0.2911, "step": 8100 }, { "epoch": 0.53, "learning_rate": 7.79217391304348e-06, "loss": 0.4192, "step": 8125 }, { "epoch": 0.53, "learning_rate": 7.784927536231884e-06, "loss": 0.328, "step": 8150 }, { "epoch": 0.53, "learning_rate": 7.777681159420291e-06, "loss": 0.4364, "step": 8175 }, { "epoch": 0.53, "learning_rate": 7.770434782608696e-06, "loss": 0.2877, "step": 8200 }, { "epoch": 0.53, "learning_rate": 7.763188405797101e-06, "loss": 0.3641, "step": 8225 }, { "epoch": 0.53, "learning_rate": 7.755942028985508e-06, "loss": 0.3338, "step": 8250 }, { "epoch": 0.54, "learning_rate": 7.748695652173913e-06, "loss": 0.3425, "step": 8275 }, { "epoch": 0.54, "learning_rate": 7.74144927536232e-06, "loss": 0.3633, "step": 8300 }, { "epoch": 0.54, "learning_rate": 7.734202898550726e-06, "loss": 0.4027, "step": 8325 }, { "epoch": 0.54, "learning_rate": 7.726956521739131e-06, "loss": 0.4075, "step": 8350 }, { "epoch": 0.54, "learning_rate": 7.719710144927536e-06, "loss": 0.4272, "step": 8375 }, { "epoch": 0.54, "learning_rate": 7.712463768115943e-06, "loss": 0.4463, "step": 8400 }, { "epoch": 0.55, "learning_rate": 7.705217391304348e-06, "loss": 0.4225, "step": 8425 }, { "epoch": 0.55, "learning_rate": 7.697971014492755e-06, "loss": 0.4155, "step": 8450 }, { "epoch": 0.55, "learning_rate": 7.69072463768116e-06, "loss": 0.3319, "step": 8475 }, { "epoch": 0.55, "learning_rate": 7.683478260869566e-06, "loss": 0.3675, "step": 8500 }, { "epoch": 0.55, "learning_rate": 7.676231884057971e-06, "loss": 0.4573, "step": 8525 }, { "epoch": 0.55, "learning_rate": 7.668985507246376e-06, "loss": 0.3742, "step": 8550 }, { "epoch": 0.56, "learning_rate": 7.661739130434783e-06, "loss": 0.4487, "step": 8575 }, { "epoch": 0.56, "learning_rate": 7.65449275362319e-06, "loss": 0.3993, "step": 8600 }, { "epoch": 0.56, "learning_rate": 7.647246376811595e-06, "loss": 0.3999, "step": 8625 }, { "epoch": 0.56, "learning_rate": 7.640000000000001e-06, "loss": 0.4322, "step": 8650 }, { "epoch": 0.56, "learning_rate": 7.632753623188406e-06, "loss": 0.2906, "step": 8675 }, { "epoch": 0.56, "learning_rate": 7.625507246376812e-06, "loss": 0.41, "step": 8700 }, { "epoch": 0.57, "learning_rate": 7.618260869565218e-06, "loss": 0.2934, "step": 8725 }, { "epoch": 0.57, "learning_rate": 7.611014492753623e-06, "loss": 0.3668, "step": 8750 }, { "epoch": 0.57, "learning_rate": 7.60376811594203e-06, "loss": 0.3826, "step": 8775 }, { "epoch": 0.57, "learning_rate": 7.596521739130436e-06, "loss": 0.4043, "step": 8800 }, { "epoch": 0.57, "learning_rate": 7.589275362318841e-06, "loss": 0.6248, "step": 8825 }, { "epoch": 0.57, "learning_rate": 7.582028985507247e-06, "loss": 0.4668, "step": 8850 }, { "epoch": 0.57, "learning_rate": 7.574782608695653e-06, "loss": 0.4407, "step": 8875 }, { "epoch": 0.58, "learning_rate": 7.567536231884058e-06, "loss": 0.3811, "step": 8900 }, { "epoch": 0.58, "learning_rate": 7.560289855072465e-06, "loss": 0.4717, "step": 8925 }, { "epoch": 0.58, "learning_rate": 7.55304347826087e-06, "loss": 0.3531, "step": 8950 }, { "epoch": 0.58, "learning_rate": 7.545797101449276e-06, "loss": 0.4022, "step": 8975 }, { "epoch": 0.58, "learning_rate": 7.5385507246376825e-06, "loss": 0.3987, "step": 9000 }, { "epoch": 0.58, "eval_cer": 7.9417334841851535, "eval_loss": 0.41387349367141724, "eval_runtime": 3295.4388, "eval_samples_per_second": 0.753, "eval_steps_per_second": 0.377, "eval_wer": 20.842386125404992, "step": 9000 }, { "epoch": 0.58, "learning_rate": 7.5313043478260875e-06, "loss": 0.2728, "step": 9025 }, { "epoch": 0.59, "learning_rate": 7.524057971014493e-06, "loss": 0.5125, "step": 9050 }, { "epoch": 0.59, "learning_rate": 7.516811594202899e-06, "loss": 0.3452, "step": 9075 }, { "epoch": 0.59, "learning_rate": 7.509565217391305e-06, "loss": 0.3387, "step": 9100 }, { "epoch": 0.59, "learning_rate": 7.502318840579711e-06, "loss": 0.5818, "step": 9125 }, { "epoch": 0.59, "learning_rate": 7.495072463768116e-06, "loss": 0.3494, "step": 9150 }, { "epoch": 0.59, "learning_rate": 7.487826086956523e-06, "loss": 0.2902, "step": 9175 }, { "epoch": 0.6, "learning_rate": 7.4805797101449285e-06, "loss": 0.3691, "step": 9200 }, { "epoch": 0.6, "learning_rate": 7.4733333333333335e-06, "loss": 0.3344, "step": 9225 }, { "epoch": 0.6, "learning_rate": 7.466086956521739e-06, "loss": 0.3612, "step": 9250 }, { "epoch": 0.6, "learning_rate": 7.458840579710146e-06, "loss": 0.4311, "step": 9275 }, { "epoch": 0.6, "learning_rate": 7.451594202898551e-06, "loss": 0.4298, "step": 9300 }, { "epoch": 0.6, "learning_rate": 7.444347826086957e-06, "loss": 0.3657, "step": 9325 }, { "epoch": 0.61, "learning_rate": 7.437101449275363e-06, "loss": 0.4382, "step": 9350 }, { "epoch": 0.61, "learning_rate": 7.429855072463769e-06, "loss": 0.3775, "step": 9375 }, { "epoch": 0.61, "learning_rate": 7.4226086956521745e-06, "loss": 0.3566, "step": 9400 }, { "epoch": 0.61, "learning_rate": 7.4153623188405795e-06, "loss": 0.3423, "step": 9425 }, { "epoch": 0.61, "learning_rate": 7.408115942028986e-06, "loss": 0.4855, "step": 9450 }, { "epoch": 0.61, "learning_rate": 7.400869565217392e-06, "loss": 0.3648, "step": 9475 }, { "epoch": 0.62, "learning_rate": 7.393623188405797e-06, "loss": 0.3294, "step": 9500 }, { "epoch": 0.62, "learning_rate": 7.386376811594204e-06, "loss": 0.3991, "step": 9525 }, { "epoch": 0.62, "learning_rate": 7.37913043478261e-06, "loss": 0.347, "step": 9550 }, { "epoch": 0.62, "learning_rate": 7.371884057971015e-06, "loss": 0.4011, "step": 9575 }, { "epoch": 0.62, "learning_rate": 7.364637681159421e-06, "loss": 0.3433, "step": 9600 }, { "epoch": 0.62, "learning_rate": 7.357391304347826e-06, "loss": 0.4642, "step": 9625 }, { "epoch": 0.63, "learning_rate": 7.350144927536232e-06, "loss": 0.3897, "step": 9650 }, { "epoch": 0.63, "learning_rate": 7.342898550724639e-06, "loss": 0.4562, "step": 9675 }, { "epoch": 0.63, "learning_rate": 7.335652173913044e-06, "loss": 0.4942, "step": 9700 }, { "epoch": 0.63, "learning_rate": 7.32840579710145e-06, "loss": 0.3497, "step": 9725 }, { "epoch": 0.63, "learning_rate": 7.3211594202898564e-06, "loss": 0.3713, "step": 9750 }, { "epoch": 0.63, "learning_rate": 7.3139130434782614e-06, "loss": 0.3558, "step": 9775 }, { "epoch": 0.63, "learning_rate": 7.306666666666667e-06, "loss": 0.4417, "step": 9800 }, { "epoch": 0.64, "learning_rate": 7.299420289855072e-06, "loss": 0.4752, "step": 9825 }, { "epoch": 0.64, "learning_rate": 7.292173913043479e-06, "loss": 0.3515, "step": 9850 }, { "epoch": 0.64, "learning_rate": 7.284927536231885e-06, "loss": 0.4731, "step": 9875 }, { "epoch": 0.64, "learning_rate": 7.27768115942029e-06, "loss": 0.3111, "step": 9900 }, { "epoch": 0.64, "learning_rate": 7.2704347826086966e-06, "loss": 0.3776, "step": 9925 }, { "epoch": 0.64, "learning_rate": 7.263188405797102e-06, "loss": 0.4209, "step": 9950 }, { "epoch": 0.65, "learning_rate": 7.2559420289855074e-06, "loss": 0.3707, "step": 9975 }, { "epoch": 0.65, "learning_rate": 7.248695652173914e-06, "loss": 0.3373, "step": 10000 }, { "epoch": 0.65, "eval_cer": 7.887131683801465, "eval_loss": 0.4116414785385132, "eval_runtime": 3350.806, "eval_samples_per_second": 0.741, "eval_steps_per_second": 0.37, "eval_wer": 21.214408233276156, "step": 10000 }, { "epoch": 0.65, "learning_rate": 7.241449275362319e-06, "loss": 0.3843, "step": 10025 }, { "epoch": 0.65, "learning_rate": 7.234202898550725e-06, "loss": 0.3891, "step": 10050 }, { "epoch": 0.65, "learning_rate": 7.226956521739132e-06, "loss": 0.4058, "step": 10075 }, { "epoch": 0.65, "learning_rate": 7.219710144927537e-06, "loss": 0.3908, "step": 10100 }, { "epoch": 0.66, "learning_rate": 7.2124637681159426e-06, "loss": 0.384, "step": 10125 }, { "epoch": 0.66, "learning_rate": 7.205217391304348e-06, "loss": 0.4804, "step": 10150 }, { "epoch": 0.66, "learning_rate": 7.197971014492754e-06, "loss": 0.2675, "step": 10175 }, { "epoch": 0.66, "learning_rate": 7.19072463768116e-06, "loss": 0.4003, "step": 10200 }, { "epoch": 0.66, "learning_rate": 7.183478260869566e-06, "loss": 0.4716, "step": 10225 }, { "epoch": 0.66, "learning_rate": 7.176231884057972e-06, "loss": 0.3955, "step": 10250 }, { "epoch": 0.67, "learning_rate": 7.168985507246378e-06, "loss": 0.4133, "step": 10275 }, { "epoch": 0.67, "learning_rate": 7.161739130434783e-06, "loss": 0.454, "step": 10300 }, { "epoch": 0.67, "learning_rate": 7.1544927536231885e-06, "loss": 0.4465, "step": 10325 }, { "epoch": 0.67, "learning_rate": 7.147246376811595e-06, "loss": 0.3997, "step": 10350 }, { "epoch": 0.67, "learning_rate": 7.14e-06, "loss": 0.43, "step": 10375 }, { "epoch": 0.67, "learning_rate": 7.132753623188406e-06, "loss": 0.373, "step": 10400 }, { "epoch": 0.68, "learning_rate": 7.125507246376813e-06, "loss": 0.4268, "step": 10425 }, { "epoch": 0.68, "learning_rate": 7.118260869565218e-06, "loss": 0.331, "step": 10450 }, { "epoch": 0.68, "learning_rate": 7.111014492753624e-06, "loss": 0.4018, "step": 10475 }, { "epoch": 0.68, "learning_rate": 7.103768115942029e-06, "loss": 0.3489, "step": 10500 }, { "epoch": 0.68, "learning_rate": 7.096521739130435e-06, "loss": 0.3914, "step": 10525 }, { "epoch": 0.68, "learning_rate": 7.089275362318841e-06, "loss": 0.3368, "step": 10550 }, { "epoch": 0.68, "learning_rate": 7.082028985507246e-06, "loss": 0.3999, "step": 10575 }, { "epoch": 0.69, "learning_rate": 7.074782608695653e-06, "loss": 0.334, "step": 10600 }, { "epoch": 0.69, "learning_rate": 7.067536231884059e-06, "loss": 0.4635, "step": 10625 }, { "epoch": 0.69, "learning_rate": 7.060289855072464e-06, "loss": 0.475, "step": 10650 }, { "epoch": 0.69, "learning_rate": 7.0530434782608705e-06, "loss": 0.3621, "step": 10675 }, { "epoch": 0.69, "learning_rate": 7.0457971014492755e-06, "loss": 0.4164, "step": 10700 }, { "epoch": 0.69, "learning_rate": 7.038550724637681e-06, "loss": 0.3648, "step": 10725 }, { "epoch": 0.7, "learning_rate": 7.031304347826088e-06, "loss": 0.4358, "step": 10750 }, { "epoch": 0.7, "learning_rate": 7.024057971014493e-06, "loss": 0.3316, "step": 10775 }, { "epoch": 0.7, "learning_rate": 7.016811594202899e-06, "loss": 0.4052, "step": 10800 }, { "epoch": 0.7, "learning_rate": 7.009565217391306e-06, "loss": 0.4474, "step": 10825 }, { "epoch": 0.7, "learning_rate": 7.002318840579711e-06, "loss": 0.339, "step": 10850 }, { "epoch": 0.7, "learning_rate": 6.9950724637681165e-06, "loss": 0.3653, "step": 10875 }, { "epoch": 0.71, "learning_rate": 6.9878260869565215e-06, "loss": 0.3337, "step": 10900 }, { "epoch": 0.71, "learning_rate": 6.980579710144928e-06, "loss": 0.3516, "step": 10925 }, { "epoch": 0.71, "learning_rate": 6.973333333333334e-06, "loss": 0.3092, "step": 10950 }, { "epoch": 0.71, "learning_rate": 6.966086956521739e-06, "loss": 0.4312, "step": 10975 }, { "epoch": 0.71, "learning_rate": 6.958840579710146e-06, "loss": 0.3808, "step": 11000 }, { "epoch": 0.71, "eval_cer": 7.6264203846721434, "eval_loss": 0.4016057252883911, "eval_runtime": 3251.7215, "eval_samples_per_second": 0.763, "eval_steps_per_second": 0.382, "eval_wer": 20.509243377167905, "step": 11000 }, { "epoch": 0.71, "learning_rate": 6.951594202898552e-06, "loss": 0.6109, "step": 11025 }, { "epoch": 0.72, "learning_rate": 6.944347826086957e-06, "loss": 0.4322, "step": 11050 }, { "epoch": 0.72, "learning_rate": 6.937101449275363e-06, "loss": 0.318, "step": 11075 }, { "epoch": 0.72, "learning_rate": 6.929855072463769e-06, "loss": 0.3855, "step": 11100 }, { "epoch": 0.72, "learning_rate": 6.922608695652174e-06, "loss": 0.3817, "step": 11125 }, { "epoch": 0.72, "learning_rate": 6.915362318840581e-06, "loss": 0.384, "step": 11150 }, { "epoch": 0.72, "learning_rate": 6.908115942028986e-06, "loss": 0.3451, "step": 11175 }, { "epoch": 0.73, "learning_rate": 6.900869565217392e-06, "loss": 0.3518, "step": 11200 }, { "epoch": 0.73, "learning_rate": 6.8936231884057984e-06, "loss": 0.4567, "step": 11225 }, { "epoch": 0.73, "learning_rate": 6.886666666666667e-06, "loss": 0.3848, "step": 11250 }, { "epoch": 0.73, "learning_rate": 6.879420289855073e-06, "loss": 0.4563, "step": 11275 }, { "epoch": 0.73, "learning_rate": 6.872173913043478e-06, "loss": 0.3633, "step": 11300 }, { "epoch": 0.73, "learning_rate": 6.864927536231885e-06, "loss": 0.425, "step": 11325 }, { "epoch": 0.74, "learning_rate": 6.8576811594202905e-06, "loss": 0.3508, "step": 11350 }, { "epoch": 0.74, "learning_rate": 6.8504347826086955e-06, "loss": 0.3351, "step": 11375 }, { "epoch": 0.74, "learning_rate": 6.843188405797102e-06, "loss": 0.4659, "step": 11400 }, { "epoch": 0.74, "learning_rate": 6.835942028985508e-06, "loss": 0.346, "step": 11425 }, { "epoch": 0.74, "learning_rate": 6.828695652173913e-06, "loss": 0.3896, "step": 11450 }, { "epoch": 0.74, "learning_rate": 6.82144927536232e-06, "loss": 0.4153, "step": 11475 }, { "epoch": 0.74, "learning_rate": 6.814202898550725e-06, "loss": 0.3759, "step": 11500 }, { "epoch": 0.75, "learning_rate": 6.806956521739131e-06, "loss": 0.3328, "step": 11525 }, { "epoch": 0.75, "learning_rate": 6.799710144927537e-06, "loss": 0.5639, "step": 11550 }, { "epoch": 0.75, "learning_rate": 6.792463768115942e-06, "loss": 0.3775, "step": 11575 }, { "epoch": 0.75, "learning_rate": 6.785217391304348e-06, "loss": 0.4081, "step": 11600 }, { "epoch": 0.75, "learning_rate": 6.777971014492755e-06, "loss": 0.4266, "step": 11625 }, { "epoch": 0.75, "learning_rate": 6.77072463768116e-06, "loss": 0.3683, "step": 11650 }, { "epoch": 0.76, "learning_rate": 6.763478260869566e-06, "loss": 0.4148, "step": 11675 }, { "epoch": 0.76, "learning_rate": 6.756231884057971e-06, "loss": 0.3413, "step": 11700 }, { "epoch": 0.76, "learning_rate": 6.7489855072463775e-06, "loss": 0.3954, "step": 11725 }, { "epoch": 0.76, "learning_rate": 6.741739130434783e-06, "loss": 0.3807, "step": 11750 }, { "epoch": 0.76, "learning_rate": 6.734492753623188e-06, "loss": 0.3475, "step": 11775 }, { "epoch": 0.76, "learning_rate": 6.727246376811595e-06, "loss": 0.3428, "step": 11800 }, { "epoch": 0.77, "learning_rate": 6.720000000000001e-06, "loss": 0.3614, "step": 11825 }, { "epoch": 0.77, "learning_rate": 6.712753623188406e-06, "loss": 0.3261, "step": 11850 }, { "epoch": 0.77, "learning_rate": 6.705507246376813e-06, "loss": 0.463, "step": 11875 }, { "epoch": 0.77, "learning_rate": 6.6982608695652184e-06, "loss": 0.3045, "step": 11900 }, { "epoch": 0.77, "learning_rate": 6.6910144927536235e-06, "loss": 0.3677, "step": 11925 }, { "epoch": 0.77, "learning_rate": 6.68376811594203e-06, "loss": 0.3405, "step": 11950 }, { "epoch": 0.78, "learning_rate": 6.676521739130435e-06, "loss": 0.3467, "step": 11975 }, { "epoch": 0.78, "learning_rate": 6.669275362318841e-06, "loss": 0.4214, "step": 12000 }, { "epoch": 0.78, "eval_cer": 7.4152688277829695, "eval_loss": 0.39488446712493896, "eval_runtime": 3259.8037, "eval_samples_per_second": 0.761, "eval_steps_per_second": 0.381, "eval_wer": 20.093767867352774, "step": 12000 }, { "epoch": 0.78, "learning_rate": 6.662028985507248e-06, "loss": 0.3608, "step": 12025 }, { "epoch": 0.78, "learning_rate": 6.654782608695653e-06, "loss": 0.3147, "step": 12050 }, { "epoch": 0.78, "learning_rate": 6.647536231884059e-06, "loss": 0.2764, "step": 12075 }, { "epoch": 0.78, "learning_rate": 6.6402898550724644e-06, "loss": 0.3447, "step": 12100 }, { "epoch": 0.79, "learning_rate": 6.63304347826087e-06, "loss": 0.3727, "step": 12125 }, { "epoch": 0.79, "learning_rate": 6.625797101449276e-06, "loss": 0.4042, "step": 12150 }, { "epoch": 0.79, "learning_rate": 6.618550724637681e-06, "loss": 0.3758, "step": 12175 }, { "epoch": 0.79, "learning_rate": 6.611304347826088e-06, "loss": 0.3582, "step": 12200 }, { "epoch": 0.79, "learning_rate": 6.604057971014494e-06, "loss": 0.3571, "step": 12225 }, { "epoch": 0.79, "learning_rate": 6.596811594202899e-06, "loss": 0.3676, "step": 12250 }, { "epoch": 0.8, "learning_rate": 6.5895652173913046e-06, "loss": 0.3224, "step": 12275 }, { "epoch": 0.8, "learning_rate": 6.582318840579711e-06, "loss": 0.3025, "step": 12300 }, { "epoch": 0.8, "learning_rate": 6.575072463768116e-06, "loss": 0.3686, "step": 12325 }, { "epoch": 0.8, "learning_rate": 6.567826086956522e-06, "loss": 0.3866, "step": 12350 }, { "epoch": 0.8, "learning_rate": 6.560579710144928e-06, "loss": 0.3662, "step": 12375 }, { "epoch": 0.8, "learning_rate": 6.553333333333334e-06, "loss": 0.3507, "step": 12400 }, { "epoch": 0.8, "learning_rate": 6.54608695652174e-06, "loss": 0.3165, "step": 12425 }, { "epoch": 0.81, "learning_rate": 6.538840579710145e-06, "loss": 0.3616, "step": 12450 }, { "epoch": 0.81, "learning_rate": 6.531594202898551e-06, "loss": 0.3466, "step": 12475 }, { "epoch": 0.81, "learning_rate": 6.524347826086957e-06, "loss": 0.5202, "step": 12500 }, { "epoch": 0.81, "learning_rate": 6.517101449275362e-06, "loss": 0.3789, "step": 12525 }, { "epoch": 0.81, "learning_rate": 6.509855072463769e-06, "loss": 0.5112, "step": 12550 }, { "epoch": 0.81, "learning_rate": 6.502608695652174e-06, "loss": 0.353, "step": 12575 }, { "epoch": 0.82, "learning_rate": 6.49536231884058e-06, "loss": 0.3469, "step": 12600 }, { "epoch": 0.82, "learning_rate": 6.4881159420289865e-06, "loss": 0.4366, "step": 12625 }, { "epoch": 0.82, "learning_rate": 6.4808695652173915e-06, "loss": 0.309, "step": 12650 }, { "epoch": 0.82, "learning_rate": 6.473623188405797e-06, "loss": 0.4358, "step": 12675 }, { "epoch": 0.82, "learning_rate": 6.466376811594204e-06, "loss": 0.3286, "step": 12700 }, { "epoch": 0.82, "learning_rate": 6.459130434782609e-06, "loss": 0.2837, "step": 12725 }, { "epoch": 0.83, "learning_rate": 6.451884057971015e-06, "loss": 0.3613, "step": 12750 }, { "epoch": 0.83, "learning_rate": 6.444637681159422e-06, "loss": 0.2637, "step": 12775 }, { "epoch": 0.83, "learning_rate": 6.437391304347827e-06, "loss": 0.3415, "step": 12800 }, { "epoch": 0.83, "learning_rate": 6.4301449275362325e-06, "loss": 0.371, "step": 12825 }, { "epoch": 0.83, "learning_rate": 6.4228985507246375e-06, "loss": 0.286, "step": 12850 }, { "epoch": 0.83, "learning_rate": 6.415652173913044e-06, "loss": 0.3646, "step": 12875 }, { "epoch": 0.84, "learning_rate": 6.40840579710145e-06, "loss": 0.4352, "step": 12900 }, { "epoch": 0.84, "learning_rate": 6.401159420289855e-06, "loss": 0.2876, "step": 12925 }, { "epoch": 0.84, "learning_rate": 6.393913043478262e-06, "loss": 0.3672, "step": 12950 }, { "epoch": 0.84, "learning_rate": 6.386666666666668e-06, "loss": 0.2878, "step": 12975 }, { "epoch": 0.84, "learning_rate": 6.379420289855073e-06, "loss": 0.3029, "step": 13000 }, { "epoch": 0.84, "eval_cer": 7.358084509813567, "eval_loss": 0.3902455270290375, "eval_runtime": 3231.646, "eval_samples_per_second": 0.768, "eval_steps_per_second": 0.384, "eval_wer": 19.7347055460263, "step": 13000 }, { "epoch": 1.55, "learning_rate": 6.372173913043479e-06, "loss": 0.3232, "step": 13025 }, { "epoch": 1.55, "learning_rate": 6.364927536231884e-06, "loss": 0.3888, "step": 13050 }, { "epoch": 1.55, "learning_rate": 6.35768115942029e-06, "loss": 0.3928, "step": 13075 }, { "epoch": 1.55, "learning_rate": 6.350434782608697e-06, "loss": 0.3615, "step": 13100 }, { "epoch": 1.56, "learning_rate": 6.343188405797102e-06, "loss": 0.4292, "step": 13125 }, { "epoch": 1.56, "learning_rate": 6.335942028985508e-06, "loss": 0.3445, "step": 13150 }, { "epoch": 1.56, "learning_rate": 6.328695652173914e-06, "loss": 0.3983, "step": 13175 }, { "epoch": 1.57, "learning_rate": 6.3214492753623195e-06, "loss": 0.3746, "step": 13200 }, { "epoch": 1.57, "learning_rate": 6.314202898550725e-06, "loss": 0.3714, "step": 13225 }, { "epoch": 1.57, "learning_rate": 6.30695652173913e-06, "loss": 0.369, "step": 13250 }, { "epoch": 1.58, "learning_rate": 6.299710144927537e-06, "loss": 0.3991, "step": 13275 }, { "epoch": 1.58, "learning_rate": 6.292463768115943e-06, "loss": 0.4264, "step": 13300 }, { "epoch": 1.58, "learning_rate": 6.285217391304348e-06, "loss": 0.2885, "step": 13325 }, { "epoch": 1.58, "learning_rate": 6.277971014492754e-06, "loss": 0.3356, "step": 13350 }, { "epoch": 1.59, "learning_rate": 6.2707246376811605e-06, "loss": 0.3758, "step": 13375 }, { "epoch": 1.59, "learning_rate": 6.2634782608695655e-06, "loss": 0.3424, "step": 13400 }, { "epoch": 1.59, "learning_rate": 6.256231884057971e-06, "loss": 0.3376, "step": 13425 }, { "epoch": 1.6, "learning_rate": 6.248985507246378e-06, "loss": 0.3928, "step": 13450 }, { "epoch": 1.6, "learning_rate": 6.241739130434783e-06, "loss": 0.3247, "step": 13475 }, { "epoch": 1.6, "learning_rate": 6.234492753623189e-06, "loss": 0.3002, "step": 13500 }, { "epoch": 1.6, "learning_rate": 6.227246376811594e-06, "loss": 0.2954, "step": 13525 }, { "epoch": 1.61, "learning_rate": 6.220000000000001e-06, "loss": 0.3292, "step": 13550 }, { "epoch": 1.61, "learning_rate": 6.213043478260871e-06, "loss": 0.3325, "step": 13575 }, { "epoch": 1.61, "learning_rate": 6.205797101449276e-06, "loss": 0.3929, "step": 13600 }, { "epoch": 1.62, "learning_rate": 6.198550724637682e-06, "loss": 0.3311, "step": 13625 }, { "epoch": 1.62, "learning_rate": 6.191304347826087e-06, "loss": 0.2803, "step": 13650 }, { "epoch": 1.62, "learning_rate": 6.1840579710144935e-06, "loss": 0.3777, "step": 13675 }, { "epoch": 1.63, "learning_rate": 6.176811594202899e-06, "loss": 0.387, "step": 13700 }, { "epoch": 1.63, "learning_rate": 6.169565217391304e-06, "loss": 0.3304, "step": 13725 }, { "epoch": 1.63, "learning_rate": 6.162318840579711e-06, "loss": 0.4854, "step": 13750 }, { "epoch": 1.63, "learning_rate": 6.155072463768117e-06, "loss": 0.3572, "step": 13775 }, { "epoch": 1.64, "learning_rate": 6.147826086956522e-06, "loss": 0.3484, "step": 13800 }, { "epoch": 1.64, "learning_rate": 6.140579710144929e-06, "loss": 0.3671, "step": 13825 }, { "epoch": 1.64, "learning_rate": 6.133333333333334e-06, "loss": 0.376, "step": 13850 }, { "epoch": 1.65, "learning_rate": 6.1260869565217395e-06, "loss": 0.3435, "step": 13875 }, { "epoch": 1.65, "learning_rate": 6.118840579710146e-06, "loss": 0.4171, "step": 13900 }, { "epoch": 1.65, "learning_rate": 6.111594202898551e-06, "loss": 0.3793, "step": 13925 }, { "epoch": 1.66, "learning_rate": 6.104347826086957e-06, "loss": 0.4026, "step": 13950 }, { "epoch": 1.66, "learning_rate": 6.097101449275363e-06, "loss": 0.3086, "step": 13975 }, { "epoch": 1.66, "learning_rate": 6.089855072463769e-06, "loss": 0.3549, "step": 14000 }, { "epoch": 1.66, "eval_cer": 7.119509075704658, "eval_loss": 0.39083221554756165, "eval_runtime": 3180.5722, "eval_samples_per_second": 0.78, "eval_steps_per_second": 0.39, "eval_wer": 19.411473222793976, "step": 14000 }, { "epoch": 1.66, "learning_rate": 6.082608695652175e-06, "loss": 0.3889, "step": 14025 }, { "epoch": 1.67, "learning_rate": 6.07536231884058e-06, "loss": 0.3197, "step": 14050 }, { "epoch": 1.67, "learning_rate": 6.068115942028986e-06, "loss": 0.3279, "step": 14075 }, { "epoch": 1.67, "learning_rate": 6.060869565217392e-06, "loss": 0.4178, "step": 14100 }, { "epoch": 1.68, "learning_rate": 6.053623188405797e-06, "loss": 0.3872, "step": 14125 }, { "epoch": 1.68, "learning_rate": 6.046376811594203e-06, "loss": 0.3375, "step": 14150 }, { "epoch": 1.68, "learning_rate": 6.03913043478261e-06, "loss": 0.4023, "step": 14175 }, { "epoch": 1.69, "learning_rate": 6.031884057971015e-06, "loss": 0.4128, "step": 14200 }, { "epoch": 1.69, "learning_rate": 6.024637681159421e-06, "loss": 0.3603, "step": 14225 }, { "epoch": 1.69, "learning_rate": 6.0173913043478264e-06, "loss": 0.3824, "step": 14250 }, { "epoch": 1.69, "learning_rate": 6.010144927536232e-06, "loss": 0.4071, "step": 14275 }, { "epoch": 1.7, "learning_rate": 6.002898550724638e-06, "loss": 0.2672, "step": 14300 }, { "epoch": 1.7, "learning_rate": 5.995652173913043e-06, "loss": 0.327, "step": 14325 }, { "epoch": 1.7, "learning_rate": 5.98840579710145e-06, "loss": 0.3569, "step": 14350 }, { "epoch": 1.71, "learning_rate": 5.981159420289856e-06, "loss": 0.3308, "step": 14375 }, { "epoch": 1.71, "learning_rate": 5.973913043478261e-06, "loss": 0.3802, "step": 14400 }, { "epoch": 1.71, "learning_rate": 5.966666666666667e-06, "loss": 0.4012, "step": 14425 }, { "epoch": 1.71, "learning_rate": 5.959420289855073e-06, "loss": 0.3191, "step": 14450 }, { "epoch": 1.72, "learning_rate": 5.952173913043478e-06, "loss": 0.2991, "step": 14475 }, { "epoch": 1.72, "learning_rate": 5.944927536231885e-06, "loss": 0.3889, "step": 14500 }, { "epoch": 1.72, "learning_rate": 5.93768115942029e-06, "loss": 0.3315, "step": 14525 }, { "epoch": 1.73, "learning_rate": 5.930434782608696e-06, "loss": 0.3925, "step": 14550 }, { "epoch": 1.73, "learning_rate": 5.9231884057971025e-06, "loss": 0.3661, "step": 14575 }, { "epoch": 1.73, "learning_rate": 5.9159420289855076e-06, "loss": 0.4426, "step": 14600 }, { "epoch": 1.74, "learning_rate": 5.908695652173913e-06, "loss": 0.4046, "step": 14625 }, { "epoch": 1.74, "learning_rate": 5.90144927536232e-06, "loss": 0.3361, "step": 14650 }, { "epoch": 1.74, "learning_rate": 5.894202898550725e-06, "loss": 0.4759, "step": 14675 }, { "epoch": 1.74, "learning_rate": 5.886956521739131e-06, "loss": 0.4326, "step": 14700 }, { "epoch": 1.75, "learning_rate": 5.879710144927536e-06, "loss": 0.2716, "step": 14725 }, { "epoch": 1.75, "learning_rate": 5.872463768115943e-06, "loss": 0.3416, "step": 14750 }, { "epoch": 1.75, "learning_rate": 5.8652173913043485e-06, "loss": 0.3715, "step": 14775 }, { "epoch": 1.76, "learning_rate": 5.8579710144927535e-06, "loss": 0.3737, "step": 14800 }, { "epoch": 1.76, "learning_rate": 5.85072463768116e-06, "loss": 0.309, "step": 14825 }, { "epoch": 1.76, "learning_rate": 5.843478260869566e-06, "loss": 0.3327, "step": 14850 }, { "epoch": 1.77, "learning_rate": 5.836231884057971e-06, "loss": 0.401, "step": 14875 }, { "epoch": 1.77, "learning_rate": 5.828985507246378e-06, "loss": 0.2827, "step": 14900 }, { "epoch": 1.77, "learning_rate": 5.821739130434783e-06, "loss": 0.3644, "step": 14925 }, { "epoch": 1.77, "learning_rate": 5.814492753623189e-06, "loss": 0.3638, "step": 14950 }, { "epoch": 1.78, "learning_rate": 5.807246376811595e-06, "loss": 0.4652, "step": 14975 }, { "epoch": 1.78, "learning_rate": 5.8e-06, "loss": 0.3385, "step": 15000 }, { "epoch": 1.78, "eval_cer": 7.779157853313001, "eval_loss": 0.39061304926872253, "eval_runtime": 3221.9453, "eval_samples_per_second": 0.77, "eval_steps_per_second": 0.385, "eval_wer": 20.20506956356013, "step": 15000 }, { "epoch": 1.78, "learning_rate": 5.792753623188406e-06, "loss": 0.4065, "step": 15025 }, { "epoch": 1.79, "learning_rate": 5.785507246376812e-06, "loss": 0.4354, "step": 15050 }, { "epoch": 1.79, "learning_rate": 5.778260869565218e-06, "loss": 0.3932, "step": 15075 }, { "epoch": 1.79, "learning_rate": 5.771014492753624e-06, "loss": 0.3212, "step": 15100 }, { "epoch": 1.79, "learning_rate": 5.76376811594203e-06, "loss": 0.4244, "step": 15125 }, { "epoch": 1.8, "learning_rate": 5.7565217391304355e-06, "loss": 0.306, "step": 15150 }, { "epoch": 1.8, "learning_rate": 5.749275362318841e-06, "loss": 0.3492, "step": 15175 }, { "epoch": 1.8, "learning_rate": 5.742028985507246e-06, "loss": 0.3573, "step": 15200 }, { "epoch": 1.81, "learning_rate": 5.734782608695652e-06, "loss": 0.3975, "step": 15225 }, { "epoch": 1.81, "learning_rate": 5.727536231884059e-06, "loss": 0.3276, "step": 15250 }, { "epoch": 1.81, "learning_rate": 5.720289855072464e-06, "loss": 0.3638, "step": 15275 }, { "epoch": 1.82, "learning_rate": 5.71304347826087e-06, "loss": 0.3312, "step": 15300 }, { "epoch": 1.82, "learning_rate": 5.7057971014492765e-06, "loss": 0.3026, "step": 15325 }, { "epoch": 1.82, "learning_rate": 5.6985507246376815e-06, "loss": 0.3493, "step": 15350 }, { "epoch": 1.82, "learning_rate": 5.691304347826087e-06, "loss": 0.309, "step": 15375 }, { "epoch": 1.83, "learning_rate": 5.684057971014492e-06, "loss": 0.2761, "step": 15400 }, { "epoch": 1.83, "learning_rate": 5.676811594202899e-06, "loss": 0.3507, "step": 15425 }, { "epoch": 1.83, "learning_rate": 5.669565217391305e-06, "loss": 0.3359, "step": 15450 }, { "epoch": 1.84, "learning_rate": 5.66231884057971e-06, "loss": 0.3132, "step": 15475 }, { "epoch": 1.84, "learning_rate": 5.655072463768117e-06, "loss": 0.2976, "step": 15500 }, { "epoch": 1.84, "learning_rate": 5.6478260869565225e-06, "loss": 0.3893, "step": 15525 }, { "epoch": 1.85, "learning_rate": 5.6405797101449275e-06, "loss": 0.3417, "step": 15550 }, { "epoch": 1.85, "learning_rate": 5.633333333333334e-06, "loss": 0.3462, "step": 15575 }, { "epoch": 1.85, "learning_rate": 5.626086956521739e-06, "loss": 0.3885, "step": 15600 }, { "epoch": 1.85, "learning_rate": 5.618840579710145e-06, "loss": 0.3844, "step": 15625 }, { "epoch": 1.86, "learning_rate": 5.611594202898552e-06, "loss": 0.3112, "step": 15650 }, { "epoch": 1.86, "learning_rate": 5.604347826086957e-06, "loss": 0.3266, "step": 15675 }, { "epoch": 1.86, "learning_rate": 5.597101449275363e-06, "loss": 0.3538, "step": 15700 }, { "epoch": 1.87, "learning_rate": 5.589855072463769e-06, "loss": 0.351, "step": 15725 }, { "epoch": 1.87, "learning_rate": 5.582608695652174e-06, "loss": 0.3373, "step": 15750 }, { "epoch": 1.87, "learning_rate": 5.57536231884058e-06, "loss": 0.4156, "step": 15775 }, { "epoch": 1.87, "learning_rate": 5.568115942028985e-06, "loss": 0.4124, "step": 15800 }, { "epoch": 1.88, "learning_rate": 5.560869565217392e-06, "loss": 0.3716, "step": 15825 }, { "epoch": 1.88, "learning_rate": 5.553623188405798e-06, "loss": 0.5276, "step": 15850 }, { "epoch": 1.88, "learning_rate": 5.546376811594203e-06, "loss": 0.3412, "step": 15875 }, { "epoch": 1.89, "learning_rate": 5.5391304347826094e-06, "loss": 0.3293, "step": 15900 }, { "epoch": 1.89, "learning_rate": 5.531884057971015e-06, "loss": 0.3759, "step": 15925 }, { "epoch": 1.89, "learning_rate": 5.52463768115942e-06, "loss": 0.3926, "step": 15950 }, { "epoch": 1.9, "learning_rate": 5.517391304347827e-06, "loss": 0.3686, "step": 15975 }, { "epoch": 1.9, "learning_rate": 5.510144927536233e-06, "loss": 0.3282, "step": 16000 }, { "epoch": 1.9, "eval_cer": 7.108072212110778, "eval_loss": 0.39232152700424194, "eval_runtime": 3154.8615, "eval_samples_per_second": 0.787, "eval_steps_per_second": 0.393, "eval_wer": 19.265103868877453, "step": 16000 }, { "epoch": 1.9, "learning_rate": 5.502898550724638e-06, "loss": 0.3279, "step": 16025 }, { "epoch": 1.9, "learning_rate": 5.4956521739130446e-06, "loss": 0.4442, "step": 16050 }, { "epoch": 1.91, "learning_rate": 5.4884057971014496e-06, "loss": 0.4354, "step": 16075 }, { "epoch": 1.91, "learning_rate": 5.481159420289855e-06, "loss": 0.362, "step": 16100 }, { "epoch": 1.91, "learning_rate": 5.473913043478261e-06, "loss": 0.3849, "step": 16125 }, { "epoch": 1.92, "learning_rate": 5.466666666666667e-06, "loss": 0.3956, "step": 16150 }, { "epoch": 1.92, "learning_rate": 5.459420289855073e-06, "loss": 0.2881, "step": 16175 }, { "epoch": 1.92, "learning_rate": 5.452173913043479e-06, "loss": 0.3321, "step": 16200 }, { "epoch": 1.93, "learning_rate": 5.444927536231885e-06, "loss": 0.3512, "step": 16225 }, { "epoch": 1.93, "learning_rate": 5.4376811594202905e-06, "loss": 0.3227, "step": 16250 }, { "epoch": 1.93, "learning_rate": 5.4304347826086955e-06, "loss": 0.3204, "step": 16275 }, { "epoch": 1.93, "learning_rate": 5.423188405797101e-06, "loss": 0.2884, "step": 16300 }, { "epoch": 1.94, "learning_rate": 5.415942028985508e-06, "loss": 0.3259, "step": 16325 }, { "epoch": 1.94, "learning_rate": 5.408695652173913e-06, "loss": 0.3611, "step": 16350 }, { "epoch": 1.94, "learning_rate": 5.401449275362319e-06, "loss": 0.3598, "step": 16375 }, { "epoch": 1.95, "learning_rate": 5.394202898550726e-06, "loss": 0.3911, "step": 16400 }, { "epoch": 1.95, "learning_rate": 5.386956521739131e-06, "loss": 0.4117, "step": 16425 }, { "epoch": 1.95, "learning_rate": 5.3797101449275365e-06, "loss": 0.4095, "step": 16450 }, { "epoch": 1.96, "learning_rate": 5.3724637681159415e-06, "loss": 0.3033, "step": 16475 }, { "epoch": 1.96, "learning_rate": 5.365217391304348e-06, "loss": 0.3534, "step": 16500 }, { "epoch": 1.96, "learning_rate": 5.357971014492754e-06, "loss": 0.2906, "step": 16525 }, { "epoch": 1.96, "learning_rate": 5.350724637681159e-06, "loss": 0.2948, "step": 16550 }, { "epoch": 1.97, "learning_rate": 5.343478260869566e-06, "loss": 0.2731, "step": 16575 }, { "epoch": 1.97, "learning_rate": 5.336231884057972e-06, "loss": 0.3218, "step": 16600 }, { "epoch": 1.97, "learning_rate": 5.328985507246377e-06, "loss": 0.328, "step": 16625 }, { "epoch": 1.98, "learning_rate": 5.321739130434783e-06, "loss": 0.274, "step": 16650 }, { "epoch": 1.98, "learning_rate": 5.314492753623189e-06, "loss": 0.2936, "step": 16675 }, { "epoch": 1.98, "learning_rate": 5.307246376811594e-06, "loss": 0.3601, "step": 16700 }, { "epoch": 1.98, "learning_rate": 5.3002898550724646e-06, "loss": 0.4228, "step": 16725 }, { "epoch": 1.99, "learning_rate": 5.2930434782608696e-06, "loss": 0.3024, "step": 16750 }, { "epoch": 1.99, "learning_rate": 5.285797101449276e-06, "loss": 0.3463, "step": 16775 }, { "epoch": 1.99, "learning_rate": 5.278550724637682e-06, "loss": 0.3282, "step": 16800 }, { "epoch": 2.0, "learning_rate": 5.271304347826087e-06, "loss": 0.3138, "step": 16825 }, { "epoch": 2.0, "learning_rate": 5.264057971014494e-06, "loss": 0.3608, "step": 16850 }, { "epoch": 2.0, "learning_rate": 5.256811594202899e-06, "loss": 0.2716, "step": 16875 }, { "epoch": 2.01, "learning_rate": 5.249565217391305e-06, "loss": 0.4661, "step": 16900 }, { "epoch": 2.01, "learning_rate": 5.242318840579711e-06, "loss": 0.2482, "step": 16925 }, { "epoch": 2.01, "learning_rate": 5.235072463768116e-06, "loss": 0.34, "step": 16950 }, { "epoch": 2.01, "learning_rate": 5.227826086956522e-06, "loss": 0.3228, "step": 16975 }, { "epoch": 2.02, "learning_rate": 5.220579710144928e-06, "loss": 0.3196, "step": 17000 }, { "epoch": 2.02, "eval_cer": 7.224900388607408, "eval_loss": 0.39229413866996765, "eval_runtime": 3162.0207, "eval_samples_per_second": 0.785, "eval_steps_per_second": 0.392, "eval_wer": 19.335239184295787, "step": 17000 }, { "epoch": 2.02, "learning_rate": 5.213333333333334e-06, "loss": 0.2583, "step": 17025 }, { "epoch": 2.02, "learning_rate": 5.20608695652174e-06, "loss": 0.248, "step": 17050 }, { "epoch": 2.03, "learning_rate": 5.198840579710145e-06, "loss": 0.2901, "step": 17075 }, { "epoch": 2.03, "learning_rate": 5.191594202898551e-06, "loss": 0.2492, "step": 17100 }, { "epoch": 2.03, "learning_rate": 5.184347826086957e-06, "loss": 0.3115, "step": 17125 }, { "epoch": 2.04, "learning_rate": 5.177101449275362e-06, "loss": 0.3328, "step": 17150 }, { "epoch": 2.04, "learning_rate": 5.169855072463768e-06, "loss": 0.2782, "step": 17175 }, { "epoch": 2.04, "learning_rate": 5.162608695652175e-06, "loss": 0.2778, "step": 17200 }, { "epoch": 2.04, "learning_rate": 5.15536231884058e-06, "loss": 0.2721, "step": 17225 }, { "epoch": 2.05, "learning_rate": 5.148115942028986e-06, "loss": 0.361, "step": 17250 }, { "epoch": 2.05, "learning_rate": 5.140869565217391e-06, "loss": 0.3612, "step": 17275 }, { "epoch": 2.05, "learning_rate": 5.1336231884057975e-06, "loss": 0.2824, "step": 17300 }, { "epoch": 2.06, "learning_rate": 5.126376811594203e-06, "loss": 0.2909, "step": 17325 }, { "epoch": 2.06, "learning_rate": 5.119130434782608e-06, "loss": 0.2773, "step": 17350 }, { "epoch": 2.06, "learning_rate": 5.111884057971015e-06, "loss": 0.3971, "step": 17375 }, { "epoch": 2.06, "learning_rate": 5.104637681159421e-06, "loss": 0.2334, "step": 17400 }, { "epoch": 2.07, "learning_rate": 5.097391304347826e-06, "loss": 0.3899, "step": 17425 }, { "epoch": 2.07, "learning_rate": 5.090144927536233e-06, "loss": 0.321, "step": 17450 }, { "epoch": 2.07, "learning_rate": 5.082898550724638e-06, "loss": 0.2295, "step": 17475 }, { "epoch": 2.08, "learning_rate": 5.0756521739130435e-06, "loss": 0.278, "step": 17500 }, { "epoch": 2.08, "learning_rate": 5.06840579710145e-06, "loss": 0.2696, "step": 17525 }, { "epoch": 2.08, "learning_rate": 5.061159420289855e-06, "loss": 0.2604, "step": 17550 }, { "epoch": 2.09, "learning_rate": 5.053913043478261e-06, "loss": 0.3015, "step": 17575 }, { "epoch": 2.09, "learning_rate": 5.046666666666668e-06, "loss": 0.1998, "step": 17600 }, { "epoch": 2.09, "learning_rate": 5.039420289855073e-06, "loss": 0.3426, "step": 17625 }, { "epoch": 2.09, "learning_rate": 5.032173913043479e-06, "loss": 0.3037, "step": 17650 }, { "epoch": 2.1, "learning_rate": 5.024927536231885e-06, "loss": 0.3063, "step": 17675 }, { "epoch": 2.1, "learning_rate": 5.01768115942029e-06, "loss": 0.2932, "step": 17700 }, { "epoch": 2.1, "learning_rate": 5.010434782608696e-06, "loss": 0.3028, "step": 17725 }, { "epoch": 2.11, "learning_rate": 5.003188405797101e-06, "loss": 0.2644, "step": 17750 }, { "epoch": 2.11, "learning_rate": 4.995942028985508e-06, "loss": 0.2902, "step": 17775 }, { "epoch": 2.11, "learning_rate": 4.988695652173913e-06, "loss": 0.2816, "step": 17800 }, { "epoch": 2.12, "learning_rate": 4.98144927536232e-06, "loss": 0.3323, "step": 17825 }, { "epoch": 2.12, "learning_rate": 4.9742028985507255e-06, "loss": 0.2923, "step": 17850 }, { "epoch": 2.12, "learning_rate": 4.9669565217391305e-06, "loss": 0.3281, "step": 17875 }, { "epoch": 2.12, "learning_rate": 4.959710144927536e-06, "loss": 0.3877, "step": 17900 }, { "epoch": 2.13, "learning_rate": 4.952463768115943e-06, "loss": 0.372, "step": 17925 }, { "epoch": 2.13, "learning_rate": 4.945217391304348e-06, "loss": 0.2854, "step": 17950 }, { "epoch": 2.13, "learning_rate": 4.937971014492754e-06, "loss": 0.3001, "step": 17975 }, { "epoch": 2.14, "learning_rate": 4.93072463768116e-06, "loss": 0.3251, "step": 18000 }, { "epoch": 2.14, "eval_cer": 7.176078508534606, "eval_loss": 0.39806175231933594, "eval_runtime": 3134.0346, "eval_samples_per_second": 0.792, "eval_steps_per_second": 0.396, "eval_wer": 19.483133218982278, "step": 18000 }, { "epoch": 2.14, "learning_rate": 4.923478260869566e-06, "loss": 0.3021, "step": 18025 }, { "epoch": 2.14, "learning_rate": 4.9162318840579714e-06, "loss": 0.2846, "step": 18050 }, { "epoch": 2.14, "learning_rate": 4.908985507246377e-06, "loss": 0.284, "step": 18075 }, { "epoch": 2.15, "learning_rate": 4.901739130434783e-06, "loss": 0.2423, "step": 18100 }, { "epoch": 2.15, "learning_rate": 4.894492753623189e-06, "loss": 0.2551, "step": 18125 }, { "epoch": 2.15, "learning_rate": 4.887246376811595e-06, "loss": 0.4317, "step": 18150 }, { "epoch": 2.16, "learning_rate": 4.880000000000001e-06, "loss": 0.4729, "step": 18175 }, { "epoch": 2.16, "learning_rate": 4.872753623188406e-06, "loss": 0.2887, "step": 18200 }, { "epoch": 2.16, "learning_rate": 4.865507246376812e-06, "loss": 0.4263, "step": 18225 }, { "epoch": 2.17, "learning_rate": 4.8582608695652174e-06, "loss": 0.3566, "step": 18250 }, { "epoch": 2.17, "learning_rate": 4.851014492753623e-06, "loss": 0.3274, "step": 18275 }, { "epoch": 2.17, "learning_rate": 4.843768115942029e-06, "loss": 0.2818, "step": 18300 }, { "epoch": 2.17, "learning_rate": 4.836521739130435e-06, "loss": 0.29, "step": 18325 }, { "epoch": 2.18, "learning_rate": 4.829275362318841e-06, "loss": 0.3009, "step": 18350 }, { "epoch": 2.18, "learning_rate": 4.822028985507247e-06, "loss": 0.3663, "step": 18375 }, { "epoch": 2.18, "learning_rate": 4.8147826086956526e-06, "loss": 0.2181, "step": 18400 }, { "epoch": 2.19, "learning_rate": 4.807536231884058e-06, "loss": 0.4402, "step": 18425 }, { "epoch": 2.19, "learning_rate": 4.800289855072464e-06, "loss": 0.3224, "step": 18450 }, { "epoch": 2.19, "learning_rate": 4.79304347826087e-06, "loss": 0.4503, "step": 18475 }, { "epoch": 2.2, "learning_rate": 4.785797101449276e-06, "loss": 0.3597, "step": 18500 }, { "epoch": 2.2, "learning_rate": 4.778550724637682e-06, "loss": 0.3584, "step": 18525 }, { "epoch": 2.2, "learning_rate": 4.771304347826088e-06, "loss": 0.3391, "step": 18550 }, { "epoch": 2.2, "learning_rate": 4.764057971014493e-06, "loss": 0.3192, "step": 18575 }, { "epoch": 2.21, "learning_rate": 4.756811594202899e-06, "loss": 0.3671, "step": 18600 }, { "epoch": 2.21, "learning_rate": 4.749565217391305e-06, "loss": 0.3506, "step": 18625 }, { "epoch": 2.21, "learning_rate": 4.74231884057971e-06, "loss": 0.3515, "step": 18650 }, { "epoch": 2.22, "learning_rate": 4.735072463768116e-06, "loss": 0.2615, "step": 18675 }, { "epoch": 2.22, "learning_rate": 4.727826086956522e-06, "loss": 0.2509, "step": 18700 }, { "epoch": 2.22, "learning_rate": 4.720579710144928e-06, "loss": 0.3, "step": 18725 }, { "epoch": 2.22, "learning_rate": 4.713333333333334e-06, "loss": 0.302, "step": 18750 }, { "epoch": 2.23, "learning_rate": 4.7060869565217395e-06, "loss": 0.2971, "step": 18775 }, { "epoch": 2.23, "learning_rate": 4.698840579710145e-06, "loss": 0.4138, "step": 18800 }, { "epoch": 2.23, "learning_rate": 4.691594202898551e-06, "loss": 0.296, "step": 18825 }, { "epoch": 2.24, "learning_rate": 4.684347826086957e-06, "loss": 0.2533, "step": 18850 }, { "epoch": 2.24, "learning_rate": 4.677101449275362e-06, "loss": 0.2477, "step": 18875 }, { "epoch": 2.24, "learning_rate": 4.669855072463769e-06, "loss": 0.2952, "step": 18900 }, { "epoch": 2.25, "learning_rate": 4.662608695652175e-06, "loss": 0.2471, "step": 18925 }, { "epoch": 2.25, "learning_rate": 4.65536231884058e-06, "loss": 0.2664, "step": 18950 }, { "epoch": 2.25, "learning_rate": 4.6481159420289855e-06, "loss": 0.2127, "step": 18975 }, { "epoch": 2.25, "learning_rate": 4.640869565217392e-06, "loss": 0.4162, "step": 19000 }, { "epoch": 2.25, "eval_cer": 7.059004377982194, "eval_loss": 0.39584028720855713, "eval_runtime": 3153.6429, "eval_samples_per_second": 0.787, "eval_steps_per_second": 0.394, "eval_wer": 19.057747284162378, "step": 19000 }, { "epoch": 2.26, "learning_rate": 4.633623188405797e-06, "loss": 0.286, "step": 19025 }, { "epoch": 2.26, "learning_rate": 4.626376811594203e-06, "loss": 0.2912, "step": 19050 }, { "epoch": 2.26, "learning_rate": 4.619130434782609e-06, "loss": 0.2905, "step": 19075 }, { "epoch": 2.27, "learning_rate": 4.611884057971015e-06, "loss": 0.333, "step": 19100 }, { "epoch": 2.27, "learning_rate": 4.604637681159421e-06, "loss": 0.2647, "step": 19125 }, { "epoch": 2.27, "learning_rate": 4.5973913043478265e-06, "loss": 0.2746, "step": 19150 }, { "epoch": 2.28, "learning_rate": 4.590144927536232e-06, "loss": 0.3317, "step": 19175 }, { "epoch": 2.28, "learning_rate": 4.582898550724638e-06, "loss": 0.2549, "step": 19200 }, { "epoch": 2.28, "learning_rate": 4.575652173913044e-06, "loss": 0.312, "step": 19225 }, { "epoch": 2.28, "learning_rate": 4.56840579710145e-06, "loss": 0.3177, "step": 19250 }, { "epoch": 2.29, "learning_rate": 4.561159420289856e-06, "loss": 0.3063, "step": 19275 }, { "epoch": 2.29, "learning_rate": 4.553913043478262e-06, "loss": 0.3964, "step": 19300 }, { "epoch": 2.29, "learning_rate": 4.546666666666667e-06, "loss": 0.3377, "step": 19325 }, { "epoch": 2.3, "learning_rate": 4.5394202898550725e-06, "loss": 0.2753, "step": 19350 }, { "epoch": 2.3, "learning_rate": 4.532173913043479e-06, "loss": 0.2735, "step": 19375 }, { "epoch": 2.3, "learning_rate": 4.524927536231884e-06, "loss": 0.292, "step": 19400 }, { "epoch": 2.31, "learning_rate": 4.51768115942029e-06, "loss": 0.2894, "step": 19425 }, { "epoch": 2.31, "learning_rate": 4.510434782608696e-06, "loss": 0.367, "step": 19450 }, { "epoch": 2.31, "learning_rate": 4.503188405797102e-06, "loss": 0.2483, "step": 19475 }, { "epoch": 2.31, "learning_rate": 4.495942028985508e-06, "loss": 0.4151, "step": 19500 }, { "epoch": 2.32, "learning_rate": 4.4886956521739134e-06, "loss": 0.269, "step": 19525 }, { "epoch": 2.32, "learning_rate": 4.481449275362319e-06, "loss": 0.3127, "step": 19550 }, { "epoch": 2.32, "learning_rate": 4.474202898550725e-06, "loss": 0.2615, "step": 19575 }, { "epoch": 2.33, "learning_rate": 4.466956521739131e-06, "loss": 0.2606, "step": 19600 }, { "epoch": 2.33, "learning_rate": 4.459710144927537e-06, "loss": 0.2855, "step": 19625 }, { "epoch": 2.33, "learning_rate": 4.452463768115942e-06, "loss": 0.2419, "step": 19650 }, { "epoch": 2.33, "learning_rate": 4.4452173913043486e-06, "loss": 0.3292, "step": 19675 }, { "epoch": 2.34, "learning_rate": 4.4379710144927544e-06, "loss": 0.2821, "step": 19700 }, { "epoch": 2.34, "learning_rate": 4.4307246376811594e-06, "loss": 0.3189, "step": 19725 }, { "epoch": 2.34, "learning_rate": 4.423478260869565e-06, "loss": 0.286, "step": 19750 }, { "epoch": 2.35, "learning_rate": 4.416231884057971e-06, "loss": 0.2853, "step": 19775 }, { "epoch": 2.35, "learning_rate": 4.408985507246377e-06, "loss": 0.2835, "step": 19800 }, { "epoch": 2.35, "learning_rate": 4.401739130434783e-06, "loss": 0.2626, "step": 19825 }, { "epoch": 2.36, "learning_rate": 4.394492753623189e-06, "loss": 0.3301, "step": 19850 }, { "epoch": 2.36, "learning_rate": 4.3872463768115946e-06, "loss": 0.3094, "step": 19875 }, { "epoch": 2.36, "learning_rate": 4.380289855072464e-06, "loss": 0.2322, "step": 19900 }, { "epoch": 2.36, "learning_rate": 4.37304347826087e-06, "loss": 0.3167, "step": 19925 }, { "epoch": 2.37, "learning_rate": 4.365797101449276e-06, "loss": 0.3029, "step": 19950 }, { "epoch": 2.37, "learning_rate": 4.358550724637682e-06, "loss": 0.2892, "step": 19975 }, { "epoch": 2.37, "learning_rate": 4.3513043478260875e-06, "loss": 0.2851, "step": 20000 }, { "epoch": 2.37, "eval_cer": 7.0167002803876235, "eval_loss": 0.39532455801963806, "eval_runtime": 3151.9912, "eval_samples_per_second": 0.787, "eval_steps_per_second": 0.394, "eval_wer": 19.209453020773775, "step": 20000 }, { "epoch": 2.38, "learning_rate": 4.344057971014493e-06, "loss": 0.2749, "step": 20025 }, { "epoch": 2.38, "learning_rate": 4.336811594202899e-06, "loss": 0.3344, "step": 20050 }, { "epoch": 2.38, "learning_rate": 4.329565217391305e-06, "loss": 0.2773, "step": 20075 }, { "epoch": 2.39, "learning_rate": 4.322318840579711e-06, "loss": 0.2361, "step": 20100 }, { "epoch": 2.39, "learning_rate": 4.315072463768116e-06, "loss": 0.2254, "step": 20125 }, { "epoch": 2.39, "learning_rate": 4.307826086956522e-06, "loss": 0.2396, "step": 20150 }, { "epoch": 2.39, "learning_rate": 4.3005797101449284e-06, "loss": 0.2621, "step": 20175 }, { "epoch": 2.4, "learning_rate": 4.2933333333333334e-06, "loss": 0.31, "step": 20200 }, { "epoch": 2.4, "learning_rate": 4.286086956521739e-06, "loss": 0.3039, "step": 20225 }, { "epoch": 2.4, "learning_rate": 4.278840579710145e-06, "loss": 0.2772, "step": 20250 }, { "epoch": 2.41, "learning_rate": 4.271594202898551e-06, "loss": 0.2535, "step": 20275 }, { "epoch": 2.41, "learning_rate": 4.264347826086957e-06, "loss": 0.2903, "step": 20300 }, { "epoch": 2.41, "learning_rate": 4.257101449275363e-06, "loss": 0.3347, "step": 20325 }, { "epoch": 2.41, "learning_rate": 4.2498550724637686e-06, "loss": 0.3133, "step": 20350 }, { "epoch": 2.42, "learning_rate": 4.2426086956521744e-06, "loss": 0.2631, "step": 20375 }, { "epoch": 2.42, "learning_rate": 4.23536231884058e-06, "loss": 0.2973, "step": 20400 }, { "epoch": 2.42, "learning_rate": 4.228115942028986e-06, "loss": 0.2731, "step": 20425 }, { "epoch": 2.43, "learning_rate": 4.220869565217391e-06, "loss": 0.3088, "step": 20450 }, { "epoch": 2.43, "learning_rate": 4.213623188405798e-06, "loss": 0.3291, "step": 20475 }, { "epoch": 2.43, "learning_rate": 4.206376811594204e-06, "loss": 0.2447, "step": 20500 }, { "epoch": 2.44, "learning_rate": 4.199130434782609e-06, "loss": 0.3862, "step": 20525 }, { "epoch": 2.44, "learning_rate": 4.1918840579710146e-06, "loss": 0.3494, "step": 20550 }, { "epoch": 2.44, "learning_rate": 4.18463768115942e-06, "loss": 0.314, "step": 20575 }, { "epoch": 2.44, "learning_rate": 4.177391304347826e-06, "loss": 0.3158, "step": 20600 }, { "epoch": 2.45, "learning_rate": 4.170144927536232e-06, "loss": 0.2839, "step": 20625 }, { "epoch": 2.45, "learning_rate": 4.162898550724638e-06, "loss": 0.2518, "step": 20650 }, { "epoch": 2.45, "learning_rate": 4.155652173913044e-06, "loss": 0.3692, "step": 20675 }, { "epoch": 2.46, "learning_rate": 4.14840579710145e-06, "loss": 0.2712, "step": 20700 }, { "epoch": 2.46, "learning_rate": 4.1411594202898555e-06, "loss": 0.2804, "step": 20725 }, { "epoch": 2.46, "learning_rate": 4.1339130434782605e-06, "loss": 0.3514, "step": 20750 }, { "epoch": 2.47, "learning_rate": 4.126666666666667e-06, "loss": 0.2892, "step": 20775 }, { "epoch": 2.47, "learning_rate": 4.119420289855073e-06, "loss": 0.2898, "step": 20800 }, { "epoch": 2.47, "learning_rate": 4.112173913043478e-06, "loss": 0.3071, "step": 20825 }, { "epoch": 2.47, "learning_rate": 4.104927536231885e-06, "loss": 0.2719, "step": 20850 }, { "epoch": 2.48, "learning_rate": 4.097681159420291e-06, "loss": 0.3628, "step": 20875 }, { "epoch": 2.48, "learning_rate": 4.090434782608696e-06, "loss": 0.3201, "step": 20900 }, { "epoch": 2.48, "learning_rate": 4.0831884057971015e-06, "loss": 0.3166, "step": 20925 }, { "epoch": 2.49, "learning_rate": 4.075942028985508e-06, "loss": 0.3418, "step": 20950 }, { "epoch": 2.49, "learning_rate": 4.068695652173913e-06, "loss": 0.288, "step": 20975 }, { "epoch": 2.49, "learning_rate": 4.061449275362319e-06, "loss": 0.2982, "step": 21000 }, { "epoch": 2.49, "eval_cer": 6.842564808893699, "eval_loss": 0.39293238520622253, "eval_runtime": 3128.5672, "eval_samples_per_second": 0.793, "eval_steps_per_second": 0.397, "eval_wer": 18.80998665904326, "step": 21000 }, { "epoch": 2.49, "learning_rate": 4.054202898550725e-06, "loss": 0.2191, "step": 21025 }, { "epoch": 2.5, "learning_rate": 4.046956521739131e-06, "loss": 0.3047, "step": 21050 }, { "epoch": 2.5, "learning_rate": 4.039710144927537e-06, "loss": 0.2752, "step": 21075 }, { "epoch": 2.5, "learning_rate": 4.0324637681159425e-06, "loss": 0.2675, "step": 21100 }, { "epoch": 2.51, "learning_rate": 4.025217391304348e-06, "loss": 0.2971, "step": 21125 }, { "epoch": 2.51, "learning_rate": 4.017971014492754e-06, "loss": 0.3199, "step": 21150 }, { "epoch": 2.51, "learning_rate": 4.01072463768116e-06, "loss": 0.2402, "step": 21175 }, { "epoch": 2.52, "learning_rate": 4.003478260869565e-06, "loss": 0.2752, "step": 21200 }, { "epoch": 2.52, "learning_rate": 3.996231884057971e-06, "loss": 0.3148, "step": 21225 }, { "epoch": 2.52, "learning_rate": 3.988985507246378e-06, "loss": 0.2471, "step": 21250 }, { "epoch": 2.52, "learning_rate": 3.981739130434783e-06, "loss": 0.2807, "step": 21275 }, { "epoch": 2.53, "learning_rate": 3.9744927536231885e-06, "loss": 0.2242, "step": 21300 }, { "epoch": 2.53, "learning_rate": 3.967246376811594e-06, "loss": 0.4252, "step": 21325 }, { "epoch": 2.53, "learning_rate": 3.96e-06, "loss": 0.2453, "step": 21350 }, { "epoch": 2.54, "learning_rate": 3.952753623188406e-06, "loss": 0.2282, "step": 21375 }, { "epoch": 2.54, "learning_rate": 3.945507246376812e-06, "loss": 0.353, "step": 21400 }, { "epoch": 2.54, "learning_rate": 3.938260869565218e-06, "loss": 0.3021, "step": 21425 }, { "epoch": 2.55, "learning_rate": 3.931014492753624e-06, "loss": 0.2803, "step": 21450 }, { "epoch": 2.55, "learning_rate": 3.9237681159420295e-06, "loss": 0.2523, "step": 21475 }, { "epoch": 2.55, "learning_rate": 3.916521739130435e-06, "loss": 0.2748, "step": 21500 }, { "epoch": 2.55, "learning_rate": 3.90927536231884e-06, "loss": 0.3106, "step": 21525 }, { "epoch": 2.56, "learning_rate": 3.902028985507247e-06, "loss": 0.3489, "step": 21550 }, { "epoch": 2.56, "learning_rate": 3.894782608695653e-06, "loss": 0.3188, "step": 21575 }, { "epoch": 2.56, "learning_rate": 3.887536231884058e-06, "loss": 0.3188, "step": 21600 }, { "epoch": 2.57, "learning_rate": 3.880289855072465e-06, "loss": 0.3178, "step": 21625 }, { "epoch": 2.57, "learning_rate": 3.87304347826087e-06, "loss": 0.2279, "step": 21650 }, { "epoch": 2.57, "learning_rate": 3.8657971014492755e-06, "loss": 0.2803, "step": 21675 }, { "epoch": 2.58, "learning_rate": 3.858550724637681e-06, "loss": 0.21, "step": 21700 }, { "epoch": 2.58, "learning_rate": 3.851304347826087e-06, "loss": 0.2753, "step": 21725 }, { "epoch": 2.58, "learning_rate": 3.844057971014493e-06, "loss": 0.4256, "step": 21750 }, { "epoch": 2.58, "learning_rate": 3.836811594202899e-06, "loss": 0.2934, "step": 21775 }, { "epoch": 2.59, "learning_rate": 3.829565217391305e-06, "loss": 0.3364, "step": 21800 }, { "epoch": 2.59, "learning_rate": 3.822318840579711e-06, "loss": 0.3053, "step": 21825 }, { "epoch": 2.59, "learning_rate": 3.8150724637681164e-06, "loss": 0.3143, "step": 21850 }, { "epoch": 2.6, "learning_rate": 3.807826086956522e-06, "loss": 0.2758, "step": 21875 }, { "epoch": 2.6, "learning_rate": 3.8005797101449277e-06, "loss": 0.2616, "step": 21900 }, { "epoch": 2.6, "learning_rate": 3.793333333333334e-06, "loss": 0.2949, "step": 21925 }, { "epoch": 2.6, "learning_rate": 3.7860869565217394e-06, "loss": 0.358, "step": 21950 }, { "epoch": 2.61, "learning_rate": 3.7788405797101453e-06, "loss": 0.2856, "step": 21975 }, { "epoch": 2.61, "learning_rate": 3.7715942028985507e-06, "loss": 0.3642, "step": 22000 }, { "epoch": 2.61, "eval_cer": 6.886713561906636, "eval_loss": 0.3953614830970764, "eval_runtime": 3140.8887, "eval_samples_per_second": 0.79, "eval_steps_per_second": 0.395, "eval_wer": 18.69716028206594, "step": 22000 }, { "epoch": 2.61, "learning_rate": 3.764347826086957e-06, "loss": 0.283, "step": 22025 }, { "epoch": 2.62, "learning_rate": 3.757101449275363e-06, "loss": 0.3267, "step": 22050 }, { "epoch": 2.62, "learning_rate": 3.7498550724637683e-06, "loss": 0.3271, "step": 22075 }, { "epoch": 2.62, "learning_rate": 3.742608695652174e-06, "loss": 0.3372, "step": 22100 }, { "epoch": 2.63, "learning_rate": 3.7353623188405804e-06, "loss": 0.2551, "step": 22125 }, { "epoch": 2.63, "learning_rate": 3.728115942028986e-06, "loss": 0.3063, "step": 22150 }, { "epoch": 2.63, "learning_rate": 3.7208695652173917e-06, "loss": 0.2902, "step": 22175 }, { "epoch": 2.63, "learning_rate": 3.713623188405797e-06, "loss": 0.255, "step": 22200 }, { "epoch": 2.64, "learning_rate": 3.7063768115942034e-06, "loss": 0.3041, "step": 22225 }, { "epoch": 2.64, "learning_rate": 3.699130434782609e-06, "loss": 0.3338, "step": 22250 }, { "epoch": 2.64, "learning_rate": 3.6918840579710147e-06, "loss": 0.2509, "step": 22275 }, { "epoch": 2.65, "learning_rate": 3.68463768115942e-06, "loss": 0.2996, "step": 22300 }, { "epoch": 2.65, "learning_rate": 3.6773913043478264e-06, "loss": 0.3299, "step": 22325 }, { "epoch": 2.65, "learning_rate": 3.6701449275362323e-06, "loss": 0.234, "step": 22350 }, { "epoch": 2.66, "learning_rate": 3.6628985507246377e-06, "loss": 0.304, "step": 22375 }, { "epoch": 2.66, "learning_rate": 3.6556521739130435e-06, "loss": 0.3406, "step": 22400 }, { "epoch": 2.66, "learning_rate": 3.64840579710145e-06, "loss": 0.2437, "step": 22425 }, { "epoch": 2.66, "learning_rate": 3.6411594202898552e-06, "loss": 0.4036, "step": 22450 }, { "epoch": 2.67, "learning_rate": 3.633913043478261e-06, "loss": 0.431, "step": 22475 }, { "epoch": 2.67, "learning_rate": 3.6266666666666674e-06, "loss": 0.2864, "step": 22500 }, { "epoch": 2.67, "learning_rate": 3.619420289855073e-06, "loss": 0.2791, "step": 22525 }, { "epoch": 2.68, "learning_rate": 3.6121739130434787e-06, "loss": 0.2975, "step": 22550 }, { "epoch": 2.68, "learning_rate": 3.604927536231884e-06, "loss": 0.3252, "step": 22575 }, { "epoch": 2.68, "learning_rate": 3.5976811594202904e-06, "loss": 0.2389, "step": 22600 }, { "epoch": 2.68, "learning_rate": 3.5904347826086962e-06, "loss": 0.3063, "step": 22625 }, { "epoch": 2.69, "learning_rate": 3.5831884057971017e-06, "loss": 0.2614, "step": 22650 }, { "epoch": 2.69, "learning_rate": 3.5759420289855075e-06, "loss": 0.2833, "step": 22675 }, { "epoch": 2.69, "learning_rate": 3.5686956521739134e-06, "loss": 0.3931, "step": 22700 }, { "epoch": 2.7, "learning_rate": 3.5614492753623192e-06, "loss": 0.2804, "step": 22725 }, { "epoch": 2.7, "learning_rate": 3.554202898550725e-06, "loss": 0.2688, "step": 22750 }, { "epoch": 2.7, "learning_rate": 3.5469565217391305e-06, "loss": 0.2059, "step": 22775 }, { "epoch": 2.71, "learning_rate": 3.5397101449275368e-06, "loss": 0.3133, "step": 22800 }, { "epoch": 2.71, "learning_rate": 3.5324637681159422e-06, "loss": 0.2725, "step": 22825 }, { "epoch": 2.71, "learning_rate": 3.525217391304348e-06, "loss": 0.2712, "step": 22850 }, { "epoch": 2.71, "learning_rate": 3.5179710144927535e-06, "loss": 0.264, "step": 22875 }, { "epoch": 2.72, "learning_rate": 3.5107246376811598e-06, "loss": 0.2404, "step": 22900 }, { "epoch": 2.72, "learning_rate": 3.5034782608695656e-06, "loss": 0.3211, "step": 22925 }, { "epoch": 2.72, "learning_rate": 3.496231884057971e-06, "loss": 0.2726, "step": 22950 }, { "epoch": 2.73, "learning_rate": 3.488985507246377e-06, "loss": 0.399, "step": 22975 }, { "epoch": 2.73, "learning_rate": 3.481739130434783e-06, "loss": 0.2297, "step": 23000 }, { "epoch": 2.73, "eval_cer": 6.938363913620936, "eval_loss": 0.3916235566139221, "eval_runtime": 3180.568, "eval_samples_per_second": 0.78, "eval_steps_per_second": 0.39, "eval_wer": 18.73299028016009, "step": 23000 }, { "epoch": 2.73, "learning_rate": 3.4744927536231886e-06, "loss": 0.3484, "step": 23025 }, { "epoch": 2.74, "learning_rate": 3.4672463768115945e-06, "loss": 0.2585, "step": 23050 }, { "epoch": 2.74, "learning_rate": 3.46e-06, "loss": 0.2843, "step": 23075 }, { "epoch": 2.74, "learning_rate": 3.452753623188406e-06, "loss": 0.3526, "step": 23100 }, { "epoch": 2.74, "learning_rate": 3.445507246376812e-06, "loss": 0.3063, "step": 23125 }, { "epoch": 2.75, "learning_rate": 3.4382608695652175e-06, "loss": 0.3701, "step": 23150 }, { "epoch": 2.75, "learning_rate": 3.4310144927536233e-06, "loss": 0.2438, "step": 23175 }, { "epoch": 2.75, "learning_rate": 3.4237681159420296e-06, "loss": 0.3001, "step": 23200 }, { "epoch": 2.76, "learning_rate": 3.416521739130435e-06, "loss": 0.3103, "step": 23225 }, { "epoch": 2.76, "learning_rate": 3.409275362318841e-06, "loss": 0.2769, "step": 23250 }, { "epoch": 2.76, "learning_rate": 3.4020289855072467e-06, "loss": 0.4483, "step": 23275 }, { "epoch": 2.76, "learning_rate": 3.3947826086956526e-06, "loss": 0.2777, "step": 23300 }, { "epoch": 2.77, "learning_rate": 3.387536231884058e-06, "loss": 0.2413, "step": 23325 }, { "epoch": 2.77, "learning_rate": 3.380289855072464e-06, "loss": 0.2911, "step": 23350 }, { "epoch": 2.77, "learning_rate": 3.37304347826087e-06, "loss": 0.3544, "step": 23375 }, { "epoch": 2.78, "learning_rate": 3.3657971014492756e-06, "loss": 0.349, "step": 23400 }, { "epoch": 2.78, "learning_rate": 3.3585507246376814e-06, "loss": 0.3243, "step": 23425 }, { "epoch": 2.78, "learning_rate": 3.351304347826087e-06, "loss": 0.2601, "step": 23450 }, { "epoch": 2.79, "learning_rate": 3.344057971014493e-06, "loss": 0.268, "step": 23475 }, { "epoch": 2.79, "learning_rate": 3.336811594202899e-06, "loss": 0.294, "step": 23500 }, { "epoch": 2.79, "learning_rate": 3.3295652173913044e-06, "loss": 0.3095, "step": 23525 }, { "epoch": 2.79, "learning_rate": 3.3223188405797103e-06, "loss": 0.2588, "step": 23550 }, { "epoch": 2.8, "learning_rate": 3.3150724637681166e-06, "loss": 0.4027, "step": 23575 }, { "epoch": 2.8, "learning_rate": 3.307826086956522e-06, "loss": 0.2887, "step": 23600 }, { "epoch": 2.8, "learning_rate": 3.300579710144928e-06, "loss": 0.2459, "step": 23625 }, { "epoch": 2.81, "learning_rate": 3.2933333333333333e-06, "loss": 0.2288, "step": 23650 }, { "epoch": 2.81, "learning_rate": 3.2860869565217396e-06, "loss": 0.2998, "step": 23675 }, { "epoch": 2.81, "learning_rate": 3.2788405797101454e-06, "loss": 0.3197, "step": 23700 }, { "epoch": 2.82, "learning_rate": 3.271594202898551e-06, "loss": 0.2931, "step": 23725 }, { "epoch": 2.82, "learning_rate": 3.2643478260869567e-06, "loss": 0.2451, "step": 23750 }, { "epoch": 2.82, "learning_rate": 3.2571014492753626e-06, "loss": 0.251, "step": 23775 }, { "epoch": 2.82, "learning_rate": 3.2498550724637684e-06, "loss": 0.291, "step": 23800 }, { "epoch": 2.83, "learning_rate": 3.2426086956521743e-06, "loss": 0.2916, "step": 23825 }, { "epoch": 2.83, "learning_rate": 3.2353623188405797e-06, "loss": 0.3365, "step": 23850 }, { "epoch": 2.83, "learning_rate": 3.228115942028986e-06, "loss": 0.2967, "step": 23875 }, { "epoch": 2.84, "learning_rate": 3.2208695652173914e-06, "loss": 0.2435, "step": 23900 }, { "epoch": 2.84, "learning_rate": 3.2136231884057973e-06, "loss": 0.3885, "step": 23925 }, { "epoch": 2.84, "learning_rate": 3.2063768115942027e-06, "loss": 0.2373, "step": 23950 }, { "epoch": 2.85, "learning_rate": 3.199130434782609e-06, "loss": 0.3457, "step": 23975 }, { "epoch": 2.85, "learning_rate": 3.191884057971015e-06, "loss": 0.2313, "step": 24000 }, { "epoch": 2.85, "eval_cer": 6.778493777362389, "eval_loss": 0.3930225968360901, "eval_runtime": 3191.3103, "eval_samples_per_second": 0.778, "eval_steps_per_second": 0.389, "eval_wer": 18.60339241471317, "step": 24000 }, { "epoch": 2.85, "learning_rate": 3.1846376811594202e-06, "loss": 0.2984, "step": 24025 }, { "epoch": 2.85, "learning_rate": 3.1773913043478265e-06, "loss": 0.2425, "step": 24050 }, { "epoch": 2.86, "learning_rate": 3.1701449275362324e-06, "loss": 0.3009, "step": 24075 }, { "epoch": 2.86, "learning_rate": 3.162898550724638e-06, "loss": 0.251, "step": 24100 }, { "epoch": 2.86, "learning_rate": 3.1556521739130437e-06, "loss": 0.2794, "step": 24125 }, { "epoch": 2.87, "learning_rate": 3.14840579710145e-06, "loss": 0.326, "step": 24150 }, { "epoch": 2.87, "learning_rate": 3.1414492753623194e-06, "loss": 0.2487, "step": 24175 }, { "epoch": 2.87, "learning_rate": 3.134202898550725e-06, "loss": 0.2793, "step": 24200 }, { "epoch": 2.87, "learning_rate": 3.1269565217391307e-06, "loss": 0.3093, "step": 24225 }, { "epoch": 2.88, "learning_rate": 3.119710144927536e-06, "loss": 0.2536, "step": 24250 }, { "epoch": 2.88, "learning_rate": 3.1124637681159424e-06, "loss": 0.3143, "step": 24275 }, { "epoch": 2.88, "learning_rate": 3.1052173913043483e-06, "loss": 0.2409, "step": 24300 }, { "epoch": 2.89, "learning_rate": 3.0979710144927537e-06, "loss": 0.3879, "step": 24325 }, { "epoch": 2.89, "learning_rate": 3.0907246376811596e-06, "loss": 0.3521, "step": 24350 }, { "epoch": 2.89, "learning_rate": 3.083478260869566e-06, "loss": 0.2628, "step": 24375 }, { "epoch": 2.9, "learning_rate": 3.0762318840579713e-06, "loss": 0.2127, "step": 24400 }, { "epoch": 2.9, "learning_rate": 3.068985507246377e-06, "loss": 0.3071, "step": 24425 }, { "epoch": 2.9, "learning_rate": 3.0617391304347826e-06, "loss": 0.2488, "step": 24450 }, { "epoch": 2.9, "learning_rate": 3.054492753623189e-06, "loss": 0.2462, "step": 24475 }, { "epoch": 2.91, "learning_rate": 3.0472463768115947e-06, "loss": 0.2651, "step": 24500 }, { "epoch": 2.91, "learning_rate": 3.04e-06, "loss": 0.2555, "step": 24525 }, { "epoch": 2.91, "learning_rate": 3.032753623188406e-06, "loss": 0.2511, "step": 24550 }, { "epoch": 2.92, "learning_rate": 3.025507246376812e-06, "loss": 0.2761, "step": 24575 }, { "epoch": 2.92, "learning_rate": 3.0182608695652177e-06, "loss": 0.3315, "step": 24600 }, { "epoch": 2.92, "learning_rate": 3.0110144927536235e-06, "loss": 0.4222, "step": 24625 }, { "epoch": 2.93, "learning_rate": 3.003768115942029e-06, "loss": 0.252, "step": 24650 }, { "epoch": 2.93, "learning_rate": 2.9965217391304352e-06, "loss": 0.3424, "step": 24675 }, { "epoch": 2.93, "learning_rate": 2.9892753623188407e-06, "loss": 0.3086, "step": 24700 }, { "epoch": 2.93, "learning_rate": 2.9820289855072465e-06, "loss": 0.3246, "step": 24725 }, { "epoch": 2.94, "learning_rate": 2.974782608695652e-06, "loss": 0.4331, "step": 24750 }, { "epoch": 2.94, "learning_rate": 2.9675362318840582e-06, "loss": 0.2933, "step": 24775 }, { "epoch": 2.94, "learning_rate": 2.960289855072464e-06, "loss": 0.3234, "step": 24800 }, { "epoch": 2.95, "learning_rate": 2.9530434782608695e-06, "loss": 0.2495, "step": 24825 }, { "epoch": 2.95, "learning_rate": 2.9457971014492754e-06, "loss": 0.2506, "step": 24850 }, { "epoch": 2.95, "learning_rate": 2.9385507246376817e-06, "loss": 0.2862, "step": 24875 }, { "epoch": 2.95, "learning_rate": 2.931304347826087e-06, "loss": 0.2804, "step": 24900 }, { "epoch": 2.96, "learning_rate": 2.924057971014493e-06, "loss": 0.2659, "step": 24925 }, { "epoch": 2.96, "learning_rate": 2.9168115942028992e-06, "loss": 0.2801, "step": 24950 }, { "epoch": 2.96, "learning_rate": 2.9095652173913046e-06, "loss": 0.3455, "step": 24975 }, { "epoch": 2.97, "learning_rate": 2.902608695652174e-06, "loss": 0.2833, "step": 25000 }, { "epoch": 2.97, "eval_cer": 6.855231442766491, "eval_loss": 0.39096301794052124, "eval_runtime": 3187.6224, "eval_samples_per_second": 0.779, "eval_steps_per_second": 0.389, "eval_wer": 18.598056032018295, "step": 25000 }, { "epoch": 2.97, "learning_rate": 2.89536231884058e-06, "loss": 0.2299, "step": 25025 }, { "epoch": 2.97, "learning_rate": 2.8881159420289854e-06, "loss": 0.2482, "step": 25050 }, { "epoch": 2.98, "learning_rate": 2.8808695652173917e-06, "loss": 0.3388, "step": 25075 }, { "epoch": 2.98, "learning_rate": 2.8736231884057975e-06, "loss": 0.4429, "step": 25100 }, { "epoch": 2.98, "learning_rate": 2.866376811594203e-06, "loss": 0.2245, "step": 25125 }, { "epoch": 2.98, "learning_rate": 2.859130434782609e-06, "loss": 0.2648, "step": 25150 }, { "epoch": 2.99, "learning_rate": 2.851884057971015e-06, "loss": 0.1995, "step": 25175 }, { "epoch": 2.99, "learning_rate": 2.8446376811594205e-06, "loss": 0.2652, "step": 25200 }, { "epoch": 2.99, "learning_rate": 2.8373913043478264e-06, "loss": 0.2587, "step": 25225 }, { "epoch": 3.0, "learning_rate": 2.830144927536232e-06, "loss": 0.2889, "step": 25250 }, { "epoch": 3.0, "learning_rate": 2.822898550724638e-06, "loss": 0.2257, "step": 25275 }, { "epoch": 3.0, "learning_rate": 2.815652173913044e-06, "loss": 0.1742, "step": 25300 }, { "epoch": 3.01, "learning_rate": 2.8084057971014494e-06, "loss": 0.1856, "step": 25325 }, { "epoch": 3.01, "learning_rate": 2.8011594202898552e-06, "loss": 0.1801, "step": 25350 }, { "epoch": 3.01, "learning_rate": 2.7939130434782615e-06, "loss": 0.2185, "step": 25375 }, { "epoch": 3.01, "learning_rate": 2.786666666666667e-06, "loss": 0.2565, "step": 25400 }, { "epoch": 3.02, "learning_rate": 2.779420289855073e-06, "loss": 0.2026, "step": 25425 }, { "epoch": 3.02, "learning_rate": 2.7721739130434782e-06, "loss": 0.2373, "step": 25450 }, { "epoch": 3.02, "learning_rate": 2.7649275362318845e-06, "loss": 0.2406, "step": 25475 }, { "epoch": 3.03, "learning_rate": 2.75768115942029e-06, "loss": 0.4514, "step": 25500 }, { "epoch": 3.03, "learning_rate": 2.750434782608696e-06, "loss": 0.1876, "step": 25525 }, { "epoch": 3.03, "learning_rate": 2.7431884057971012e-06, "loss": 0.2703, "step": 25550 }, { "epoch": 3.03, "learning_rate": 2.7359420289855075e-06, "loss": 0.1749, "step": 25575 }, { "epoch": 3.04, "learning_rate": 2.7286956521739134e-06, "loss": 0.2088, "step": 25600 }, { "epoch": 3.04, "learning_rate": 2.721449275362319e-06, "loss": 0.2087, "step": 25625 }, { "epoch": 3.04, "learning_rate": 2.7142028985507246e-06, "loss": 0.3172, "step": 25650 }, { "epoch": 3.05, "learning_rate": 2.706956521739131e-06, "loss": 0.1898, "step": 25675 }, { "epoch": 3.05, "learning_rate": 2.6997101449275364e-06, "loss": 0.1685, "step": 25700 }, { "epoch": 3.05, "learning_rate": 2.692463768115942e-06, "loss": 0.1918, "step": 25725 }, { "epoch": 3.06, "learning_rate": 2.6852173913043476e-06, "loss": 0.2734, "step": 25750 }, { "epoch": 3.06, "learning_rate": 2.677971014492754e-06, "loss": 0.1485, "step": 25775 }, { "epoch": 3.06, "learning_rate": 2.6707246376811598e-06, "loss": 0.1542, "step": 25800 }, { "epoch": 3.06, "learning_rate": 2.663478260869565e-06, "loss": 0.1694, "step": 25825 }, { "epoch": 3.07, "learning_rate": 2.6562318840579715e-06, "loss": 0.1685, "step": 25850 }, { "epoch": 3.07, "learning_rate": 2.6489855072463773e-06, "loss": 0.1719, "step": 25875 }, { "epoch": 3.07, "learning_rate": 2.6417391304347828e-06, "loss": 0.1573, "step": 25900 }, { "epoch": 3.08, "learning_rate": 2.6344927536231886e-06, "loss": 0.2429, "step": 25925 }, { "epoch": 3.08, "learning_rate": 2.6272463768115945e-06, "loss": 0.1751, "step": 25950 }, { "epoch": 3.08, "learning_rate": 2.6202898550724644e-06, "loss": 0.2976, "step": 25975 }, { "epoch": 3.09, "learning_rate": 2.61304347826087e-06, "loss": 0.2509, "step": 26000 }, { "epoch": 3.09, "eval_cer": 6.816493678980766, "eval_loss": 0.3948805630207062, "eval_runtime": 3174.2689, "eval_samples_per_second": 0.782, "eval_steps_per_second": 0.391, "eval_wer": 18.518010291595196, "step": 26000 }, { "epoch": 3.09, "learning_rate": 2.6057971014492757e-06, "loss": 0.377, "step": 26025 }, { "epoch": 3.09, "learning_rate": 2.598550724637681e-06, "loss": 0.1902, "step": 26050 }, { "epoch": 3.09, "learning_rate": 2.5913043478260874e-06, "loss": 0.2086, "step": 26075 }, { "epoch": 3.1, "learning_rate": 2.5840579710144932e-06, "loss": 0.269, "step": 26100 }, { "epoch": 3.1, "learning_rate": 2.5768115942028987e-06, "loss": 0.2287, "step": 26125 }, { "epoch": 3.1, "learning_rate": 2.5695652173913045e-06, "loss": 0.2673, "step": 26150 }, { "epoch": 3.11, "learning_rate": 2.562318840579711e-06, "loss": 0.1238, "step": 26175 }, { "epoch": 3.11, "learning_rate": 2.5550724637681162e-06, "loss": 0.2047, "step": 26200 }, { "epoch": 3.11, "learning_rate": 2.547826086956522e-06, "loss": 0.3, "step": 26225 }, { "epoch": 3.11, "learning_rate": 2.5405797101449275e-06, "loss": 0.201, "step": 26250 }, { "epoch": 3.12, "learning_rate": 2.5333333333333338e-06, "loss": 0.1864, "step": 26275 }, { "epoch": 3.12, "learning_rate": 2.5260869565217392e-06, "loss": 0.2565, "step": 26300 }, { "epoch": 3.12, "learning_rate": 2.518840579710145e-06, "loss": 0.189, "step": 26325 }, { "epoch": 3.13, "learning_rate": 2.511594202898551e-06, "loss": 0.2006, "step": 26350 }, { "epoch": 3.13, "learning_rate": 2.5043478260869568e-06, "loss": 0.1992, "step": 26375 }, { "epoch": 3.13, "learning_rate": 2.4971014492753626e-06, "loss": 0.1742, "step": 26400 }, { "epoch": 3.14, "learning_rate": 2.489855072463768e-06, "loss": 0.1909, "step": 26425 }, { "epoch": 3.14, "learning_rate": 2.4826086956521743e-06, "loss": 0.1935, "step": 26450 }, { "epoch": 3.14, "learning_rate": 2.4753623188405798e-06, "loss": 0.2335, "step": 26475 }, { "epoch": 3.14, "learning_rate": 2.4681159420289856e-06, "loss": 0.2635, "step": 26500 }, { "epoch": 3.15, "learning_rate": 2.4608695652173915e-06, "loss": 0.2079, "step": 26525 }, { "epoch": 3.15, "learning_rate": 2.4536231884057973e-06, "loss": 0.2006, "step": 26550 }, { "epoch": 3.15, "learning_rate": 2.446376811594203e-06, "loss": 0.244, "step": 26575 }, { "epoch": 3.16, "learning_rate": 2.439130434782609e-06, "loss": 0.32, "step": 26600 }, { "epoch": 3.16, "learning_rate": 2.4318840579710145e-06, "loss": 0.1757, "step": 26625 }, { "epoch": 3.16, "learning_rate": 2.4246376811594203e-06, "loss": 0.151, "step": 26650 }, { "epoch": 3.17, "learning_rate": 2.417391304347826e-06, "loss": 0.1985, "step": 26675 }, { "epoch": 3.17, "learning_rate": 2.410144927536232e-06, "loss": 0.2241, "step": 26700 }, { "epoch": 3.17, "learning_rate": 2.402898550724638e-06, "loss": 0.1411, "step": 26725 }, { "epoch": 3.17, "learning_rate": 2.3956521739130437e-06, "loss": 0.2348, "step": 26750 }, { "epoch": 3.18, "learning_rate": 2.3884057971014496e-06, "loss": 0.2529, "step": 26775 }, { "epoch": 3.18, "learning_rate": 2.3811594202898555e-06, "loss": 0.1819, "step": 26800 }, { "epoch": 3.18, "learning_rate": 2.3739130434782613e-06, "loss": 0.2473, "step": 26825 }, { "epoch": 3.19, "learning_rate": 2.3666666666666667e-06, "loss": 0.2902, "step": 26850 }, { "epoch": 3.19, "learning_rate": 2.3594202898550726e-06, "loss": 0.1368, "step": 26875 }, { "epoch": 3.19, "learning_rate": 2.3521739130434784e-06, "loss": 0.2857, "step": 26900 }, { "epoch": 3.2, "learning_rate": 2.3449275362318843e-06, "loss": 0.1613, "step": 26925 }, { "epoch": 3.2, "learning_rate": 2.33768115942029e-06, "loss": 0.2573, "step": 26950 }, { "epoch": 3.2, "learning_rate": 2.330434782608696e-06, "loss": 0.2029, "step": 26975 }, { "epoch": 3.2, "learning_rate": 2.3231884057971014e-06, "loss": 0.2085, "step": 27000 }, { "epoch": 3.2, "eval_cer": 6.811328643809336, "eval_loss": 0.3984606862068176, "eval_runtime": 3176.0872, "eval_samples_per_second": 0.781, "eval_steps_per_second": 0.391, "eval_wer": 18.613302839717935, "step": 27000 }, { "epoch": 3.21, "learning_rate": 2.3159420289855077e-06, "loss": 0.235, "step": 27025 }, { "epoch": 3.21, "learning_rate": 2.308695652173913e-06, "loss": 0.1992, "step": 27050 }, { "epoch": 3.21, "learning_rate": 2.301449275362319e-06, "loss": 0.2457, "step": 27075 }, { "epoch": 3.22, "learning_rate": 2.294202898550725e-06, "loss": 0.1871, "step": 27100 }, { "epoch": 3.22, "learning_rate": 2.2869565217391307e-06, "loss": 0.1464, "step": 27125 }, { "epoch": 3.22, "learning_rate": 2.279710144927536e-06, "loss": 0.2012, "step": 27150 }, { "epoch": 3.22, "learning_rate": 2.2724637681159424e-06, "loss": 0.1757, "step": 27175 }, { "epoch": 3.23, "learning_rate": 2.265217391304348e-06, "loss": 0.1795, "step": 27200 }, { "epoch": 3.23, "learning_rate": 2.2579710144927537e-06, "loss": 0.1706, "step": 27225 }, { "epoch": 3.23, "learning_rate": 2.2507246376811596e-06, "loss": 0.2044, "step": 27250 }, { "epoch": 3.24, "learning_rate": 2.2434782608695654e-06, "loss": 0.2155, "step": 27275 }, { "epoch": 3.24, "learning_rate": 2.2362318840579713e-06, "loss": 0.1811, "step": 27300 }, { "epoch": 3.24, "learning_rate": 2.228985507246377e-06, "loss": 0.2311, "step": 27325 }, { "epoch": 3.25, "learning_rate": 2.2217391304347825e-06, "loss": 0.3311, "step": 27350 }, { "epoch": 3.25, "learning_rate": 2.2144927536231884e-06, "loss": 0.1692, "step": 27375 }, { "epoch": 3.25, "learning_rate": 2.2072463768115943e-06, "loss": 0.2069, "step": 27400 }, { "epoch": 3.25, "learning_rate": 2.2e-06, "loss": 0.1755, "step": 27425 }, { "epoch": 3.26, "learning_rate": 2.192753623188406e-06, "loss": 0.2029, "step": 27450 }, { "epoch": 3.26, "learning_rate": 2.185507246376812e-06, "loss": 0.2542, "step": 27475 }, { "epoch": 3.26, "learning_rate": 2.1782608695652177e-06, "loss": 0.1882, "step": 27500 }, { "epoch": 3.27, "learning_rate": 2.1710144927536235e-06, "loss": 0.2374, "step": 27525 }, { "epoch": 3.27, "learning_rate": 2.1637681159420294e-06, "loss": 0.1967, "step": 27550 }, { "epoch": 3.27, "learning_rate": 2.156521739130435e-06, "loss": 0.1869, "step": 27575 }, { "epoch": 3.28, "learning_rate": 2.1492753623188407e-06, "loss": 0.2861, "step": 27600 }, { "epoch": 3.28, "learning_rate": 2.1420289855072465e-06, "loss": 0.2392, "step": 27625 }, { "epoch": 3.28, "learning_rate": 2.1347826086956524e-06, "loss": 0.18, "step": 27650 }, { "epoch": 3.28, "learning_rate": 2.1275362318840582e-06, "loss": 0.2496, "step": 27675 }, { "epoch": 3.29, "learning_rate": 2.120289855072464e-06, "loss": 0.1998, "step": 27700 }, { "epoch": 3.29, "learning_rate": 2.1130434782608695e-06, "loss": 0.259, "step": 27725 }, { "epoch": 3.29, "learning_rate": 2.105797101449276e-06, "loss": 0.3129, "step": 27750 }, { "epoch": 3.3, "learning_rate": 2.0985507246376812e-06, "loss": 0.1907, "step": 27775 }, { "epoch": 3.3, "learning_rate": 2.091304347826087e-06, "loss": 0.1343, "step": 27800 }, { "epoch": 3.3, "learning_rate": 2.084057971014493e-06, "loss": 0.1973, "step": 27825 }, { "epoch": 3.3, "learning_rate": 2.0768115942028988e-06, "loss": 0.1658, "step": 27850 }, { "epoch": 3.31, "learning_rate": 2.0695652173913046e-06, "loss": 0.1508, "step": 27875 }, { "epoch": 3.31, "learning_rate": 2.0623188405797105e-06, "loss": 0.1947, "step": 27900 }, { "epoch": 3.31, "learning_rate": 2.055072463768116e-06, "loss": 0.1812, "step": 27925 }, { "epoch": 3.32, "learning_rate": 2.0478260869565218e-06, "loss": 0.2154, "step": 27950 }, { "epoch": 3.32, "learning_rate": 2.0405797101449276e-06, "loss": 0.1456, "step": 27975 }, { "epoch": 3.32, "learning_rate": 2.0333333333333335e-06, "loss": 0.2055, "step": 28000 }, { "epoch": 3.32, "eval_cer": 6.862364110384181, "eval_loss": 0.39950060844421387, "eval_runtime": 3191.9428, "eval_samples_per_second": 0.778, "eval_steps_per_second": 0.389, "eval_wer": 18.76119687440442, "step": 28000 }, { "epoch": 3.33, "learning_rate": 2.0260869565217393e-06, "loss": 0.1855, "step": 28025 }, { "epoch": 3.33, "learning_rate": 2.018840579710145e-06, "loss": 0.2535, "step": 28050 }, { "epoch": 3.33, "learning_rate": 2.0115942028985506e-06, "loss": 0.2101, "step": 28075 }, { "epoch": 3.33, "learning_rate": 2.004347826086957e-06, "loss": 0.2977, "step": 28100 }, { "epoch": 3.34, "learning_rate": 1.9971014492753623e-06, "loss": 0.1915, "step": 28125 }, { "epoch": 3.34, "learning_rate": 1.989855072463768e-06, "loss": 0.1589, "step": 28150 }, { "epoch": 3.34, "learning_rate": 1.982608695652174e-06, "loss": 0.175, "step": 28175 }, { "epoch": 3.35, "learning_rate": 1.97536231884058e-06, "loss": 0.2892, "step": 28200 }, { "epoch": 3.35, "learning_rate": 1.9681159420289853e-06, "loss": 0.223, "step": 28225 }, { "epoch": 3.35, "learning_rate": 1.9608695652173916e-06, "loss": 0.1731, "step": 28250 }, { "epoch": 3.36, "learning_rate": 1.9536231884057975e-06, "loss": 0.2097, "step": 28275 }, { "epoch": 3.36, "learning_rate": 1.946376811594203e-06, "loss": 0.1909, "step": 28300 }, { "epoch": 3.36, "learning_rate": 1.939130434782609e-06, "loss": 0.2079, "step": 28325 }, { "epoch": 3.36, "learning_rate": 1.9318840579710146e-06, "loss": 0.1848, "step": 28350 }, { "epoch": 3.37, "learning_rate": 1.9246376811594205e-06, "loss": 0.1813, "step": 28375 }, { "epoch": 3.37, "learning_rate": 1.9173913043478263e-06, "loss": 0.1679, "step": 28400 }, { "epoch": 3.37, "learning_rate": 1.910144927536232e-06, "loss": 0.1787, "step": 28425 }, { "epoch": 3.38, "learning_rate": 1.9028985507246378e-06, "loss": 0.1718, "step": 28450 }, { "epoch": 3.38, "learning_rate": 1.8956521739130437e-06, "loss": 0.2553, "step": 28475 }, { "epoch": 3.38, "learning_rate": 1.8884057971014493e-06, "loss": 0.2249, "step": 28500 }, { "epoch": 3.38, "learning_rate": 1.8811594202898554e-06, "loss": 0.1657, "step": 28525 }, { "epoch": 3.39, "learning_rate": 1.873913043478261e-06, "loss": 0.1738, "step": 28550 }, { "epoch": 3.39, "learning_rate": 1.8666666666666669e-06, "loss": 0.1935, "step": 28575 }, { "epoch": 3.39, "learning_rate": 1.8594202898550725e-06, "loss": 0.2179, "step": 28600 }, { "epoch": 3.4, "learning_rate": 1.8521739130434786e-06, "loss": 0.2696, "step": 28625 }, { "epoch": 3.4, "learning_rate": 1.8449275362318842e-06, "loss": 0.1657, "step": 28650 }, { "epoch": 3.4, "learning_rate": 1.83768115942029e-06, "loss": 0.2302, "step": 28675 }, { "epoch": 3.41, "learning_rate": 1.8304347826086957e-06, "loss": 0.2888, "step": 28700 }, { "epoch": 3.41, "learning_rate": 1.8231884057971016e-06, "loss": 0.193, "step": 28725 }, { "epoch": 3.41, "learning_rate": 1.8159420289855072e-06, "loss": 0.2122, "step": 28750 }, { "epoch": 3.41, "learning_rate": 1.8086956521739133e-06, "loss": 0.1602, "step": 28775 }, { "epoch": 3.42, "learning_rate": 1.801449275362319e-06, "loss": 0.2419, "step": 28800 }, { "epoch": 3.42, "learning_rate": 1.7942028985507248e-06, "loss": 0.4138, "step": 28825 }, { "epoch": 3.42, "learning_rate": 1.7869565217391304e-06, "loss": 0.2473, "step": 28850 }, { "epoch": 3.43, "learning_rate": 1.7797101449275365e-06, "loss": 0.1792, "step": 28875 }, { "epoch": 3.43, "learning_rate": 1.7724637681159421e-06, "loss": 0.1822, "step": 28900 }, { "epoch": 3.43, "learning_rate": 1.765217391304348e-06, "loss": 0.1505, "step": 28925 }, { "epoch": 3.44, "learning_rate": 1.7579710144927536e-06, "loss": 0.1418, "step": 28950 }, { "epoch": 3.44, "learning_rate": 1.7507246376811595e-06, "loss": 0.1262, "step": 28975 }, { "epoch": 3.44, "learning_rate": 1.7434782608695653e-06, "loss": 0.175, "step": 29000 }, { "epoch": 3.44, "eval_cer": 6.772713857051503, "eval_loss": 0.40093937516212463, "eval_runtime": 3157.1944, "eval_samples_per_second": 0.786, "eval_steps_per_second": 0.393, "eval_wer": 18.48141795311607, "step": 29000 }, { "epoch": 3.44, "learning_rate": 1.7362318840579712e-06, "loss": 0.2065, "step": 29025 }, { "epoch": 3.45, "learning_rate": 1.7289855072463768e-06, "loss": 0.1723, "step": 29050 }, { "epoch": 3.45, "learning_rate": 1.7217391304347827e-06, "loss": 0.1419, "step": 29075 }, { "epoch": 3.45, "learning_rate": 1.7144927536231887e-06, "loss": 0.2607, "step": 29100 }, { "epoch": 3.46, "learning_rate": 1.7072463768115944e-06, "loss": 0.1884, "step": 29125 }, { "epoch": 3.46, "learning_rate": 1.7000000000000002e-06, "loss": 0.1824, "step": 29150 }, { "epoch": 3.46, "learning_rate": 1.6927536231884059e-06, "loss": 0.1657, "step": 29175 }, { "epoch": 3.47, "learning_rate": 1.685507246376812e-06, "loss": 0.248, "step": 29200 }, { "epoch": 3.47, "learning_rate": 1.6782608695652176e-06, "loss": 0.2124, "step": 29225 }, { "epoch": 3.47, "learning_rate": 1.6710144927536234e-06, "loss": 0.1964, "step": 29250 }, { "epoch": 3.47, "learning_rate": 1.663768115942029e-06, "loss": 0.3202, "step": 29275 }, { "epoch": 3.48, "learning_rate": 1.656521739130435e-06, "loss": 0.194, "step": 29300 }, { "epoch": 3.48, "learning_rate": 1.6492753623188406e-06, "loss": 0.2738, "step": 29325 }, { "epoch": 3.48, "learning_rate": 1.6420289855072467e-06, "loss": 0.1667, "step": 29350 }, { "epoch": 3.49, "learning_rate": 1.6347826086956523e-06, "loss": 0.2819, "step": 29375 }, { "epoch": 3.49, "learning_rate": 1.6275362318840581e-06, "loss": 0.1894, "step": 29400 }, { "epoch": 3.49, "learning_rate": 1.6202898550724638e-06, "loss": 0.1791, "step": 29425 }, { "epoch": 3.49, "learning_rate": 1.6130434782608699e-06, "loss": 0.1853, "step": 29450 }, { "epoch": 3.5, "learning_rate": 1.6057971014492755e-06, "loss": 0.2618, "step": 29475 }, { "epoch": 3.5, "learning_rate": 1.5985507246376814e-06, "loss": 0.2052, "step": 29500 }, { "epoch": 3.5, "learning_rate": 1.591304347826087e-06, "loss": 0.2185, "step": 29525 }, { "epoch": 3.51, "learning_rate": 1.5840579710144928e-06, "loss": 0.1305, "step": 29550 }, { "epoch": 3.51, "learning_rate": 1.5768115942028985e-06, "loss": 0.233, "step": 29575 }, { "epoch": 3.51, "learning_rate": 1.5695652173913046e-06, "loss": 0.2164, "step": 29600 }, { "epoch": 3.52, "learning_rate": 1.5623188405797102e-06, "loss": 0.1524, "step": 29625 }, { "epoch": 3.52, "learning_rate": 1.555072463768116e-06, "loss": 0.1961, "step": 29650 }, { "epoch": 3.52, "learning_rate": 1.5478260869565217e-06, "loss": 0.2242, "step": 29675 }, { "epoch": 3.52, "learning_rate": 1.5405797101449278e-06, "loss": 0.1997, "step": 29700 }, { "epoch": 3.53, "learning_rate": 1.5333333333333334e-06, "loss": 0.2001, "step": 29725 }, { "epoch": 3.53, "learning_rate": 1.5260869565217393e-06, "loss": 0.1888, "step": 29750 }, { "epoch": 3.53, "learning_rate": 1.518840579710145e-06, "loss": 0.2124, "step": 29775 }, { "epoch": 3.54, "learning_rate": 1.5115942028985508e-06, "loss": 0.2145, "step": 29800 }, { "epoch": 3.54, "learning_rate": 1.5043478260869566e-06, "loss": 0.2512, "step": 29825 }, { "epoch": 3.54, "learning_rate": 1.4971014492753625e-06, "loss": 0.1625, "step": 29850 }, { "epoch": 3.55, "learning_rate": 1.4898550724637683e-06, "loss": 0.1556, "step": 29875 }, { "epoch": 3.55, "learning_rate": 1.482608695652174e-06, "loss": 0.2134, "step": 29900 }, { "epoch": 3.55, "learning_rate": 1.47536231884058e-06, "loss": 0.1959, "step": 29925 }, { "epoch": 3.55, "learning_rate": 1.4681159420289857e-06, "loss": 0.197, "step": 29950 }, { "epoch": 3.56, "learning_rate": 1.4608695652173915e-06, "loss": 0.1825, "step": 29975 }, { "epoch": 3.56, "learning_rate": 1.4536231884057972e-06, "loss": 0.1701, "step": 30000 }, { "epoch": 3.56, "eval_cer": 7.013625854690344, "eval_loss": 0.3998452425003052, "eval_runtime": 3192.2868, "eval_samples_per_second": 0.777, "eval_steps_per_second": 0.389, "eval_wer": 18.834381551362682, "step": 30000 }, { "epoch": 3.56, "step": 30000, "total_flos": 1.9457998848e+18, "train_loss": 0.0, "train_runtime": 0.3469, "train_samples_per_second": 14412.297, "train_steps_per_second": 14412.297 }, { "epoch": 3.56, "eval_cer": 9.956974355224656, "eval_loss": 0.7926790118217468, "eval_runtime": 3112.2219, "eval_samples_per_second": 0.696, "eval_steps_per_second": 0.348, "eval_wer": 31.400474471700036, "step": 30000 } ], "max_steps": 5000, "num_train_epochs": 2, "total_flos": 1.9457998848e+18, "trial_name": null, "trial_params": null }