{ "best_metric": null, "best_model_checkpoint": null, "epoch": 7.041757622702627, "eval_steps": 2500, "global_step": 200000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 4.7000000000000004e-08, "loss": 13.3462, "step": 50 }, { "epoch": 0.0, "learning_rate": 9.700000000000001e-08, "loss": 13.4325, "step": 100 }, { "epoch": 0.01, "learning_rate": 1.4500000000000001e-07, "loss": 15.1202, "step": 150 }, { "epoch": 0.01, "learning_rate": 1.95e-07, "loss": 13.265, "step": 200 }, { "epoch": 0.01, "learning_rate": 2.44e-07, "loss": 14.4751, "step": 250 }, { "epoch": 0.01, "learning_rate": 2.94e-07, "loss": 13.4503, "step": 300 }, { "epoch": 0.01, "learning_rate": 3.44e-07, "loss": 13.8313, "step": 350 }, { "epoch": 0.01, "learning_rate": 3.94e-07, "loss": 13.4356, "step": 400 }, { "epoch": 0.02, "learning_rate": 4.4400000000000006e-07, "loss": 13.9124, "step": 450 }, { "epoch": 0.02, "learning_rate": 4.940000000000001e-07, "loss": 14.6006, "step": 500 }, { "epoch": 0.02, "learning_rate": 5.44e-07, "loss": 13.4093, "step": 550 }, { "epoch": 0.02, "learning_rate": 5.94e-07, "loss": 13.4746, "step": 600 }, { "epoch": 0.02, "learning_rate": 6.44e-07, "loss": 14.4774, "step": 650 }, { "epoch": 0.02, "learning_rate": 6.94e-07, "loss": 13.2629, "step": 700 }, { "epoch": 0.03, "learning_rate": 7.44e-07, "loss": 13.0762, "step": 750 }, { "epoch": 0.03, "learning_rate": 7.94e-07, "loss": 12.8286, "step": 800 }, { "epoch": 0.03, "learning_rate": 8.440000000000001e-07, "loss": 12.6316, "step": 850 }, { "epoch": 0.03, "learning_rate": 8.94e-07, "loss": 12.3767, "step": 900 }, { "epoch": 0.03, "learning_rate": 9.440000000000001e-07, "loss": 12.0782, "step": 950 }, { "epoch": 0.04, "learning_rate": 9.940000000000001e-07, "loss": 11.7918, "step": 1000 }, { "epoch": 0.04, "learning_rate": 1.044e-06, "loss": 11.2528, "step": 1050 }, { "epoch": 0.04, "learning_rate": 1.094e-06, "loss": 10.7915, "step": 1100 }, { "epoch": 0.04, "learning_rate": 1.1440000000000002e-06, "loss": 10.4157, "step": 1150 }, { "epoch": 0.04, "learning_rate": 1.1940000000000001e-06, "loss": 10.3647, "step": 1200 }, { "epoch": 0.04, "learning_rate": 1.244e-06, "loss": 9.9214, "step": 1250 }, { "epoch": 0.05, "learning_rate": 1.294e-06, "loss": 9.4672, "step": 1300 }, { "epoch": 0.05, "learning_rate": 1.344e-06, "loss": 9.6436, "step": 1350 }, { "epoch": 0.05, "learning_rate": 1.3940000000000001e-06, "loss": 9.3357, "step": 1400 }, { "epoch": 0.05, "learning_rate": 1.444e-06, "loss": 8.3043, "step": 1450 }, { "epoch": 0.05, "learning_rate": 1.4940000000000002e-06, "loss": 8.2694, "step": 1500 }, { "epoch": 0.05, "learning_rate": 1.5440000000000002e-06, "loss": 8.0348, "step": 1550 }, { "epoch": 0.06, "learning_rate": 1.594e-06, "loss": 7.7377, "step": 1600 }, { "epoch": 0.06, "learning_rate": 1.644e-06, "loss": 7.5757, "step": 1650 }, { "epoch": 0.06, "learning_rate": 1.694e-06, "loss": 7.4689, "step": 1700 }, { "epoch": 0.06, "learning_rate": 1.7440000000000002e-06, "loss": 6.9314, "step": 1750 }, { "epoch": 0.06, "learning_rate": 1.794e-06, "loss": 7.0793, "step": 1800 }, { "epoch": 0.07, "learning_rate": 1.8440000000000003e-06, "loss": 7.0355, "step": 1850 }, { "epoch": 0.07, "learning_rate": 1.8940000000000002e-06, "loss": 6.4377, "step": 1900 }, { "epoch": 0.07, "learning_rate": 1.944e-06, "loss": 6.5264, "step": 1950 }, { "epoch": 0.07, "learning_rate": 1.9940000000000003e-06, "loss": 6.3947, "step": 2000 }, { "epoch": 0.07, "learning_rate": 2.0440000000000003e-06, "loss": 6.1153, "step": 2050 }, { "epoch": 0.07, "learning_rate": 2.094e-06, "loss": 6.0151, "step": 2100 }, { "epoch": 0.08, "learning_rate": 2.144e-06, "loss": 6.0025, "step": 2150 }, { "epoch": 0.08, "learning_rate": 2.194e-06, "loss": 5.8175, "step": 2200 }, { "epoch": 0.08, "learning_rate": 2.244e-06, "loss": 5.6286, "step": 2250 }, { "epoch": 0.08, "learning_rate": 2.294e-06, "loss": 5.7398, "step": 2300 }, { "epoch": 0.08, "learning_rate": 2.3440000000000003e-06, "loss": 5.5829, "step": 2350 }, { "epoch": 0.08, "learning_rate": 2.3940000000000003e-06, "loss": 5.4584, "step": 2400 }, { "epoch": 0.09, "learning_rate": 2.443e-06, "loss": 5.5921, "step": 2450 }, { "epoch": 0.09, "learning_rate": 2.493e-06, "loss": 5.3032, "step": 2500 }, { "epoch": 0.09, "eval_loss": 7.053048133850098, "eval_runtime": 7.7457, "eval_samples_per_second": 183.328, "eval_steps_per_second": 11.49, "eval_wer": 1.0, "step": 2500 }, { "epoch": 0.09, "learning_rate": 2.5430000000000005e-06, "loss": 5.03, "step": 2550 }, { "epoch": 0.09, "learning_rate": 2.593e-06, "loss": 5.0891, "step": 2600 }, { "epoch": 0.09, "learning_rate": 2.643e-06, "loss": 5.0401, "step": 2650 }, { "epoch": 0.1, "learning_rate": 2.693e-06, "loss": 4.9428, "step": 2700 }, { "epoch": 0.1, "learning_rate": 2.7430000000000002e-06, "loss": 4.8569, "step": 2750 }, { "epoch": 0.1, "learning_rate": 2.793e-06, "loss": 4.7334, "step": 2800 }, { "epoch": 0.1, "learning_rate": 2.843e-06, "loss": 4.622, "step": 2850 }, { "epoch": 0.1, "learning_rate": 2.893e-06, "loss": 4.6339, "step": 2900 }, { "epoch": 0.1, "learning_rate": 2.9430000000000005e-06, "loss": 4.8513, "step": 2950 }, { "epoch": 0.11, "learning_rate": 2.9930000000000004e-06, "loss": 4.4769, "step": 3000 }, { "epoch": 0.11, "learning_rate": 3.0430000000000003e-06, "loss": 4.3885, "step": 3050 }, { "epoch": 0.11, "learning_rate": 3.0930000000000003e-06, "loss": 4.3643, "step": 3100 }, { "epoch": 0.11, "learning_rate": 3.1430000000000007e-06, "loss": 4.263, "step": 3150 }, { "epoch": 0.11, "learning_rate": 3.193e-06, "loss": 4.2107, "step": 3200 }, { "epoch": 0.11, "learning_rate": 3.243e-06, "loss": 4.302, "step": 3250 }, { "epoch": 0.12, "learning_rate": 3.293e-06, "loss": 4.21, "step": 3300 }, { "epoch": 0.12, "learning_rate": 3.343e-06, "loss": 4.1202, "step": 3350 }, { "epoch": 0.12, "learning_rate": 3.3930000000000004e-06, "loss": 4.0725, "step": 3400 }, { "epoch": 0.12, "learning_rate": 3.4430000000000003e-06, "loss": 4.0051, "step": 3450 }, { "epoch": 0.12, "learning_rate": 3.4930000000000003e-06, "loss": 4.0251, "step": 3500 }, { "epoch": 0.12, "learning_rate": 3.5430000000000002e-06, "loss": 4.0444, "step": 3550 }, { "epoch": 0.13, "learning_rate": 3.5930000000000006e-06, "loss": 3.8632, "step": 3600 }, { "epoch": 0.13, "learning_rate": 3.6430000000000005e-06, "loss": 3.8705, "step": 3650 }, { "epoch": 0.13, "learning_rate": 3.6930000000000005e-06, "loss": 3.8023, "step": 3700 }, { "epoch": 0.13, "learning_rate": 3.7430000000000004e-06, "loss": 3.7624, "step": 3750 }, { "epoch": 0.13, "learning_rate": 3.7930000000000004e-06, "loss": 3.7358, "step": 3800 }, { "epoch": 0.14, "learning_rate": 3.843e-06, "loss": 3.8833, "step": 3850 }, { "epoch": 0.14, "learning_rate": 3.893e-06, "loss": 3.7054, "step": 3900 }, { "epoch": 0.14, "learning_rate": 3.943e-06, "loss": 3.6743, "step": 3950 }, { "epoch": 0.14, "learning_rate": 3.9930000000000006e-06, "loss": 3.659, "step": 4000 }, { "epoch": 0.14, "learning_rate": 4.043e-06, "loss": 3.6112, "step": 4050 }, { "epoch": 0.14, "learning_rate": 4.0930000000000005e-06, "loss": 3.6801, "step": 4100 }, { "epoch": 0.15, "learning_rate": 4.143e-06, "loss": 3.5854, "step": 4150 }, { "epoch": 0.15, "learning_rate": 4.193e-06, "loss": 3.6023, "step": 4200 }, { "epoch": 0.15, "learning_rate": 4.243000000000001e-06, "loss": 3.5962, "step": 4250 }, { "epoch": 0.15, "learning_rate": 4.293e-06, "loss": 3.5521, "step": 4300 }, { "epoch": 0.15, "learning_rate": 4.343000000000001e-06, "loss": 3.5149, "step": 4350 }, { "epoch": 0.15, "learning_rate": 4.393000000000001e-06, "loss": 3.5215, "step": 4400 }, { "epoch": 0.16, "learning_rate": 4.4430000000000005e-06, "loss": 3.5136, "step": 4450 }, { "epoch": 0.16, "learning_rate": 4.493e-06, "loss": 3.5168, "step": 4500 }, { "epoch": 0.16, "learning_rate": 4.543e-06, "loss": 3.4727, "step": 4550 }, { "epoch": 0.16, "learning_rate": 4.593e-06, "loss": 3.4894, "step": 4600 }, { "epoch": 0.16, "learning_rate": 4.643e-06, "loss": 3.4889, "step": 4650 }, { "epoch": 0.17, "learning_rate": 4.693000000000001e-06, "loss": 3.4842, "step": 4700 }, { "epoch": 0.17, "learning_rate": 4.743e-06, "loss": 3.4439, "step": 4750 }, { "epoch": 0.17, "learning_rate": 4.7930000000000005e-06, "loss": 3.4434, "step": 4800 }, { "epoch": 0.17, "learning_rate": 4.843000000000001e-06, "loss": 3.4639, "step": 4850 }, { "epoch": 0.17, "learning_rate": 4.893e-06, "loss": 3.4605, "step": 4900 }, { "epoch": 0.17, "learning_rate": 4.943000000000001e-06, "loss": 3.4602, "step": 4950 }, { "epoch": 0.18, "learning_rate": 4.993e-06, "loss": 3.4521, "step": 5000 }, { "epoch": 0.18, "eval_loss": 3.601861000061035, "eval_runtime": 10.064, "eval_samples_per_second": 141.097, "eval_steps_per_second": 8.843, "eval_wer": 1.0, "step": 5000 }, { "epoch": 0.18, "learning_rate": 5.043e-06, "loss": 3.424, "step": 5050 }, { "epoch": 0.18, "learning_rate": 5.093e-06, "loss": 3.4384, "step": 5100 }, { "epoch": 0.18, "learning_rate": 5.1430000000000006e-06, "loss": 3.4357, "step": 5150 }, { "epoch": 0.18, "learning_rate": 5.193e-06, "loss": 3.508, "step": 5200 }, { "epoch": 0.18, "learning_rate": 5.2430000000000005e-06, "loss": 3.4305, "step": 5250 }, { "epoch": 0.19, "learning_rate": 5.293e-06, "loss": 3.4465, "step": 5300 }, { "epoch": 0.19, "learning_rate": 5.343e-06, "loss": 3.4168, "step": 5350 }, { "epoch": 0.19, "learning_rate": 5.393000000000001e-06, "loss": 3.4193, "step": 5400 }, { "epoch": 0.19, "learning_rate": 5.443e-06, "loss": 3.4385, "step": 5450 }, { "epoch": 0.19, "learning_rate": 5.493000000000001e-06, "loss": 3.4036, "step": 5500 }, { "epoch": 0.2, "learning_rate": 5.543000000000001e-06, "loss": 3.4101, "step": 5550 }, { "epoch": 0.2, "learning_rate": 5.5930000000000005e-06, "loss": 3.4081, "step": 5600 }, { "epoch": 0.2, "learning_rate": 5.643000000000001e-06, "loss": 3.3905, "step": 5650 }, { "epoch": 0.2, "learning_rate": 5.693e-06, "loss": 3.3937, "step": 5700 }, { "epoch": 0.2, "learning_rate": 5.743000000000001e-06, "loss": 3.4579, "step": 5750 }, { "epoch": 0.2, "learning_rate": 5.793000000000001e-06, "loss": 3.3738, "step": 5800 }, { "epoch": 0.21, "learning_rate": 5.843000000000001e-06, "loss": 3.385, "step": 5850 }, { "epoch": 0.21, "learning_rate": 5.893000000000001e-06, "loss": 3.3707, "step": 5900 }, { "epoch": 0.21, "learning_rate": 5.943000000000001e-06, "loss": 3.3747, "step": 5950 }, { "epoch": 0.21, "learning_rate": 5.993000000000001e-06, "loss": 3.359, "step": 6000 }, { "epoch": 0.21, "learning_rate": 6.0429999999999996e-06, "loss": 3.3753, "step": 6050 }, { "epoch": 0.21, "learning_rate": 6.093e-06, "loss": 3.3703, "step": 6100 }, { "epoch": 0.22, "learning_rate": 6.143e-06, "loss": 3.3744, "step": 6150 }, { "epoch": 0.22, "learning_rate": 6.193e-06, "loss": 3.4173, "step": 6200 }, { "epoch": 0.22, "learning_rate": 6.243e-06, "loss": 3.3541, "step": 6250 }, { "epoch": 0.22, "learning_rate": 6.2930000000000006e-06, "loss": 3.3675, "step": 6300 }, { "epoch": 0.22, "learning_rate": 6.343e-06, "loss": 3.3471, "step": 6350 }, { "epoch": 0.23, "learning_rate": 6.3930000000000005e-06, "loss": 3.3558, "step": 6400 }, { "epoch": 0.23, "learning_rate": 6.443e-06, "loss": 3.335, "step": 6450 }, { "epoch": 0.23, "learning_rate": 6.493e-06, "loss": 3.3344, "step": 6500 }, { "epoch": 0.23, "learning_rate": 6.543000000000001e-06, "loss": 3.3296, "step": 6550 }, { "epoch": 0.23, "learning_rate": 6.593e-06, "loss": 3.3459, "step": 6600 }, { "epoch": 0.23, "learning_rate": 6.643000000000001e-06, "loss": 3.3453, "step": 6650 }, { "epoch": 0.24, "learning_rate": 6.693000000000001e-06, "loss": 3.3491, "step": 6700 }, { "epoch": 0.24, "learning_rate": 6.7430000000000005e-06, "loss": 3.3249, "step": 6750 }, { "epoch": 0.24, "learning_rate": 6.793000000000001e-06, "loss": 3.3246, "step": 6800 }, { "epoch": 0.24, "learning_rate": 6.843e-06, "loss": 3.3178, "step": 6850 }, { "epoch": 0.24, "learning_rate": 6.893000000000001e-06, "loss": 3.3216, "step": 6900 }, { "epoch": 0.24, "learning_rate": 6.943000000000001e-06, "loss": 3.3597, "step": 6950 }, { "epoch": 0.25, "learning_rate": 6.993000000000001e-06, "loss": 3.3181, "step": 7000 }, { "epoch": 0.25, "learning_rate": 7.043000000000001e-06, "loss": 3.3265, "step": 7050 }, { "epoch": 0.25, "learning_rate": 7.093000000000001e-06, "loss": 3.3375, "step": 7100 }, { "epoch": 0.25, "learning_rate": 7.143000000000001e-06, "loss": 3.3365, "step": 7150 }, { "epoch": 0.25, "learning_rate": 7.193000000000001e-06, "loss": 3.3036, "step": 7200 }, { "epoch": 0.26, "learning_rate": 7.243000000000001e-06, "loss": 3.3252, "step": 7250 }, { "epoch": 0.26, "learning_rate": 7.293e-06, "loss": 3.3059, "step": 7300 }, { "epoch": 0.26, "learning_rate": 7.343e-06, "loss": 3.328, "step": 7350 }, { "epoch": 0.26, "learning_rate": 7.393e-06, "loss": 3.3056, "step": 7400 }, { "epoch": 0.26, "learning_rate": 7.4430000000000006e-06, "loss": 3.3207, "step": 7450 }, { "epoch": 0.26, "learning_rate": 7.493e-06, "loss": 3.3037, "step": 7500 }, { "epoch": 0.26, "eval_loss": 3.493137836456299, "eval_runtime": 10.1789, "eval_samples_per_second": 139.505, "eval_steps_per_second": 8.744, "eval_wer": 1.0, "step": 7500 }, { "epoch": 0.27, "learning_rate": 7.5430000000000005e-06, "loss": 3.308, "step": 7550 }, { "epoch": 0.27, "learning_rate": 7.593e-06, "loss": 3.3127, "step": 7600 }, { "epoch": 0.27, "learning_rate": 7.643000000000001e-06, "loss": 3.3121, "step": 7650 }, { "epoch": 0.27, "learning_rate": 7.693e-06, "loss": 3.3238, "step": 7700 }, { "epoch": 0.27, "learning_rate": 7.743e-06, "loss": 3.3304, "step": 7750 }, { "epoch": 0.27, "learning_rate": 7.793e-06, "loss": 3.3204, "step": 7800 }, { "epoch": 0.28, "learning_rate": 7.843000000000001e-06, "loss": 3.3014, "step": 7850 }, { "epoch": 0.28, "learning_rate": 7.893e-06, "loss": 3.3343, "step": 7900 }, { "epoch": 0.28, "learning_rate": 7.943e-06, "loss": 3.3093, "step": 7950 }, { "epoch": 0.28, "learning_rate": 7.993000000000001e-06, "loss": 3.3117, "step": 8000 }, { "epoch": 0.28, "learning_rate": 8.043e-06, "loss": 3.2943, "step": 8050 }, { "epoch": 0.29, "learning_rate": 8.093e-06, "loss": 3.2958, "step": 8100 }, { "epoch": 0.29, "learning_rate": 8.143000000000001e-06, "loss": 3.3454, "step": 8150 }, { "epoch": 0.29, "learning_rate": 8.193000000000001e-06, "loss": 3.3037, "step": 8200 }, { "epoch": 0.29, "learning_rate": 8.243e-06, "loss": 3.2979, "step": 8250 }, { "epoch": 0.29, "learning_rate": 8.293000000000002e-06, "loss": 3.2942, "step": 8300 }, { "epoch": 0.29, "learning_rate": 8.343000000000001e-06, "loss": 3.2869, "step": 8350 }, { "epoch": 0.3, "learning_rate": 8.393e-06, "loss": 3.3271, "step": 8400 }, { "epoch": 0.3, "learning_rate": 8.443000000000002e-06, "loss": 3.337, "step": 8450 }, { "epoch": 0.3, "learning_rate": 8.493000000000002e-06, "loss": 3.3157, "step": 8500 }, { "epoch": 0.3, "learning_rate": 8.543e-06, "loss": 3.3043, "step": 8550 }, { "epoch": 0.3, "learning_rate": 8.593e-06, "loss": 3.2915, "step": 8600 }, { "epoch": 0.3, "learning_rate": 8.643e-06, "loss": 3.2816, "step": 8650 }, { "epoch": 0.31, "learning_rate": 8.693e-06, "loss": 3.2882, "step": 8700 }, { "epoch": 0.31, "learning_rate": 8.743e-06, "loss": 3.2922, "step": 8750 }, { "epoch": 0.31, "learning_rate": 8.793e-06, "loss": 3.2966, "step": 8800 }, { "epoch": 0.31, "learning_rate": 8.843e-06, "loss": 3.2851, "step": 8850 }, { "epoch": 0.31, "learning_rate": 8.893000000000001e-06, "loss": 3.2923, "step": 8900 }, { "epoch": 0.32, "learning_rate": 8.943e-06, "loss": 3.2764, "step": 8950 }, { "epoch": 0.32, "learning_rate": 8.993e-06, "loss": 3.2968, "step": 9000 }, { "epoch": 0.32, "learning_rate": 9.043000000000001e-06, "loss": 3.263, "step": 9050 }, { "epoch": 0.32, "learning_rate": 9.093000000000001e-06, "loss": 3.2895, "step": 9100 }, { "epoch": 0.32, "learning_rate": 9.143e-06, "loss": 3.3235, "step": 9150 }, { "epoch": 0.32, "learning_rate": 9.193000000000002e-06, "loss": 3.2993, "step": 9200 }, { "epoch": 0.33, "learning_rate": 9.243000000000001e-06, "loss": 3.3241, "step": 9250 }, { "epoch": 0.33, "learning_rate": 9.293e-06, "loss": 3.2813, "step": 9300 }, { "epoch": 0.33, "learning_rate": 9.343e-06, "loss": 3.2898, "step": 9350 }, { "epoch": 0.33, "learning_rate": 9.393000000000001e-06, "loss": 3.2506, "step": 9400 }, { "epoch": 0.33, "learning_rate": 9.443000000000001e-06, "loss": 3.3176, "step": 9450 }, { "epoch": 0.33, "learning_rate": 9.493e-06, "loss": 3.3087, "step": 9500 }, { "epoch": 0.34, "learning_rate": 9.543000000000002e-06, "loss": 3.2961, "step": 9550 }, { "epoch": 0.34, "learning_rate": 9.593000000000001e-06, "loss": 3.2858, "step": 9600 }, { "epoch": 0.34, "learning_rate": 9.643e-06, "loss": 3.267, "step": 9650 }, { "epoch": 0.34, "learning_rate": 9.692e-06, "loss": 3.3293, "step": 9700 }, { "epoch": 0.34, "learning_rate": 9.742000000000001e-06, "loss": 3.2597, "step": 9750 }, { "epoch": 0.35, "learning_rate": 9.792e-06, "loss": 3.2411, "step": 9800 }, { "epoch": 0.35, "learning_rate": 9.842e-06, "loss": 3.23, "step": 9850 }, { "epoch": 0.35, "learning_rate": 9.892000000000001e-06, "loss": 3.3535, "step": 9900 }, { "epoch": 0.35, "learning_rate": 9.942e-06, "loss": 3.2285, "step": 9950 }, { "epoch": 0.35, "learning_rate": 9.992e-06, "loss": 3.2012, "step": 10000 }, { "epoch": 0.35, "eval_loss": 3.419313907623291, "eval_runtime": 12.0256, "eval_samples_per_second": 118.081, "eval_steps_per_second": 7.401, "eval_wer": 1.0, "step": 10000 }, { "epoch": 0.35, "learning_rate": 1.0042000000000001e-05, "loss": 3.1657, "step": 10050 }, { "epoch": 0.36, "learning_rate": 1.0092000000000001e-05, "loss": 3.1619, "step": 10100 }, { "epoch": 0.36, "learning_rate": 1.0142e-05, "loss": 3.2113, "step": 10150 }, { "epoch": 0.36, "learning_rate": 1.0192000000000002e-05, "loss": 3.1313, "step": 10200 }, { "epoch": 0.36, "learning_rate": 1.0242000000000001e-05, "loss": 3.1489, "step": 10250 }, { "epoch": 0.36, "learning_rate": 1.0291999999999999e-05, "loss": 3.0888, "step": 10300 }, { "epoch": 0.36, "learning_rate": 1.0342e-05, "loss": 3.1901, "step": 10350 }, { "epoch": 0.37, "learning_rate": 1.0392e-05, "loss": 3.1994, "step": 10400 }, { "epoch": 0.37, "learning_rate": 1.0442000000000001e-05, "loss": 3.0744, "step": 10450 }, { "epoch": 0.37, "learning_rate": 1.0492e-05, "loss": 3.0529, "step": 10500 }, { "epoch": 0.37, "learning_rate": 1.0542000000000002e-05, "loss": 3.0715, "step": 10550 }, { "epoch": 0.37, "learning_rate": 1.0592e-05, "loss": 3.0427, "step": 10600 }, { "epoch": 0.37, "learning_rate": 1.0642e-05, "loss": 3.0184, "step": 10650 }, { "epoch": 0.38, "learning_rate": 1.0692e-05, "loss": 3.0148, "step": 10700 }, { "epoch": 0.38, "learning_rate": 1.0742000000000002e-05, "loss": 3.0003, "step": 10750 }, { "epoch": 0.38, "learning_rate": 1.0792000000000001e-05, "loss": 3.0029, "step": 10800 }, { "epoch": 0.38, "learning_rate": 1.0842000000000002e-05, "loss": 3.0047, "step": 10850 }, { "epoch": 0.38, "learning_rate": 1.0892e-05, "loss": 2.9589, "step": 10900 }, { "epoch": 0.39, "learning_rate": 1.0942000000000001e-05, "loss": 2.9764, "step": 10950 }, { "epoch": 0.39, "learning_rate": 1.0992e-05, "loss": 2.9356, "step": 11000 }, { "epoch": 0.39, "learning_rate": 1.1042000000000002e-05, "loss": 2.9042, "step": 11050 }, { "epoch": 0.39, "learning_rate": 1.1092e-05, "loss": 2.9244, "step": 11100 }, { "epoch": 0.39, "learning_rate": 1.1142000000000001e-05, "loss": 2.8914, "step": 11150 }, { "epoch": 0.39, "learning_rate": 1.1192e-05, "loss": 2.8736, "step": 11200 }, { "epoch": 0.4, "learning_rate": 1.1242000000000002e-05, "loss": 2.8538, "step": 11250 }, { "epoch": 0.4, "learning_rate": 1.1292000000000001e-05, "loss": 2.9744, "step": 11300 }, { "epoch": 0.4, "learning_rate": 1.1342000000000003e-05, "loss": 2.8937, "step": 11350 }, { "epoch": 0.4, "learning_rate": 1.1392e-05, "loss": 2.8238, "step": 11400 }, { "epoch": 0.4, "learning_rate": 1.1442000000000002e-05, "loss": 2.7929, "step": 11450 }, { "epoch": 0.4, "learning_rate": 1.1492000000000001e-05, "loss": 2.8081, "step": 11500 }, { "epoch": 0.41, "learning_rate": 1.1542e-05, "loss": 2.8633, "step": 11550 }, { "epoch": 0.41, "learning_rate": 1.1592000000000002e-05, "loss": 2.7273, "step": 11600 }, { "epoch": 0.41, "learning_rate": 1.1642e-05, "loss": 2.7504, "step": 11650 }, { "epoch": 0.41, "learning_rate": 1.1692000000000001e-05, "loss": 2.7028, "step": 11700 }, { "epoch": 0.41, "learning_rate": 1.1742e-05, "loss": 2.6851, "step": 11750 }, { "epoch": 0.42, "learning_rate": 1.1792000000000002e-05, "loss": 2.665, "step": 11800 }, { "epoch": 0.42, "learning_rate": 1.1842e-05, "loss": 2.5866, "step": 11850 }, { "epoch": 0.42, "learning_rate": 1.1892e-05, "loss": 2.609, "step": 11900 }, { "epoch": 0.42, "learning_rate": 1.1942e-05, "loss": 2.6202, "step": 11950 }, { "epoch": 0.42, "learning_rate": 1.1992000000000001e-05, "loss": 2.5421, "step": 12000 }, { "epoch": 0.42, "learning_rate": 1.2042000000000001e-05, "loss": 2.5052, "step": 12050 }, { "epoch": 0.43, "learning_rate": 1.2092000000000002e-05, "loss": 2.4689, "step": 12100 }, { "epoch": 0.43, "learning_rate": 1.2142e-05, "loss": 2.4317, "step": 12150 }, { "epoch": 0.43, "learning_rate": 1.2192000000000001e-05, "loss": 2.4919, "step": 12200 }, { "epoch": 0.43, "learning_rate": 1.2242e-05, "loss": 2.3886, "step": 12250 }, { "epoch": 0.43, "learning_rate": 1.2292000000000002e-05, "loss": 2.3378, "step": 12300 }, { "epoch": 0.43, "learning_rate": 1.2342000000000001e-05, "loss": 2.3704, "step": 12350 }, { "epoch": 0.44, "learning_rate": 1.2392000000000003e-05, "loss": 2.3586, "step": 12400 }, { "epoch": 0.44, "learning_rate": 1.2442e-05, "loss": 2.3901, "step": 12450 }, { "epoch": 0.44, "learning_rate": 1.2492000000000002e-05, "loss": 2.3026, "step": 12500 }, { "epoch": 0.44, "eval_loss": 1.9423085451126099, "eval_runtime": 124.9728, "eval_samples_per_second": 11.362, "eval_steps_per_second": 0.712, "eval_wer": 0.9872923663429246, "step": 12500 }, { "epoch": 0.44, "learning_rate": 1.2542000000000001e-05, "loss": 2.2366, "step": 12550 }, { "epoch": 0.44, "learning_rate": 1.2592000000000002e-05, "loss": 2.199, "step": 12600 }, { "epoch": 0.45, "learning_rate": 1.2642e-05, "loss": 2.2084, "step": 12650 }, { "epoch": 0.45, "learning_rate": 1.2692000000000001e-05, "loss": 2.2424, "step": 12700 }, { "epoch": 0.45, "learning_rate": 1.2742000000000001e-05, "loss": 2.148, "step": 12750 }, { "epoch": 0.45, "learning_rate": 1.2792e-05, "loss": 2.0756, "step": 12800 }, { "epoch": 0.45, "learning_rate": 1.2842000000000002e-05, "loss": 2.0907, "step": 12850 }, { "epoch": 0.45, "learning_rate": 1.2892e-05, "loss": 2.0458, "step": 12900 }, { "epoch": 0.46, "learning_rate": 1.2942e-05, "loss": 2.0054, "step": 12950 }, { "epoch": 0.46, "learning_rate": 1.2992e-05, "loss": 2.0198, "step": 13000 }, { "epoch": 0.46, "learning_rate": 1.3041000000000001e-05, "loss": 2.1357, "step": 13050 }, { "epoch": 0.46, "learning_rate": 1.3091e-05, "loss": 2.0381, "step": 13100 }, { "epoch": 0.46, "learning_rate": 1.3141000000000002e-05, "loss": 2.0359, "step": 13150 }, { "epoch": 0.46, "learning_rate": 1.3191000000000001e-05, "loss": 1.9001, "step": 13200 }, { "epoch": 0.47, "learning_rate": 1.3241e-05, "loss": 1.9348, "step": 13250 }, { "epoch": 0.47, "learning_rate": 1.3291e-05, "loss": 1.8653, "step": 13300 }, { "epoch": 0.47, "learning_rate": 1.3341000000000002e-05, "loss": 1.8422, "step": 13350 }, { "epoch": 0.47, "learning_rate": 1.3391000000000001e-05, "loss": 1.882, "step": 13400 }, { "epoch": 0.47, "learning_rate": 1.3441000000000002e-05, "loss": 1.824, "step": 13450 }, { "epoch": 0.48, "learning_rate": 1.3491e-05, "loss": 1.8367, "step": 13500 }, { "epoch": 0.48, "learning_rate": 1.3541000000000001e-05, "loss": 1.837, "step": 13550 }, { "epoch": 0.48, "learning_rate": 1.3591e-05, "loss": 1.8585, "step": 13600 }, { "epoch": 0.48, "learning_rate": 1.3641000000000002e-05, "loss": 1.7428, "step": 13650 }, { "epoch": 0.48, "learning_rate": 1.3691000000000002e-05, "loss": 1.7128, "step": 13700 }, { "epoch": 0.48, "learning_rate": 1.3741000000000003e-05, "loss": 1.7281, "step": 13750 }, { "epoch": 0.49, "learning_rate": 1.3791e-05, "loss": 1.6616, "step": 13800 }, { "epoch": 0.49, "learning_rate": 1.3841000000000002e-05, "loss": 1.8904, "step": 13850 }, { "epoch": 0.49, "learning_rate": 1.3891000000000001e-05, "loss": 1.6556, "step": 13900 }, { "epoch": 0.49, "learning_rate": 1.3941000000000001e-05, "loss": 1.6314, "step": 13950 }, { "epoch": 0.49, "learning_rate": 1.3991000000000002e-05, "loss": 1.63, "step": 14000 }, { "epoch": 0.49, "learning_rate": 1.4041e-05, "loss": 1.6098, "step": 14050 }, { "epoch": 0.5, "learning_rate": 1.4091000000000001e-05, "loss": 1.661, "step": 14100 }, { "epoch": 0.5, "learning_rate": 1.4141e-05, "loss": 1.5996, "step": 14150 }, { "epoch": 0.5, "learning_rate": 1.4191000000000002e-05, "loss": 1.7523, "step": 14200 }, { "epoch": 0.5, "learning_rate": 1.4241e-05, "loss": 1.5367, "step": 14250 }, { "epoch": 0.5, "learning_rate": 1.4291000000000001e-05, "loss": 1.5391, "step": 14300 }, { "epoch": 0.51, "learning_rate": 1.4341e-05, "loss": 1.5598, "step": 14350 }, { "epoch": 0.51, "learning_rate": 1.4391000000000002e-05, "loss": 1.4563, "step": 14400 }, { "epoch": 0.51, "learning_rate": 1.4441000000000001e-05, "loss": 1.4344, "step": 14450 }, { "epoch": 0.51, "learning_rate": 1.4491000000000002e-05, "loss": 1.4759, "step": 14500 }, { "epoch": 0.51, "learning_rate": 1.4541e-05, "loss": 1.5761, "step": 14550 }, { "epoch": 0.51, "learning_rate": 1.4591000000000001e-05, "loss": 1.4589, "step": 14600 }, { "epoch": 0.52, "learning_rate": 1.4641000000000001e-05, "loss": 1.6196, "step": 14650 }, { "epoch": 0.52, "learning_rate": 1.4691000000000002e-05, "loss": 1.4332, "step": 14700 }, { "epoch": 0.52, "learning_rate": 1.4741000000000002e-05, "loss": 1.5231, "step": 14750 }, { "epoch": 0.52, "learning_rate": 1.4791000000000001e-05, "loss": 1.4294, "step": 14800 }, { "epoch": 0.52, "learning_rate": 1.4841e-05, "loss": 1.4149, "step": 14850 }, { "epoch": 0.52, "learning_rate": 1.4891000000000002e-05, "loss": 1.5815, "step": 14900 }, { "epoch": 0.53, "learning_rate": 1.4941000000000001e-05, "loss": 1.4123, "step": 14950 }, { "epoch": 0.53, "learning_rate": 1.4991000000000003e-05, "loss": 1.4238, "step": 15000 }, { "epoch": 0.53, "eval_loss": 0.8772240877151489, "eval_runtime": 12.5995, "eval_samples_per_second": 112.703, "eval_steps_per_second": 7.064, "eval_wer": 0.6695107561042026, "step": 15000 }, { "epoch": 0.53, "learning_rate": 1.5041e-05, "loss": 1.4982, "step": 15050 }, { "epoch": 0.53, "learning_rate": 1.5091000000000002e-05, "loss": 1.3728, "step": 15100 }, { "epoch": 0.53, "learning_rate": 1.5141000000000001e-05, "loss": 1.2692, "step": 15150 }, { "epoch": 0.54, "learning_rate": 1.5191e-05, "loss": 1.2939, "step": 15200 }, { "epoch": 0.54, "learning_rate": 1.5241000000000002e-05, "loss": 1.3519, "step": 15250 }, { "epoch": 0.54, "learning_rate": 1.5291e-05, "loss": 1.3453, "step": 15300 }, { "epoch": 0.54, "learning_rate": 1.5341e-05, "loss": 1.2795, "step": 15350 }, { "epoch": 0.54, "learning_rate": 1.5391e-05, "loss": 1.3077, "step": 15400 }, { "epoch": 0.54, "learning_rate": 1.5441e-05, "loss": 1.3132, "step": 15450 }, { "epoch": 0.55, "learning_rate": 1.5491e-05, "loss": 1.2635, "step": 15500 }, { "epoch": 0.55, "learning_rate": 1.554e-05, "loss": 1.3806, "step": 15550 }, { "epoch": 0.55, "learning_rate": 1.559e-05, "loss": 1.2733, "step": 15600 }, { "epoch": 0.55, "learning_rate": 1.5640000000000003e-05, "loss": 1.227, "step": 15650 }, { "epoch": 0.55, "learning_rate": 1.569e-05, "loss": 1.1915, "step": 15700 }, { "epoch": 0.55, "learning_rate": 1.5740000000000002e-05, "loss": 1.2593, "step": 15750 }, { "epoch": 0.56, "learning_rate": 1.579e-05, "loss": 1.2529, "step": 15800 }, { "epoch": 0.56, "learning_rate": 1.584e-05, "loss": 1.1973, "step": 15850 }, { "epoch": 0.56, "learning_rate": 1.5890000000000002e-05, "loss": 1.1813, "step": 15900 }, { "epoch": 0.56, "learning_rate": 1.5940000000000003e-05, "loss": 1.236, "step": 15950 }, { "epoch": 0.56, "learning_rate": 1.599e-05, "loss": 1.1579, "step": 16000 }, { "epoch": 0.57, "learning_rate": 1.6040000000000002e-05, "loss": 1.1937, "step": 16050 }, { "epoch": 0.57, "learning_rate": 1.609e-05, "loss": 1.1705, "step": 16100 }, { "epoch": 0.57, "learning_rate": 1.614e-05, "loss": 1.3132, "step": 16150 }, { "epoch": 0.57, "learning_rate": 1.6190000000000003e-05, "loss": 1.1325, "step": 16200 }, { "epoch": 0.57, "learning_rate": 1.6240000000000004e-05, "loss": 1.1535, "step": 16250 }, { "epoch": 0.57, "learning_rate": 1.629e-05, "loss": 1.1045, "step": 16300 }, { "epoch": 0.58, "learning_rate": 1.634e-05, "loss": 1.1623, "step": 16350 }, { "epoch": 0.58, "learning_rate": 1.639e-05, "loss": 1.148, "step": 16400 }, { "epoch": 0.58, "learning_rate": 1.6440000000000002e-05, "loss": 1.1202, "step": 16450 }, { "epoch": 0.58, "learning_rate": 1.6490000000000003e-05, "loss": 1.1157, "step": 16500 }, { "epoch": 0.58, "learning_rate": 1.6539000000000002e-05, "loss": 1.146, "step": 16550 }, { "epoch": 0.58, "learning_rate": 1.6589000000000003e-05, "loss": 1.1423, "step": 16600 }, { "epoch": 0.59, "learning_rate": 1.6639e-05, "loss": 1.1504, "step": 16650 }, { "epoch": 0.59, "learning_rate": 1.6689000000000002e-05, "loss": 1.1099, "step": 16700 }, { "epoch": 0.59, "learning_rate": 1.6739e-05, "loss": 1.1227, "step": 16750 }, { "epoch": 0.59, "learning_rate": 1.6789e-05, "loss": 1.0735, "step": 16800 }, { "epoch": 0.59, "learning_rate": 1.6839000000000003e-05, "loss": 1.2835, "step": 16850 }, { "epoch": 0.6, "learning_rate": 1.6889e-05, "loss": 1.0772, "step": 16900 }, { "epoch": 0.6, "learning_rate": 1.6939e-05, "loss": 1.2067, "step": 16950 }, { "epoch": 0.6, "learning_rate": 1.6989000000000003e-05, "loss": 1.1242, "step": 17000 }, { "epoch": 0.6, "learning_rate": 1.7039e-05, "loss": 1.1571, "step": 17050 }, { "epoch": 0.6, "learning_rate": 1.7089000000000002e-05, "loss": 1.05, "step": 17100 }, { "epoch": 0.6, "learning_rate": 1.7139e-05, "loss": 1.0158, "step": 17150 }, { "epoch": 0.61, "learning_rate": 1.7189e-05, "loss": 1.1355, "step": 17200 }, { "epoch": 0.61, "learning_rate": 1.7239000000000002e-05, "loss": 1.0928, "step": 17250 }, { "epoch": 0.61, "learning_rate": 1.7289000000000003e-05, "loss": 1.148, "step": 17300 }, { "epoch": 0.61, "learning_rate": 1.7339e-05, "loss": 1.0782, "step": 17350 }, { "epoch": 0.61, "learning_rate": 1.7389e-05, "loss": 0.9891, "step": 17400 }, { "epoch": 0.61, "learning_rate": 1.7439e-05, "loss": 1.0428, "step": 17450 }, { "epoch": 0.62, "learning_rate": 1.7489e-05, "loss": 1.1592, "step": 17500 }, { "epoch": 0.62, "eval_loss": 0.6630315780639648, "eval_runtime": 90.475, "eval_samples_per_second": 15.695, "eval_steps_per_second": 0.984, "eval_wer": 0.5011346101479531, "step": 17500 }, { "epoch": 0.62, "learning_rate": 1.7539000000000003e-05, "loss": 1.2172, "step": 17550 }, { "epoch": 0.62, "learning_rate": 1.7589e-05, "loss": 1.1639, "step": 17600 }, { "epoch": 0.62, "learning_rate": 1.7639000000000002e-05, "loss": 1.0972, "step": 17650 }, { "epoch": 0.62, "learning_rate": 1.7689e-05, "loss": 1.007, "step": 17700 }, { "epoch": 0.62, "learning_rate": 1.7739e-05, "loss": 1.019, "step": 17750 }, { "epoch": 0.63, "learning_rate": 1.7789000000000002e-05, "loss": 1.0055, "step": 17800 }, { "epoch": 0.63, "learning_rate": 1.7839000000000003e-05, "loss": 1.1827, "step": 17850 }, { "epoch": 0.63, "learning_rate": 1.7889e-05, "loss": 0.9894, "step": 17900 }, { "epoch": 0.63, "learning_rate": 1.7939000000000002e-05, "loss": 1.0019, "step": 17950 }, { "epoch": 0.63, "learning_rate": 1.7989e-05, "loss": 0.9912, "step": 18000 }, { "epoch": 0.64, "learning_rate": 1.8039e-05, "loss": 1.0662, "step": 18050 }, { "epoch": 0.64, "learning_rate": 1.8089000000000002e-05, "loss": 1.0172, "step": 18100 }, { "epoch": 0.64, "learning_rate": 1.8139000000000004e-05, "loss": 1.0089, "step": 18150 }, { "epoch": 0.64, "learning_rate": 1.8189e-05, "loss": 0.962, "step": 18200 }, { "epoch": 0.64, "learning_rate": 1.8239000000000003e-05, "loss": 1.0009, "step": 18250 }, { "epoch": 0.64, "learning_rate": 1.8289e-05, "loss": 1.0143, "step": 18300 }, { "epoch": 0.65, "learning_rate": 1.8339000000000002e-05, "loss": 0.9687, "step": 18350 }, { "epoch": 0.65, "learning_rate": 1.8389e-05, "loss": 0.9504, "step": 18400 }, { "epoch": 0.65, "learning_rate": 1.8439e-05, "loss": 0.9868, "step": 18450 }, { "epoch": 0.65, "learning_rate": 1.8489000000000002e-05, "loss": 0.9756, "step": 18500 }, { "epoch": 0.65, "learning_rate": 1.8539000000000003e-05, "loss": 1.1523, "step": 18550 }, { "epoch": 0.65, "learning_rate": 1.8589e-05, "loss": 1.1513, "step": 18600 }, { "epoch": 0.66, "learning_rate": 1.8639e-05, "loss": 0.9949, "step": 18650 }, { "epoch": 0.66, "learning_rate": 1.8689e-05, "loss": 0.9231, "step": 18700 }, { "epoch": 0.66, "learning_rate": 1.8739e-05, "loss": 0.9968, "step": 18750 }, { "epoch": 0.66, "learning_rate": 1.8789000000000003e-05, "loss": 0.9144, "step": 18800 }, { "epoch": 0.66, "learning_rate": 1.8839e-05, "loss": 0.956, "step": 18850 }, { "epoch": 0.67, "learning_rate": 1.8889e-05, "loss": 0.9801, "step": 18900 }, { "epoch": 0.67, "learning_rate": 1.8939e-05, "loss": 1.1259, "step": 18950 }, { "epoch": 0.67, "learning_rate": 1.8989e-05, "loss": 0.9337, "step": 19000 }, { "epoch": 0.67, "learning_rate": 1.9039000000000002e-05, "loss": 0.9623, "step": 19050 }, { "epoch": 0.67, "learning_rate": 1.9089000000000003e-05, "loss": 1.149, "step": 19100 }, { "epoch": 0.67, "learning_rate": 1.9139e-05, "loss": 0.9086, "step": 19150 }, { "epoch": 0.68, "learning_rate": 1.9189000000000002e-05, "loss": 1.0715, "step": 19200 }, { "epoch": 0.68, "learning_rate": 1.9239e-05, "loss": 0.9143, "step": 19250 }, { "epoch": 0.68, "learning_rate": 1.9289e-05, "loss": 0.9389, "step": 19300 }, { "epoch": 0.68, "learning_rate": 1.9339000000000002e-05, "loss": 0.905, "step": 19350 }, { "epoch": 0.68, "learning_rate": 1.9389000000000004e-05, "loss": 0.9098, "step": 19400 }, { "epoch": 0.68, "learning_rate": 1.9439e-05, "loss": 0.9275, "step": 19450 }, { "epoch": 0.69, "learning_rate": 1.9489000000000003e-05, "loss": 0.942, "step": 19500 }, { "epoch": 0.69, "learning_rate": 1.9539e-05, "loss": 0.9299, "step": 19550 }, { "epoch": 0.69, "learning_rate": 1.9589e-05, "loss": 0.8564, "step": 19600 }, { "epoch": 0.69, "learning_rate": 1.9639000000000003e-05, "loss": 0.9457, "step": 19650 }, { "epoch": 0.69, "learning_rate": 1.9689000000000004e-05, "loss": 0.9373, "step": 19700 }, { "epoch": 0.7, "learning_rate": 1.9739000000000002e-05, "loss": 0.9528, "step": 19750 }, { "epoch": 0.7, "learning_rate": 1.9789000000000003e-05, "loss": 0.8714, "step": 19800 }, { "epoch": 0.7, "learning_rate": 1.9839e-05, "loss": 0.8855, "step": 19850 }, { "epoch": 0.7, "learning_rate": 1.9889000000000002e-05, "loss": 0.8884, "step": 19900 }, { "epoch": 0.7, "learning_rate": 1.9939e-05, "loss": 0.8832, "step": 19950 }, { "epoch": 0.7, "learning_rate": 1.9989e-05, "loss": 0.861, "step": 20000 }, { "epoch": 0.7, "eval_loss": 0.5460492968559265, "eval_runtime": 99.9659, "eval_samples_per_second": 14.205, "eval_steps_per_second": 0.89, "eval_wer": 0.4238903512753018, "step": 20000 }, { "epoch": 0.71, "learning_rate": 1.999566666666667e-05, "loss": 0.9192, "step": 20050 }, { "epoch": 0.71, "learning_rate": 1.9990111111111113e-05, "loss": 0.8652, "step": 20100 }, { "epoch": 0.71, "learning_rate": 1.998455555555556e-05, "loss": 0.8969, "step": 20150 }, { "epoch": 0.71, "learning_rate": 1.9979000000000003e-05, "loss": 0.8931, "step": 20200 }, { "epoch": 0.71, "learning_rate": 1.9973444444444447e-05, "loss": 0.8594, "step": 20250 }, { "epoch": 0.71, "learning_rate": 1.996788888888889e-05, "loss": 0.9658, "step": 20300 }, { "epoch": 0.72, "learning_rate": 1.9962333333333334e-05, "loss": 0.8561, "step": 20350 }, { "epoch": 0.72, "learning_rate": 1.995677777777778e-05, "loss": 0.8758, "step": 20400 }, { "epoch": 0.72, "learning_rate": 1.9951222222222224e-05, "loss": 1.0173, "step": 20450 }, { "epoch": 0.72, "learning_rate": 1.9945666666666668e-05, "loss": 0.8666, "step": 20500 }, { "epoch": 0.72, "learning_rate": 1.9940111111111115e-05, "loss": 0.8382, "step": 20550 }, { "epoch": 0.73, "learning_rate": 1.9934555555555558e-05, "loss": 0.8602, "step": 20600 }, { "epoch": 0.73, "learning_rate": 1.9929000000000002e-05, "loss": 0.8674, "step": 20650 }, { "epoch": 0.73, "learning_rate": 1.9923444444444445e-05, "loss": 0.9336, "step": 20700 }, { "epoch": 0.73, "learning_rate": 1.991788888888889e-05, "loss": 0.8985, "step": 20750 }, { "epoch": 0.73, "learning_rate": 1.9912333333333336e-05, "loss": 0.8497, "step": 20800 }, { "epoch": 0.73, "learning_rate": 1.990677777777778e-05, "loss": 0.8835, "step": 20850 }, { "epoch": 0.74, "learning_rate": 1.9901222222222223e-05, "loss": 0.926, "step": 20900 }, { "epoch": 0.74, "learning_rate": 1.989566666666667e-05, "loss": 0.8632, "step": 20950 }, { "epoch": 0.74, "learning_rate": 1.9890111111111113e-05, "loss": 0.91, "step": 21000 }, { "epoch": 0.74, "learning_rate": 1.9884555555555557e-05, "loss": 0.8077, "step": 21050 }, { "epoch": 0.74, "learning_rate": 1.9879e-05, "loss": 0.8736, "step": 21100 }, { "epoch": 0.74, "learning_rate": 1.9873444444444444e-05, "loss": 0.8236, "step": 21150 }, { "epoch": 0.75, "learning_rate": 1.986788888888889e-05, "loss": 0.8167, "step": 21200 }, { "epoch": 0.75, "learning_rate": 1.9862333333333335e-05, "loss": 0.8408, "step": 21250 }, { "epoch": 0.75, "learning_rate": 1.985677777777778e-05, "loss": 0.8454, "step": 21300 }, { "epoch": 0.75, "learning_rate": 1.9851333333333334e-05, "loss": 1.0975, "step": 21350 }, { "epoch": 0.75, "learning_rate": 1.9845777777777778e-05, "loss": 0.9236, "step": 21400 }, { "epoch": 0.76, "learning_rate": 1.984022222222222e-05, "loss": 0.8169, "step": 21450 }, { "epoch": 0.76, "learning_rate": 1.9834666666666668e-05, "loss": 0.8352, "step": 21500 }, { "epoch": 0.76, "learning_rate": 1.9829111111111112e-05, "loss": 0.9096, "step": 21550 }, { "epoch": 0.76, "learning_rate": 1.982355555555556e-05, "loss": 0.7899, "step": 21600 }, { "epoch": 0.76, "learning_rate": 1.9818000000000002e-05, "loss": 0.8887, "step": 21650 }, { "epoch": 0.76, "learning_rate": 1.9812444444444446e-05, "loss": 0.8577, "step": 21700 }, { "epoch": 0.77, "learning_rate": 1.980688888888889e-05, "loss": 0.8657, "step": 21750 }, { "epoch": 0.77, "learning_rate": 1.9801333333333333e-05, "loss": 0.846, "step": 21800 }, { "epoch": 0.77, "learning_rate": 1.979577777777778e-05, "loss": 0.8466, "step": 21850 }, { "epoch": 0.77, "learning_rate": 1.9790222222222224e-05, "loss": 0.8386, "step": 21900 }, { "epoch": 0.77, "learning_rate": 1.9784666666666667e-05, "loss": 0.8781, "step": 21950 }, { "epoch": 0.77, "learning_rate": 1.9779111111111114e-05, "loss": 0.9386, "step": 22000 }, { "epoch": 0.78, "learning_rate": 1.9773555555555558e-05, "loss": 0.8045, "step": 22050 }, { "epoch": 0.78, "learning_rate": 1.9768e-05, "loss": 0.8062, "step": 22100 }, { "epoch": 0.78, "learning_rate": 1.9762444444444445e-05, "loss": 0.8461, "step": 22150 }, { "epoch": 0.78, "learning_rate": 1.9756888888888888e-05, "loss": 0.8277, "step": 22200 }, { "epoch": 0.78, "learning_rate": 1.9751333333333335e-05, "loss": 0.9021, "step": 22250 }, { "epoch": 0.79, "learning_rate": 1.974577777777778e-05, "loss": 0.8154, "step": 22300 }, { "epoch": 0.79, "learning_rate": 1.9740222222222222e-05, "loss": 0.8667, "step": 22350 }, { "epoch": 0.79, "learning_rate": 1.973466666666667e-05, "loss": 0.8318, "step": 22400 }, { "epoch": 0.79, "learning_rate": 1.9729111111111113e-05, "loss": 0.8004, "step": 22450 }, { "epoch": 0.79, "learning_rate": 1.9723555555555556e-05, "loss": 0.8123, "step": 22500 }, { "epoch": 0.79, "eval_loss": 0.4794025719165802, "eval_runtime": 15.6813, "eval_samples_per_second": 90.554, "eval_steps_per_second": 5.676, "eval_wer": 0.38295361713715165, "step": 22500 }, { "epoch": 0.79, "learning_rate": 1.9718e-05, "loss": 0.7866, "step": 22550 }, { "epoch": 0.8, "learning_rate": 1.9712444444444443e-05, "loss": 0.8931, "step": 22600 }, { "epoch": 0.8, "learning_rate": 1.970688888888889e-05, "loss": 0.84, "step": 22650 }, { "epoch": 0.8, "learning_rate": 1.9701333333333334e-05, "loss": 0.9195, "step": 22700 }, { "epoch": 0.8, "learning_rate": 1.969577777777778e-05, "loss": 0.8629, "step": 22750 }, { "epoch": 0.8, "learning_rate": 1.9690222222222224e-05, "loss": 0.8154, "step": 22800 }, { "epoch": 0.8, "learning_rate": 1.9684666666666668e-05, "loss": 0.7755, "step": 22850 }, { "epoch": 0.81, "learning_rate": 1.967911111111111e-05, "loss": 0.905, "step": 22900 }, { "epoch": 0.81, "learning_rate": 1.9673555555555555e-05, "loss": 0.7548, "step": 22950 }, { "epoch": 0.81, "learning_rate": 1.9668000000000002e-05, "loss": 0.8041, "step": 23000 }, { "epoch": 0.81, "learning_rate": 1.9662444444444446e-05, "loss": 0.7988, "step": 23050 }, { "epoch": 0.81, "learning_rate": 1.965688888888889e-05, "loss": 0.8187, "step": 23100 }, { "epoch": 0.82, "learning_rate": 1.9651333333333336e-05, "loss": 0.8269, "step": 23150 }, { "epoch": 0.82, "learning_rate": 1.964577777777778e-05, "loss": 0.8079, "step": 23200 }, { "epoch": 0.82, "learning_rate": 1.9640222222222223e-05, "loss": 0.7726, "step": 23250 }, { "epoch": 0.82, "learning_rate": 1.963466666666667e-05, "loss": 0.8316, "step": 23300 }, { "epoch": 0.82, "learning_rate": 1.9629111111111114e-05, "loss": 0.8028, "step": 23350 }, { "epoch": 0.82, "learning_rate": 1.9623555555555557e-05, "loss": 0.8065, "step": 23400 }, { "epoch": 0.83, "learning_rate": 1.9618e-05, "loss": 0.7815, "step": 23450 }, { "epoch": 0.83, "learning_rate": 1.9612444444444444e-05, "loss": 0.7324, "step": 23500 }, { "epoch": 0.83, "learning_rate": 1.960688888888889e-05, "loss": 0.7558, "step": 23550 }, { "epoch": 0.83, "learning_rate": 1.9601333333333335e-05, "loss": 0.7784, "step": 23600 }, { "epoch": 0.83, "learning_rate": 1.9595777777777782e-05, "loss": 0.8073, "step": 23650 }, { "epoch": 0.83, "learning_rate": 1.9590222222222225e-05, "loss": 0.7704, "step": 23700 }, { "epoch": 0.84, "learning_rate": 1.958466666666667e-05, "loss": 0.7705, "step": 23750 }, { "epoch": 0.84, "learning_rate": 1.9579111111111113e-05, "loss": 0.748, "step": 23800 }, { "epoch": 0.84, "learning_rate": 1.9573555555555556e-05, "loss": 0.7521, "step": 23850 }, { "epoch": 0.84, "learning_rate": 1.9568000000000003e-05, "loss": 0.7704, "step": 23900 }, { "epoch": 0.84, "learning_rate": 1.9562444444444447e-05, "loss": 0.7418, "step": 23950 }, { "epoch": 0.85, "learning_rate": 1.955688888888889e-05, "loss": 0.7817, "step": 24000 }, { "epoch": 0.85, "learning_rate": 1.9551333333333337e-05, "loss": 0.7784, "step": 24050 }, { "epoch": 0.85, "learning_rate": 1.954577777777778e-05, "loss": 0.7747, "step": 24100 }, { "epoch": 0.85, "learning_rate": 1.9540222222222224e-05, "loss": 0.7535, "step": 24150 }, { "epoch": 0.85, "learning_rate": 1.9534666666666668e-05, "loss": 0.729, "step": 24200 }, { "epoch": 0.85, "learning_rate": 1.952911111111111e-05, "loss": 0.7675, "step": 24250 }, { "epoch": 0.86, "learning_rate": 1.9523555555555558e-05, "loss": 0.7447, "step": 24300 }, { "epoch": 0.86, "learning_rate": 1.9518000000000002e-05, "loss": 0.7853, "step": 24350 }, { "epoch": 0.86, "learning_rate": 1.9512555555555558e-05, "loss": 0.8753, "step": 24400 }, { "epoch": 0.86, "learning_rate": 1.9507e-05, "loss": 0.7518, "step": 24450 }, { "epoch": 0.86, "learning_rate": 1.9501444444444445e-05, "loss": 0.7638, "step": 24500 }, { "epoch": 0.86, "learning_rate": 1.949588888888889e-05, "loss": 0.7369, "step": 24550 }, { "epoch": 0.87, "learning_rate": 1.9490333333333336e-05, "loss": 0.7608, "step": 24600 }, { "epoch": 0.87, "learning_rate": 1.948477777777778e-05, "loss": 0.751, "step": 24650 }, { "epoch": 0.87, "learning_rate": 1.9479222222222226e-05, "loss": 0.8074, "step": 24700 }, { "epoch": 0.87, "learning_rate": 1.947366666666667e-05, "loss": 0.7591, "step": 24750 }, { "epoch": 0.87, "learning_rate": 1.9468111111111113e-05, "loss": 0.7645, "step": 24800 }, { "epoch": 0.87, "learning_rate": 1.9462555555555557e-05, "loss": 0.7599, "step": 24850 }, { "epoch": 0.88, "learning_rate": 1.9457e-05, "loss": 0.7833, "step": 24900 }, { "epoch": 0.88, "learning_rate": 1.9451444444444444e-05, "loss": 0.702, "step": 24950 }, { "epoch": 0.88, "learning_rate": 1.944588888888889e-05, "loss": 0.7568, "step": 25000 }, { "epoch": 0.88, "eval_loss": 0.4369264543056488, "eval_runtime": 56.0009, "eval_samples_per_second": 25.357, "eval_steps_per_second": 1.589, "eval_wer": 0.34628301715530546, "step": 25000 }, { "epoch": 0.88, "learning_rate": 1.9440333333333334e-05, "loss": 0.7389, "step": 25050 }, { "epoch": 0.88, "learning_rate": 1.943477777777778e-05, "loss": 0.768, "step": 25100 }, { "epoch": 0.89, "learning_rate": 1.9429222222222225e-05, "loss": 0.7999, "step": 25150 }, { "epoch": 0.89, "learning_rate": 1.942366666666667e-05, "loss": 0.7428, "step": 25200 }, { "epoch": 0.89, "learning_rate": 1.9418111111111112e-05, "loss": 0.7931, "step": 25250 }, { "epoch": 0.89, "learning_rate": 1.9412555555555555e-05, "loss": 0.7383, "step": 25300 }, { "epoch": 0.89, "learning_rate": 1.9407000000000002e-05, "loss": 0.7314, "step": 25350 }, { "epoch": 0.89, "learning_rate": 1.9401444444444446e-05, "loss": 0.7201, "step": 25400 }, { "epoch": 0.9, "learning_rate": 1.939588888888889e-05, "loss": 0.7923, "step": 25450 }, { "epoch": 0.9, "learning_rate": 1.9390333333333336e-05, "loss": 0.7446, "step": 25500 }, { "epoch": 0.9, "learning_rate": 1.938477777777778e-05, "loss": 1.1439, "step": 25550 }, { "epoch": 0.9, "learning_rate": 1.9379222222222224e-05, "loss": 0.8822, "step": 25600 }, { "epoch": 0.9, "learning_rate": 1.9373666666666667e-05, "loss": 0.7527, "step": 25650 }, { "epoch": 0.9, "learning_rate": 1.936811111111111e-05, "loss": 1.0362, "step": 25700 }, { "epoch": 0.91, "learning_rate": 1.9362555555555558e-05, "loss": 0.7212, "step": 25750 }, { "epoch": 0.91, "learning_rate": 1.9357e-05, "loss": 0.7722, "step": 25800 }, { "epoch": 0.91, "learning_rate": 1.9351444444444445e-05, "loss": 0.7685, "step": 25850 }, { "epoch": 0.91, "learning_rate": 1.934588888888889e-05, "loss": 0.7285, "step": 25900 }, { "epoch": 0.91, "learning_rate": 1.9340333333333335e-05, "loss": 0.769, "step": 25950 }, { "epoch": 0.92, "learning_rate": 1.933477777777778e-05, "loss": 0.7076, "step": 26000 }, { "epoch": 0.92, "learning_rate": 1.9329222222222222e-05, "loss": 0.705, "step": 26050 }, { "epoch": 0.92, "learning_rate": 1.9323666666666666e-05, "loss": 0.7872, "step": 26100 }, { "epoch": 0.92, "learning_rate": 1.9318111111111113e-05, "loss": 0.7334, "step": 26150 }, { "epoch": 0.92, "learning_rate": 1.9312555555555556e-05, "loss": 0.7255, "step": 26200 }, { "epoch": 0.92, "learning_rate": 1.9307000000000003e-05, "loss": 0.7109, "step": 26250 }, { "epoch": 0.93, "learning_rate": 1.9301444444444447e-05, "loss": 0.7008, "step": 26300 }, { "epoch": 0.93, "learning_rate": 1.929588888888889e-05, "loss": 0.994, "step": 26350 }, { "epoch": 0.93, "learning_rate": 1.9290333333333334e-05, "loss": 0.7608, "step": 26400 }, { "epoch": 0.93, "learning_rate": 1.9284777777777778e-05, "loss": 0.6991, "step": 26450 }, { "epoch": 0.93, "learning_rate": 1.9279222222222225e-05, "loss": 0.7236, "step": 26500 }, { "epoch": 0.93, "learning_rate": 1.9273666666666668e-05, "loss": 0.7109, "step": 26550 }, { "epoch": 0.94, "learning_rate": 1.9268222222222224e-05, "loss": 0.9335, "step": 26600 }, { "epoch": 0.94, "learning_rate": 1.9262666666666668e-05, "loss": 0.7389, "step": 26650 }, { "epoch": 0.94, "learning_rate": 1.9257111111111115e-05, "loss": 0.7394, "step": 26700 }, { "epoch": 0.94, "learning_rate": 1.9251666666666667e-05, "loss": 0.9309, "step": 26750 }, { "epoch": 0.94, "learning_rate": 1.924611111111111e-05, "loss": 0.7499, "step": 26800 }, { "epoch": 0.95, "learning_rate": 1.9240555555555558e-05, "loss": 0.7206, "step": 26850 }, { "epoch": 0.95, "learning_rate": 1.9235e-05, "loss": 0.6946, "step": 26900 }, { "epoch": 0.95, "learning_rate": 1.9229444444444445e-05, "loss": 0.7085, "step": 26950 }, { "epoch": 0.95, "learning_rate": 1.9223888888888892e-05, "loss": 0.7331, "step": 27000 }, { "epoch": 0.95, "learning_rate": 1.9218333333333335e-05, "loss": 0.7729, "step": 27050 }, { "epoch": 0.95, "learning_rate": 1.921277777777778e-05, "loss": 0.7521, "step": 27100 }, { "epoch": 0.96, "learning_rate": 1.9207222222222223e-05, "loss": 0.7325, "step": 27150 }, { "epoch": 0.96, "learning_rate": 1.9201666666666666e-05, "loss": 0.6923, "step": 27200 }, { "epoch": 0.96, "learning_rate": 1.9196111111111113e-05, "loss": 0.6878, "step": 27250 }, { "epoch": 0.96, "learning_rate": 1.9190555555555557e-05, "loss": 0.7417, "step": 27300 }, { "epoch": 0.96, "learning_rate": 1.9185000000000004e-05, "loss": 0.7092, "step": 27350 }, { "epoch": 0.96, "learning_rate": 1.9179444444444447e-05, "loss": 0.6721, "step": 27400 }, { "epoch": 0.97, "learning_rate": 1.917388888888889e-05, "loss": 0.6815, "step": 27450 }, { "epoch": 0.97, "learning_rate": 1.9168333333333334e-05, "loss": 0.7182, "step": 27500 }, { "epoch": 0.97, "eval_loss": 0.4110901355743408, "eval_runtime": 12.1151, "eval_samples_per_second": 117.209, "eval_steps_per_second": 7.346, "eval_wer": 0.3288554052827449, "step": 27500 }, { "epoch": 0.97, "learning_rate": 1.9162777777777778e-05, "loss": 0.8661, "step": 27550 }, { "epoch": 0.97, "learning_rate": 1.9157222222222225e-05, "loss": 0.6766, "step": 27600 }, { "epoch": 0.97, "learning_rate": 1.9151666666666668e-05, "loss": 0.7034, "step": 27650 }, { "epoch": 0.98, "learning_rate": 1.9146111111111112e-05, "loss": 0.7151, "step": 27700 }, { "epoch": 0.98, "learning_rate": 1.914055555555556e-05, "loss": 0.6869, "step": 27750 }, { "epoch": 0.98, "learning_rate": 1.9135000000000002e-05, "loss": 0.7513, "step": 27800 }, { "epoch": 0.98, "learning_rate": 1.9129444444444446e-05, "loss": 0.7039, "step": 27850 }, { "epoch": 0.98, "learning_rate": 1.912388888888889e-05, "loss": 0.6709, "step": 27900 }, { "epoch": 0.98, "learning_rate": 1.9118333333333333e-05, "loss": 0.7034, "step": 27950 }, { "epoch": 0.99, "learning_rate": 1.911277777777778e-05, "loss": 0.6856, "step": 28000 }, { "epoch": 0.99, "learning_rate": 1.9107222222222223e-05, "loss": 0.7096, "step": 28050 }, { "epoch": 0.99, "learning_rate": 1.9101666666666667e-05, "loss": 0.8148, "step": 28100 }, { "epoch": 0.99, "learning_rate": 1.9096111111111114e-05, "loss": 0.7227, "step": 28150 }, { "epoch": 0.99, "learning_rate": 1.9090555555555558e-05, "loss": 0.6732, "step": 28200 }, { "epoch": 0.99, "learning_rate": 1.9085e-05, "loss": 0.7195, "step": 28250 }, { "epoch": 1.0, "learning_rate": 1.9079444444444445e-05, "loss": 0.899, "step": 28300 }, { "epoch": 1.0, "learning_rate": 1.9073888888888888e-05, "loss": 0.6964, "step": 28350 }, { "epoch": 1.0, "learning_rate": 1.9068333333333335e-05, "loss": 0.7364, "step": 28400 }, { "epoch": 1.0, "learning_rate": 1.906277777777778e-05, "loss": 0.8452, "step": 28450 }, { "epoch": 1.0, "learning_rate": 1.9057222222222226e-05, "loss": 0.771, "step": 28500 }, { "epoch": 1.01, "learning_rate": 1.905166666666667e-05, "loss": 0.6508, "step": 28550 }, { "epoch": 1.01, "learning_rate": 1.9046111111111113e-05, "loss": 0.6883, "step": 28600 }, { "epoch": 1.01, "learning_rate": 1.9040555555555556e-05, "loss": 0.6595, "step": 28650 }, { "epoch": 1.01, "learning_rate": 1.9035e-05, "loss": 0.9459, "step": 28700 }, { "epoch": 1.01, "learning_rate": 1.9029444444444447e-05, "loss": 0.6745, "step": 28750 }, { "epoch": 1.01, "learning_rate": 1.902388888888889e-05, "loss": 0.79, "step": 28800 }, { "epoch": 1.02, "learning_rate": 1.9018333333333334e-05, "loss": 0.7138, "step": 28850 }, { "epoch": 1.02, "learning_rate": 1.901277777777778e-05, "loss": 0.7185, "step": 28900 }, { "epoch": 1.02, "learning_rate": 1.9007222222222224e-05, "loss": 0.6834, "step": 28950 }, { "epoch": 1.02, "learning_rate": 1.9001666666666668e-05, "loss": 0.7206, "step": 29000 }, { "epoch": 1.02, "learning_rate": 1.899611111111111e-05, "loss": 0.6949, "step": 29050 }, { "epoch": 1.02, "learning_rate": 1.8990555555555555e-05, "loss": 0.702, "step": 29100 }, { "epoch": 1.03, "learning_rate": 1.8985000000000002e-05, "loss": 0.6561, "step": 29150 }, { "epoch": 1.03, "learning_rate": 1.8979444444444446e-05, "loss": 0.6816, "step": 29200 }, { "epoch": 1.03, "learning_rate": 1.897388888888889e-05, "loss": 0.6899, "step": 29250 }, { "epoch": 1.03, "learning_rate": 1.8968333333333336e-05, "loss": 0.6952, "step": 29300 }, { "epoch": 1.03, "learning_rate": 1.896277777777778e-05, "loss": 0.708, "step": 29350 }, { "epoch": 1.04, "learning_rate": 1.8957222222222223e-05, "loss": 0.651, "step": 29400 }, { "epoch": 1.04, "learning_rate": 1.8951666666666667e-05, "loss": 0.6675, "step": 29450 }, { "epoch": 1.04, "learning_rate": 1.894611111111111e-05, "loss": 0.7116, "step": 29500 }, { "epoch": 1.04, "learning_rate": 1.8940555555555557e-05, "loss": 0.6723, "step": 29550 }, { "epoch": 1.04, "learning_rate": 1.8935e-05, "loss": 0.7197, "step": 29600 }, { "epoch": 1.04, "learning_rate": 1.8929444444444448e-05, "loss": 0.6777, "step": 29650 }, { "epoch": 1.05, "learning_rate": 1.892388888888889e-05, "loss": 0.7371, "step": 29700 }, { "epoch": 1.05, "learning_rate": 1.8918333333333335e-05, "loss": 0.6782, "step": 29750 }, { "epoch": 1.05, "learning_rate": 1.891277777777778e-05, "loss": 0.6672, "step": 29800 }, { "epoch": 1.05, "learning_rate": 1.8907222222222222e-05, "loss": 0.9266, "step": 29850 }, { "epoch": 1.05, "learning_rate": 1.890166666666667e-05, "loss": 0.7792, "step": 29900 }, { "epoch": 1.05, "learning_rate": 1.8896111111111112e-05, "loss": 0.6567, "step": 29950 }, { "epoch": 1.06, "learning_rate": 1.8890555555555556e-05, "loss": 0.6896, "step": 30000 }, { "epoch": 1.06, "eval_loss": 0.40406399965286255, "eval_runtime": 23.7102, "eval_samples_per_second": 59.89, "eval_steps_per_second": 3.754, "eval_wer": 0.3101570300444767, "step": 30000 }, { "epoch": 1.06, "learning_rate": 1.8885000000000003e-05, "loss": 0.6665, "step": 30050 }, { "epoch": 1.06, "learning_rate": 1.8879444444444447e-05, "loss": 0.6987, "step": 30100 }, { "epoch": 1.06, "learning_rate": 1.887388888888889e-05, "loss": 0.7226, "step": 30150 }, { "epoch": 1.06, "learning_rate": 1.8868333333333334e-05, "loss": 0.684, "step": 30200 }, { "epoch": 1.07, "learning_rate": 1.8862777777777777e-05, "loss": 0.6577, "step": 30250 }, { "epoch": 1.07, "learning_rate": 1.8857222222222224e-05, "loss": 0.6901, "step": 30300 }, { "epoch": 1.07, "learning_rate": 1.8851666666666668e-05, "loss": 0.6761, "step": 30350 }, { "epoch": 1.07, "learning_rate": 1.884611111111111e-05, "loss": 0.6749, "step": 30400 }, { "epoch": 1.07, "learning_rate": 1.8840555555555558e-05, "loss": 0.7069, "step": 30450 }, { "epoch": 1.07, "learning_rate": 1.8835000000000002e-05, "loss": 0.6678, "step": 30500 }, { "epoch": 1.08, "learning_rate": 1.8829444444444445e-05, "loss": 0.6614, "step": 30550 }, { "epoch": 1.08, "learning_rate": 1.882388888888889e-05, "loss": 0.6746, "step": 30600 }, { "epoch": 1.08, "learning_rate": 1.8818333333333332e-05, "loss": 0.6585, "step": 30650 }, { "epoch": 1.08, "learning_rate": 1.881277777777778e-05, "loss": 0.6507, "step": 30700 }, { "epoch": 1.08, "learning_rate": 1.8807222222222223e-05, "loss": 0.6672, "step": 30750 }, { "epoch": 1.08, "learning_rate": 1.880166666666667e-05, "loss": 0.8374, "step": 30800 }, { "epoch": 1.09, "learning_rate": 1.8796111111111113e-05, "loss": 0.6423, "step": 30850 }, { "epoch": 1.09, "learning_rate": 1.8790555555555557e-05, "loss": 0.6604, "step": 30900 }, { "epoch": 1.09, "learning_rate": 1.8785e-05, "loss": 0.73, "step": 30950 }, { "epoch": 1.09, "learning_rate": 1.8779444444444444e-05, "loss": 0.6563, "step": 31000 }, { "epoch": 1.09, "learning_rate": 1.877388888888889e-05, "loss": 0.7497, "step": 31050 }, { "epoch": 1.09, "learning_rate": 1.8768333333333335e-05, "loss": 0.6737, "step": 31100 }, { "epoch": 1.1, "learning_rate": 1.8762777777777778e-05, "loss": 0.6566, "step": 31150 }, { "epoch": 1.1, "learning_rate": 1.8757222222222225e-05, "loss": 0.6512, "step": 31200 }, { "epoch": 1.1, "learning_rate": 1.875166666666667e-05, "loss": 0.6747, "step": 31250 }, { "epoch": 1.1, "learning_rate": 1.8746111111111112e-05, "loss": 0.7623, "step": 31300 }, { "epoch": 1.1, "learning_rate": 1.8740555555555556e-05, "loss": 0.6491, "step": 31350 }, { "epoch": 1.11, "learning_rate": 1.8735e-05, "loss": 0.6406, "step": 31400 }, { "epoch": 1.11, "learning_rate": 1.8729444444444446e-05, "loss": 0.6285, "step": 31450 }, { "epoch": 1.11, "learning_rate": 1.872388888888889e-05, "loss": 0.6393, "step": 31500 }, { "epoch": 1.11, "learning_rate": 1.8718333333333333e-05, "loss": 0.6708, "step": 31550 }, { "epoch": 1.11, "learning_rate": 1.871277777777778e-05, "loss": 0.6393, "step": 31600 }, { "epoch": 1.11, "learning_rate": 1.8707222222222224e-05, "loss": 0.6533, "step": 31650 }, { "epoch": 1.12, "learning_rate": 1.8701666666666667e-05, "loss": 0.6819, "step": 31700 }, { "epoch": 1.12, "learning_rate": 1.869611111111111e-05, "loss": 0.6689, "step": 31750 }, { "epoch": 1.12, "learning_rate": 1.8690555555555555e-05, "loss": 0.6667, "step": 31800 }, { "epoch": 1.12, "learning_rate": 1.8685e-05, "loss": 0.628, "step": 31850 }, { "epoch": 1.12, "learning_rate": 1.8679444444444445e-05, "loss": 0.6403, "step": 31900 }, { "epoch": 1.12, "learning_rate": 1.8673888888888892e-05, "loss": 0.6979, "step": 31950 }, { "epoch": 1.13, "learning_rate": 1.8668333333333336e-05, "loss": 0.6403, "step": 32000 }, { "epoch": 1.13, "learning_rate": 1.866277777777778e-05, "loss": 0.6496, "step": 32050 }, { "epoch": 1.13, "learning_rate": 1.8657222222222223e-05, "loss": 0.6214, "step": 32100 }, { "epoch": 1.13, "learning_rate": 1.8651666666666666e-05, "loss": 0.6675, "step": 32150 }, { "epoch": 1.13, "learning_rate": 1.8646111111111113e-05, "loss": 0.6597, "step": 32200 }, { "epoch": 1.14, "learning_rate": 1.8640555555555557e-05, "loss": 0.669, "step": 32250 }, { "epoch": 1.14, "learning_rate": 1.8635e-05, "loss": 0.6799, "step": 32300 }, { "epoch": 1.14, "learning_rate": 1.8629444444444447e-05, "loss": 0.6637, "step": 32350 }, { "epoch": 1.14, "learning_rate": 1.8624000000000003e-05, "loss": 0.9309, "step": 32400 }, { "epoch": 1.14, "learning_rate": 1.8618444444444447e-05, "loss": 0.6376, "step": 32450 }, { "epoch": 1.14, "learning_rate": 1.861288888888889e-05, "loss": 0.6655, "step": 32500 }, { "epoch": 1.14, "eval_loss": 0.39331158995628357, "eval_runtime": 69.3417, "eval_samples_per_second": 20.478, "eval_steps_per_second": 1.283, "eval_wer": 0.29862939094127255, "step": 32500 }, { "epoch": 1.15, "learning_rate": 1.8607333333333334e-05, "loss": 0.733, "step": 32550 }, { "epoch": 1.15, "learning_rate": 1.8601777777777778e-05, "loss": 0.6592, "step": 32600 }, { "epoch": 1.15, "learning_rate": 1.8596222222222224e-05, "loss": 0.6435, "step": 32650 }, { "epoch": 1.15, "learning_rate": 1.8590666666666668e-05, "loss": 0.6445, "step": 32700 }, { "epoch": 1.15, "learning_rate": 1.858511111111111e-05, "loss": 0.6367, "step": 32750 }, { "epoch": 1.15, "learning_rate": 1.857955555555556e-05, "loss": 0.6593, "step": 32800 }, { "epoch": 1.16, "learning_rate": 1.8574000000000002e-05, "loss": 0.6952, "step": 32850 }, { "epoch": 1.16, "learning_rate": 1.8568444444444446e-05, "loss": 0.8381, "step": 32900 }, { "epoch": 1.16, "learning_rate": 1.856288888888889e-05, "loss": 0.6635, "step": 32950 }, { "epoch": 1.16, "learning_rate": 1.8557333333333333e-05, "loss": 0.6231, "step": 33000 }, { "epoch": 1.16, "learning_rate": 1.855177777777778e-05, "loss": 0.635, "step": 33050 }, { "epoch": 1.17, "learning_rate": 1.8546222222222223e-05, "loss": 0.6579, "step": 33100 }, { "epoch": 1.17, "learning_rate": 1.854066666666667e-05, "loss": 0.6708, "step": 33150 }, { "epoch": 1.17, "learning_rate": 1.8535111111111114e-05, "loss": 0.6603, "step": 33200 }, { "epoch": 1.17, "learning_rate": 1.8529555555555557e-05, "loss": 0.6644, "step": 33250 }, { "epoch": 1.17, "learning_rate": 1.8524e-05, "loss": 0.6091, "step": 33300 }, { "epoch": 1.17, "learning_rate": 1.8518444444444444e-05, "loss": 0.6539, "step": 33350 }, { "epoch": 1.18, "learning_rate": 1.851288888888889e-05, "loss": 0.6823, "step": 33400 }, { "epoch": 1.18, "learning_rate": 1.8507333333333335e-05, "loss": 0.6351, "step": 33450 }, { "epoch": 1.18, "learning_rate": 1.850177777777778e-05, "loss": 0.6163, "step": 33500 }, { "epoch": 1.18, "learning_rate": 1.8496222222222225e-05, "loss": 0.6693, "step": 33550 }, { "epoch": 1.18, "learning_rate": 1.849066666666667e-05, "loss": 0.6525, "step": 33600 }, { "epoch": 1.18, "learning_rate": 1.8485111111111113e-05, "loss": 0.6617, "step": 33650 }, { "epoch": 1.19, "learning_rate": 1.8479555555555556e-05, "loss": 0.6538, "step": 33700 }, { "epoch": 1.19, "learning_rate": 1.8474e-05, "loss": 0.6835, "step": 33750 }, { "epoch": 1.19, "learning_rate": 1.8468444444444447e-05, "loss": 0.667, "step": 33800 }, { "epoch": 1.19, "learning_rate": 1.846288888888889e-05, "loss": 0.7598, "step": 33850 }, { "epoch": 1.19, "learning_rate": 1.8457333333333334e-05, "loss": 0.6405, "step": 33900 }, { "epoch": 1.2, "learning_rate": 1.845177777777778e-05, "loss": 0.7015, "step": 33950 }, { "epoch": 1.2, "learning_rate": 1.8446222222222224e-05, "loss": 0.6497, "step": 34000 }, { "epoch": 1.2, "learning_rate": 1.8440666666666668e-05, "loss": 0.6038, "step": 34050 }, { "epoch": 1.2, "learning_rate": 1.843511111111111e-05, "loss": 0.6079, "step": 34100 }, { "epoch": 1.2, "learning_rate": 1.8429555555555555e-05, "loss": 0.7111, "step": 34150 }, { "epoch": 1.2, "learning_rate": 1.8424000000000002e-05, "loss": 0.6195, "step": 34200 }, { "epoch": 1.21, "learning_rate": 1.8418444444444445e-05, "loss": 0.6638, "step": 34250 }, { "epoch": 1.21, "learning_rate": 1.8412888888888892e-05, "loss": 0.6407, "step": 34300 }, { "epoch": 1.21, "learning_rate": 1.8407333333333336e-05, "loss": 0.6182, "step": 34350 }, { "epoch": 1.21, "learning_rate": 1.840177777777778e-05, "loss": 0.6237, "step": 34400 }, { "epoch": 1.21, "learning_rate": 1.8396222222222223e-05, "loss": 0.621, "step": 34450 }, { "epoch": 1.21, "learning_rate": 1.8390666666666667e-05, "loss": 0.607, "step": 34500 }, { "epoch": 1.22, "learning_rate": 1.8385111111111113e-05, "loss": 0.6372, "step": 34550 }, { "epoch": 1.22, "learning_rate": 1.8379555555555557e-05, "loss": 0.6549, "step": 34600 }, { "epoch": 1.22, "learning_rate": 1.8374e-05, "loss": 0.646, "step": 34650 }, { "epoch": 1.22, "learning_rate": 1.8368444444444448e-05, "loss": 0.6534, "step": 34700 }, { "epoch": 1.22, "learning_rate": 1.836288888888889e-05, "loss": 0.6403, "step": 34750 }, { "epoch": 1.23, "learning_rate": 1.8357444444444447e-05, "loss": 0.7818, "step": 34800 }, { "epoch": 1.23, "learning_rate": 1.835188888888889e-05, "loss": 0.704, "step": 34850 }, { "epoch": 1.23, "learning_rate": 1.8346333333333334e-05, "loss": 0.625, "step": 34900 }, { "epoch": 1.23, "learning_rate": 1.8340777777777778e-05, "loss": 0.658, "step": 34950 }, { "epoch": 1.23, "learning_rate": 1.8335222222222225e-05, "loss": 0.5738, "step": 35000 }, { "epoch": 1.23, "eval_loss": 0.36759084463119507, "eval_runtime": 33.2692, "eval_samples_per_second": 42.682, "eval_steps_per_second": 2.675, "eval_wer": 0.2829263864936008, "step": 35000 }, { "epoch": 1.23, "learning_rate": 1.832966666666667e-05, "loss": 0.7566, "step": 35050 }, { "epoch": 1.24, "learning_rate": 1.8324111111111115e-05, "loss": 0.6565, "step": 35100 }, { "epoch": 1.24, "learning_rate": 1.831855555555556e-05, "loss": 0.6429, "step": 35150 }, { "epoch": 1.24, "learning_rate": 1.8313000000000002e-05, "loss": 0.6209, "step": 35200 }, { "epoch": 1.24, "learning_rate": 1.8307444444444446e-05, "loss": 0.8319, "step": 35250 }, { "epoch": 1.24, "learning_rate": 1.830188888888889e-05, "loss": 0.6354, "step": 35300 }, { "epoch": 1.24, "learning_rate": 1.8296333333333333e-05, "loss": 0.6098, "step": 35350 }, { "epoch": 1.25, "learning_rate": 1.829077777777778e-05, "loss": 0.7195, "step": 35400 }, { "epoch": 1.25, "learning_rate": 1.8285222222222224e-05, "loss": 0.7081, "step": 35450 }, { "epoch": 1.25, "learning_rate": 1.827966666666667e-05, "loss": 0.6266, "step": 35500 }, { "epoch": 1.25, "learning_rate": 1.8274111111111114e-05, "loss": 0.6272, "step": 35550 }, { "epoch": 1.25, "learning_rate": 1.8268555555555558e-05, "loss": 0.6026, "step": 35600 }, { "epoch": 1.26, "learning_rate": 1.8263e-05, "loss": 0.6498, "step": 35650 }, { "epoch": 1.26, "learning_rate": 1.8257444444444445e-05, "loss": 0.6604, "step": 35700 }, { "epoch": 1.26, "learning_rate": 1.825188888888889e-05, "loss": 0.6309, "step": 35750 }, { "epoch": 1.26, "learning_rate": 1.8246333333333335e-05, "loss": 0.6096, "step": 35800 }, { "epoch": 1.26, "learning_rate": 1.824077777777778e-05, "loss": 0.6967, "step": 35850 }, { "epoch": 1.26, "learning_rate": 1.8235222222222226e-05, "loss": 0.6085, "step": 35900 }, { "epoch": 1.27, "learning_rate": 1.822966666666667e-05, "loss": 0.6093, "step": 35950 }, { "epoch": 1.27, "learning_rate": 1.8224111111111113e-05, "loss": 0.6309, "step": 36000 }, { "epoch": 1.27, "learning_rate": 1.8218555555555556e-05, "loss": 0.6217, "step": 36050 }, { "epoch": 1.27, "learning_rate": 1.8213e-05, "loss": 0.6016, "step": 36100 }, { "epoch": 1.27, "learning_rate": 1.8207444444444447e-05, "loss": 0.5993, "step": 36150 }, { "epoch": 1.27, "learning_rate": 1.820188888888889e-05, "loss": 0.6068, "step": 36200 }, { "epoch": 1.28, "learning_rate": 1.8196333333333337e-05, "loss": 0.602, "step": 36250 }, { "epoch": 1.28, "learning_rate": 1.819077777777778e-05, "loss": 0.63, "step": 36300 }, { "epoch": 1.28, "learning_rate": 1.8185222222222225e-05, "loss": 0.609, "step": 36350 }, { "epoch": 1.28, "learning_rate": 1.8179666666666668e-05, "loss": 0.6174, "step": 36400 }, { "epoch": 1.28, "learning_rate": 1.817411111111111e-05, "loss": 0.5986, "step": 36450 }, { "epoch": 1.29, "learning_rate": 1.8168555555555555e-05, "loss": 0.6095, "step": 36500 }, { "epoch": 1.29, "learning_rate": 1.8163000000000002e-05, "loss": 0.6871, "step": 36550 }, { "epoch": 1.29, "learning_rate": 1.8157444444444446e-05, "loss": 0.6174, "step": 36600 }, { "epoch": 1.29, "learning_rate": 1.8151888888888893e-05, "loss": 0.5797, "step": 36650 }, { "epoch": 1.29, "learning_rate": 1.8146333333333336e-05, "loss": 0.6224, "step": 36700 }, { "epoch": 1.29, "learning_rate": 1.814088888888889e-05, "loss": 0.718, "step": 36750 }, { "epoch": 1.3, "learning_rate": 1.8135333333333336e-05, "loss": 0.6352, "step": 36800 }, { "epoch": 1.3, "learning_rate": 1.812977777777778e-05, "loss": 0.619, "step": 36850 }, { "epoch": 1.3, "learning_rate": 1.8124222222222223e-05, "loss": 0.6404, "step": 36900 }, { "epoch": 1.3, "learning_rate": 1.811866666666667e-05, "loss": 0.6073, "step": 36950 }, { "epoch": 1.3, "learning_rate": 1.8113111111111113e-05, "loss": 0.6047, "step": 37000 }, { "epoch": 1.3, "learning_rate": 1.8107555555555557e-05, "loss": 0.6496, "step": 37050 }, { "epoch": 1.31, "learning_rate": 1.8102e-05, "loss": 0.7041, "step": 37100 }, { "epoch": 1.31, "learning_rate": 1.8096444444444444e-05, "loss": 0.638, "step": 37150 }, { "epoch": 1.31, "learning_rate": 1.809088888888889e-05, "loss": 0.6163, "step": 37200 }, { "epoch": 1.31, "learning_rate": 1.8085333333333335e-05, "loss": 0.6142, "step": 37250 }, { "epoch": 1.31, "learning_rate": 1.8079777777777778e-05, "loss": 0.7264, "step": 37300 }, { "epoch": 1.32, "learning_rate": 1.8074222222222225e-05, "loss": 0.6166, "step": 37350 }, { "epoch": 1.32, "learning_rate": 1.806866666666667e-05, "loss": 0.581, "step": 37400 }, { "epoch": 1.32, "learning_rate": 1.8063111111111112e-05, "loss": 0.6079, "step": 37450 }, { "epoch": 1.32, "learning_rate": 1.8057555555555556e-05, "loss": 0.6361, "step": 37500 }, { "epoch": 1.32, "eval_loss": 0.35325154662132263, "eval_runtime": 11.0683, "eval_samples_per_second": 128.295, "eval_steps_per_second": 8.041, "eval_wer": 0.2726695107561042, "step": 37500 }, { "epoch": 1.32, "learning_rate": 1.8052e-05, "loss": 0.5908, "step": 37550 }, { "epoch": 1.32, "learning_rate": 1.8046444444444446e-05, "loss": 0.7938, "step": 37600 }, { "epoch": 1.33, "learning_rate": 1.804088888888889e-05, "loss": 0.7984, "step": 37650 }, { "epoch": 1.33, "learning_rate": 1.8035333333333337e-05, "loss": 0.5863, "step": 37700 }, { "epoch": 1.33, "learning_rate": 1.802977777777778e-05, "loss": 0.6205, "step": 37750 }, { "epoch": 1.33, "learning_rate": 1.8024222222222224e-05, "loss": 0.6142, "step": 37800 }, { "epoch": 1.33, "learning_rate": 1.8018666666666667e-05, "loss": 0.5872, "step": 37850 }, { "epoch": 1.33, "learning_rate": 1.801311111111111e-05, "loss": 0.686, "step": 37900 }, { "epoch": 1.34, "learning_rate": 1.8007555555555558e-05, "loss": 0.5886, "step": 37950 }, { "epoch": 1.34, "learning_rate": 1.8002e-05, "loss": 0.583, "step": 38000 }, { "epoch": 1.34, "learning_rate": 1.7996444444444445e-05, "loss": 0.6181, "step": 38050 }, { "epoch": 1.34, "learning_rate": 1.7990888888888892e-05, "loss": 0.6093, "step": 38100 }, { "epoch": 1.34, "learning_rate": 1.7985333333333336e-05, "loss": 0.6812, "step": 38150 }, { "epoch": 1.34, "learning_rate": 1.797977777777778e-05, "loss": 0.5821, "step": 38200 }, { "epoch": 1.35, "learning_rate": 1.7974222222222223e-05, "loss": 0.5881, "step": 38250 }, { "epoch": 1.35, "learning_rate": 1.7968666666666666e-05, "loss": 0.6076, "step": 38300 }, { "epoch": 1.35, "learning_rate": 1.7963111111111113e-05, "loss": 0.6506, "step": 38350 }, { "epoch": 1.35, "learning_rate": 1.7957555555555557e-05, "loss": 0.6165, "step": 38400 }, { "epoch": 1.35, "learning_rate": 1.7952e-05, "loss": 0.5791, "step": 38450 }, { "epoch": 1.36, "learning_rate": 1.7946444444444447e-05, "loss": 0.6002, "step": 38500 }, { "epoch": 1.36, "learning_rate": 1.794088888888889e-05, "loss": 0.5807, "step": 38550 }, { "epoch": 1.36, "learning_rate": 1.7935333333333334e-05, "loss": 0.5954, "step": 38600 }, { "epoch": 1.36, "learning_rate": 1.7929777777777778e-05, "loss": 0.6095, "step": 38650 }, { "epoch": 1.36, "learning_rate": 1.792422222222222e-05, "loss": 0.6117, "step": 38700 }, { "epoch": 1.36, "learning_rate": 1.791866666666667e-05, "loss": 0.6242, "step": 38750 }, { "epoch": 1.37, "learning_rate": 1.7913111111111112e-05, "loss": 0.5836, "step": 38800 }, { "epoch": 1.37, "learning_rate": 1.790755555555556e-05, "loss": 0.5781, "step": 38850 }, { "epoch": 1.37, "learning_rate": 1.7902000000000002e-05, "loss": 0.5764, "step": 38900 }, { "epoch": 1.37, "learning_rate": 1.7896444444444446e-05, "loss": 0.6197, "step": 38950 }, { "epoch": 1.37, "learning_rate": 1.789088888888889e-05, "loss": 0.5826, "step": 39000 }, { "epoch": 1.37, "learning_rate": 1.7885333333333333e-05, "loss": 0.7337, "step": 39050 }, { "epoch": 1.38, "learning_rate": 1.787977777777778e-05, "loss": 0.6111, "step": 39100 }, { "epoch": 1.38, "learning_rate": 1.7874222222222224e-05, "loss": 0.6125, "step": 39150 }, { "epoch": 1.38, "learning_rate": 1.7868666666666667e-05, "loss": 0.6158, "step": 39200 }, { "epoch": 1.38, "learning_rate": 1.7863111111111114e-05, "loss": 0.6028, "step": 39250 }, { "epoch": 1.38, "learning_rate": 1.7857555555555558e-05, "loss": 0.5979, "step": 39300 }, { "epoch": 1.39, "learning_rate": 1.7852e-05, "loss": 0.5951, "step": 39350 }, { "epoch": 1.39, "learning_rate": 1.7846444444444445e-05, "loss": 0.5782, "step": 39400 }, { "epoch": 1.39, "learning_rate": 1.784088888888889e-05, "loss": 0.6052, "step": 39450 }, { "epoch": 1.39, "learning_rate": 1.7835333333333335e-05, "loss": 0.6236, "step": 39500 }, { "epoch": 1.39, "learning_rate": 1.782977777777778e-05, "loss": 0.5699, "step": 39550 }, { "epoch": 1.39, "learning_rate": 1.7824222222222222e-05, "loss": 0.7261, "step": 39600 }, { "epoch": 1.4, "learning_rate": 1.781866666666667e-05, "loss": 0.6265, "step": 39650 }, { "epoch": 1.4, "learning_rate": 1.7813111111111113e-05, "loss": 0.5944, "step": 39700 }, { "epoch": 1.4, "learning_rate": 1.7807555555555556e-05, "loss": 0.6069, "step": 39750 }, { "epoch": 1.4, "learning_rate": 1.7802e-05, "loss": 0.6097, "step": 39800 }, { "epoch": 1.4, "learning_rate": 1.7796444444444444e-05, "loss": 0.6155, "step": 39850 }, { "epoch": 1.4, "learning_rate": 1.779088888888889e-05, "loss": 0.6283, "step": 39900 }, { "epoch": 1.41, "learning_rate": 1.7785333333333334e-05, "loss": 0.5707, "step": 39950 }, { "epoch": 1.41, "learning_rate": 1.777977777777778e-05, "loss": 0.6142, "step": 40000 }, { "epoch": 1.41, "eval_loss": 0.3545148968696594, "eval_runtime": 11.9301, "eval_samples_per_second": 119.027, "eval_steps_per_second": 7.46, "eval_wer": 0.27158028501406917, "step": 40000 }, { "epoch": 1.41, "learning_rate": 1.7774222222222225e-05, "loss": 0.6248, "step": 40050 }, { "epoch": 1.41, "learning_rate": 1.7768666666666668e-05, "loss": 0.593, "step": 40100 }, { "epoch": 1.41, "learning_rate": 1.776311111111111e-05, "loss": 0.5962, "step": 40150 }, { "epoch": 1.42, "learning_rate": 1.7757555555555555e-05, "loss": 0.6111, "step": 40200 }, { "epoch": 1.42, "learning_rate": 1.7752e-05, "loss": 0.5936, "step": 40250 }, { "epoch": 1.42, "learning_rate": 1.7746444444444446e-05, "loss": 0.6866, "step": 40300 }, { "epoch": 1.42, "learning_rate": 1.774088888888889e-05, "loss": 0.6549, "step": 40350 }, { "epoch": 1.42, "learning_rate": 1.7735333333333336e-05, "loss": 0.5902, "step": 40400 }, { "epoch": 1.42, "learning_rate": 1.772977777777778e-05, "loss": 0.5755, "step": 40450 }, { "epoch": 1.43, "learning_rate": 1.7724222222222223e-05, "loss": 0.5898, "step": 40500 }, { "epoch": 1.43, "learning_rate": 1.7718666666666667e-05, "loss": 0.5863, "step": 40550 }, { "epoch": 1.43, "learning_rate": 1.771311111111111e-05, "loss": 0.6699, "step": 40600 }, { "epoch": 1.43, "learning_rate": 1.7707555555555557e-05, "loss": 0.5989, "step": 40650 }, { "epoch": 1.43, "learning_rate": 1.7702e-05, "loss": 0.5878, "step": 40700 }, { "epoch": 1.43, "learning_rate": 1.7696444444444444e-05, "loss": 0.6004, "step": 40750 }, { "epoch": 1.44, "learning_rate": 1.769088888888889e-05, "loss": 0.6847, "step": 40800 }, { "epoch": 1.44, "learning_rate": 1.7685333333333335e-05, "loss": 0.7376, "step": 40850 }, { "epoch": 1.44, "learning_rate": 1.767977777777778e-05, "loss": 0.6027, "step": 40900 }, { "epoch": 1.44, "learning_rate": 1.7674333333333335e-05, "loss": 0.672, "step": 40950 }, { "epoch": 1.44, "learning_rate": 1.7668777777777778e-05, "loss": 0.5868, "step": 41000 }, { "epoch": 1.45, "learning_rate": 1.7663222222222222e-05, "loss": 0.5746, "step": 41050 }, { "epoch": 1.45, "learning_rate": 1.765766666666667e-05, "loss": 0.5411, "step": 41100 }, { "epoch": 1.45, "learning_rate": 1.7652111111111112e-05, "loss": 0.6121, "step": 41150 }, { "epoch": 1.45, "learning_rate": 1.764655555555556e-05, "loss": 0.5597, "step": 41200 }, { "epoch": 1.45, "learning_rate": 1.7641000000000003e-05, "loss": 0.584, "step": 41250 }, { "epoch": 1.45, "learning_rate": 1.7635444444444446e-05, "loss": 0.6069, "step": 41300 }, { "epoch": 1.46, "learning_rate": 1.762988888888889e-05, "loss": 0.5685, "step": 41350 }, { "epoch": 1.46, "learning_rate": 1.7624333333333333e-05, "loss": 0.691, "step": 41400 }, { "epoch": 1.46, "learning_rate": 1.761877777777778e-05, "loss": 0.6247, "step": 41450 }, { "epoch": 1.46, "learning_rate": 1.7613222222222224e-05, "loss": 0.7853, "step": 41500 }, { "epoch": 1.46, "learning_rate": 1.7607666666666667e-05, "loss": 0.5773, "step": 41550 }, { "epoch": 1.46, "learning_rate": 1.7602111111111114e-05, "loss": 0.632, "step": 41600 }, { "epoch": 1.47, "learning_rate": 1.7596555555555558e-05, "loss": 0.6267, "step": 41650 }, { "epoch": 1.47, "learning_rate": 1.7591e-05, "loss": 0.879, "step": 41700 }, { "epoch": 1.47, "learning_rate": 1.7585444444444445e-05, "loss": 0.5982, "step": 41750 }, { "epoch": 1.47, "learning_rate": 1.757988888888889e-05, "loss": 0.6049, "step": 41800 }, { "epoch": 1.47, "learning_rate": 1.7574333333333336e-05, "loss": 0.5834, "step": 41850 }, { "epoch": 1.48, "learning_rate": 1.756877777777778e-05, "loss": 0.603, "step": 41900 }, { "epoch": 1.48, "learning_rate": 1.7563222222222223e-05, "loss": 0.5647, "step": 41950 }, { "epoch": 1.48, "learning_rate": 1.755766666666667e-05, "loss": 0.5773, "step": 42000 }, { "epoch": 1.48, "learning_rate": 1.7552111111111113e-05, "loss": 0.6292, "step": 42050 }, { "epoch": 1.48, "learning_rate": 1.7546555555555557e-05, "loss": 0.5832, "step": 42100 }, { "epoch": 1.48, "learning_rate": 1.7541e-05, "loss": 0.6394, "step": 42150 }, { "epoch": 1.49, "learning_rate": 1.7535444444444444e-05, "loss": 0.5718, "step": 42200 }, { "epoch": 1.49, "learning_rate": 1.752988888888889e-05, "loss": 0.6005, "step": 42250 }, { "epoch": 1.49, "learning_rate": 1.7524333333333334e-05, "loss": 0.653, "step": 42300 }, { "epoch": 1.49, "learning_rate": 1.751877777777778e-05, "loss": 0.5724, "step": 42350 }, { "epoch": 1.49, "learning_rate": 1.7513222222222225e-05, "loss": 0.5588, "step": 42400 }, { "epoch": 1.49, "learning_rate": 1.750766666666667e-05, "loss": 0.5701, "step": 42450 }, { "epoch": 1.5, "learning_rate": 1.7502111111111112e-05, "loss": 0.6346, "step": 42500 }, { "epoch": 1.5, "eval_loss": 0.3428270220756531, "eval_runtime": 12.6101, "eval_samples_per_second": 112.608, "eval_steps_per_second": 7.058, "eval_wer": 0.26150494690024506, "step": 42500 }, { "epoch": 1.5, "learning_rate": 1.7496555555555556e-05, "loss": 0.7485, "step": 42550 }, { "epoch": 1.5, "learning_rate": 1.7491000000000002e-05, "loss": 0.6093, "step": 42600 }, { "epoch": 1.5, "learning_rate": 1.7485444444444446e-05, "loss": 0.5708, "step": 42650 }, { "epoch": 1.5, "learning_rate": 1.747988888888889e-05, "loss": 0.6054, "step": 42700 }, { "epoch": 1.51, "learning_rate": 1.7474333333333337e-05, "loss": 0.7292, "step": 42750 }, { "epoch": 1.51, "learning_rate": 1.746877777777778e-05, "loss": 0.7634, "step": 42800 }, { "epoch": 1.51, "learning_rate": 1.7463222222222224e-05, "loss": 0.59, "step": 42850 }, { "epoch": 1.51, "learning_rate": 1.7457666666666667e-05, "loss": 0.5566, "step": 42900 }, { "epoch": 1.51, "learning_rate": 1.745211111111111e-05, "loss": 0.5971, "step": 42950 }, { "epoch": 1.51, "learning_rate": 1.7446555555555558e-05, "loss": 0.5703, "step": 43000 }, { "epoch": 1.52, "learning_rate": 1.7441e-05, "loss": 0.5855, "step": 43050 }, { "epoch": 1.52, "learning_rate": 1.7435444444444445e-05, "loss": 0.5643, "step": 43100 }, { "epoch": 1.52, "learning_rate": 1.7429888888888892e-05, "loss": 0.5666, "step": 43150 }, { "epoch": 1.52, "learning_rate": 1.7424333333333335e-05, "loss": 0.5958, "step": 43200 }, { "epoch": 1.52, "learning_rate": 1.741877777777778e-05, "loss": 0.6357, "step": 43250 }, { "epoch": 1.52, "learning_rate": 1.7413222222222222e-05, "loss": 0.6212, "step": 43300 }, { "epoch": 1.53, "learning_rate": 1.7407666666666666e-05, "loss": 0.5988, "step": 43350 }, { "epoch": 1.53, "learning_rate": 1.7402111111111113e-05, "loss": 0.5813, "step": 43400 }, { "epoch": 1.53, "learning_rate": 1.7396555555555556e-05, "loss": 0.5888, "step": 43450 }, { "epoch": 1.53, "learning_rate": 1.7391000000000003e-05, "loss": 0.5497, "step": 43500 }, { "epoch": 1.53, "learning_rate": 1.7385555555555556e-05, "loss": 0.633, "step": 43550 }, { "epoch": 1.54, "learning_rate": 1.7380000000000003e-05, "loss": 0.5787, "step": 43600 }, { "epoch": 1.54, "learning_rate": 1.7374444444444447e-05, "loss": 0.558, "step": 43650 }, { "epoch": 1.54, "learning_rate": 1.736888888888889e-05, "loss": 0.5837, "step": 43700 }, { "epoch": 1.54, "learning_rate": 1.7363333333333334e-05, "loss": 0.5828, "step": 43750 }, { "epoch": 1.54, "learning_rate": 1.735777777777778e-05, "loss": 0.5664, "step": 43800 }, { "epoch": 1.54, "learning_rate": 1.7352222222222224e-05, "loss": 0.5624, "step": 43850 }, { "epoch": 1.55, "learning_rate": 1.7346666666666668e-05, "loss": 0.5843, "step": 43900 }, { "epoch": 1.55, "learning_rate": 1.7341111111111115e-05, "loss": 0.5787, "step": 43950 }, { "epoch": 1.55, "learning_rate": 1.7335555555555558e-05, "loss": 0.5828, "step": 44000 }, { "epoch": 1.55, "learning_rate": 1.7330000000000002e-05, "loss": 0.6875, "step": 44050 }, { "epoch": 1.55, "learning_rate": 1.7324444444444445e-05, "loss": 0.5827, "step": 44100 }, { "epoch": 1.55, "learning_rate": 1.731888888888889e-05, "loss": 0.6, "step": 44150 }, { "epoch": 1.56, "learning_rate": 1.7313333333333336e-05, "loss": 0.5888, "step": 44200 }, { "epoch": 1.56, "learning_rate": 1.730777777777778e-05, "loss": 0.5596, "step": 44250 }, { "epoch": 1.56, "learning_rate": 1.7302222222222226e-05, "loss": 0.6228, "step": 44300 }, { "epoch": 1.56, "learning_rate": 1.729666666666667e-05, "loss": 0.5851, "step": 44350 }, { "epoch": 1.56, "learning_rate": 1.7291111111111113e-05, "loss": 0.5463, "step": 44400 }, { "epoch": 1.57, "learning_rate": 1.7285555555555557e-05, "loss": 0.5626, "step": 44450 }, { "epoch": 1.57, "learning_rate": 1.728e-05, "loss": 0.5719, "step": 44500 }, { "epoch": 1.57, "learning_rate": 1.7274444444444444e-05, "loss": 0.5769, "step": 44550 }, { "epoch": 1.57, "learning_rate": 1.726888888888889e-05, "loss": 0.5581, "step": 44600 }, { "epoch": 1.57, "learning_rate": 1.7263333333333335e-05, "loss": 0.6249, "step": 44650 }, { "epoch": 1.57, "learning_rate": 1.725777777777778e-05, "loss": 0.6894, "step": 44700 }, { "epoch": 1.58, "learning_rate": 1.7252222222222225e-05, "loss": 0.5778, "step": 44750 }, { "epoch": 1.58, "learning_rate": 1.724666666666667e-05, "loss": 0.554, "step": 44800 }, { "epoch": 1.58, "learning_rate": 1.7241111111111112e-05, "loss": 0.5495, "step": 44850 }, { "epoch": 1.58, "learning_rate": 1.7235555555555556e-05, "loss": 0.7732, "step": 44900 }, { "epoch": 1.58, "learning_rate": 1.7230000000000003e-05, "loss": 0.5915, "step": 44950 }, { "epoch": 1.58, "learning_rate": 1.7224444444444446e-05, "loss": 0.5739, "step": 45000 }, { "epoch": 1.58, "eval_loss": 0.3470255136489868, "eval_runtime": 72.9979, "eval_samples_per_second": 19.453, "eval_steps_per_second": 1.219, "eval_wer": 0.2577834256149587, "step": 45000 }, { "epoch": 1.59, "learning_rate": 1.721888888888889e-05, "loss": 0.5625, "step": 45050 }, { "epoch": 1.59, "learning_rate": 1.7213333333333337e-05, "loss": 0.5674, "step": 45100 }, { "epoch": 1.59, "learning_rate": 1.720777777777778e-05, "loss": 0.5523, "step": 45150 }, { "epoch": 1.59, "learning_rate": 1.7202222222222224e-05, "loss": 0.5494, "step": 45200 }, { "epoch": 1.59, "learning_rate": 1.7196666666666667e-05, "loss": 0.5827, "step": 45250 }, { "epoch": 1.59, "learning_rate": 1.719111111111111e-05, "loss": 0.5868, "step": 45300 }, { "epoch": 1.6, "learning_rate": 1.7185555555555558e-05, "loss": 0.5468, "step": 45350 }, { "epoch": 1.6, "learning_rate": 1.718e-05, "loss": 0.6206, "step": 45400 }, { "epoch": 1.6, "learning_rate": 1.717444444444445e-05, "loss": 0.6871, "step": 45450 }, { "epoch": 1.6, "learning_rate": 1.7168888888888892e-05, "loss": 0.5832, "step": 45500 }, { "epoch": 1.6, "learning_rate": 1.7163333333333336e-05, "loss": 0.5677, "step": 45550 }, { "epoch": 1.61, "learning_rate": 1.715777777777778e-05, "loss": 0.5628, "step": 45600 }, { "epoch": 1.61, "learning_rate": 1.7152222222222223e-05, "loss": 0.5721, "step": 45650 }, { "epoch": 1.61, "learning_rate": 1.7146666666666666e-05, "loss": 0.5802, "step": 45700 }, { "epoch": 1.61, "learning_rate": 1.7141111111111113e-05, "loss": 0.5697, "step": 45750 }, { "epoch": 1.61, "learning_rate": 1.7135555555555557e-05, "loss": 0.559, "step": 45800 }, { "epoch": 1.61, "learning_rate": 1.7130000000000004e-05, "loss": 0.5398, "step": 45850 }, { "epoch": 1.62, "learning_rate": 1.7124444444444447e-05, "loss": 0.5312, "step": 45900 }, { "epoch": 1.62, "learning_rate": 1.711888888888889e-05, "loss": 0.573, "step": 45950 }, { "epoch": 1.62, "learning_rate": 1.7113333333333334e-05, "loss": 0.567, "step": 46000 }, { "epoch": 1.62, "learning_rate": 1.7107777777777778e-05, "loss": 0.5887, "step": 46050 }, { "epoch": 1.62, "learning_rate": 1.7102222222222225e-05, "loss": 0.5814, "step": 46100 }, { "epoch": 1.62, "learning_rate": 1.709666666666667e-05, "loss": 0.5851, "step": 46150 }, { "epoch": 1.63, "learning_rate": 1.7091111111111112e-05, "loss": 0.5528, "step": 46200 }, { "epoch": 1.63, "learning_rate": 1.708555555555556e-05, "loss": 0.586, "step": 46250 }, { "epoch": 1.63, "learning_rate": 1.708011111111111e-05, "loss": 0.7257, "step": 46300 }, { "epoch": 1.63, "learning_rate": 1.7074555555555555e-05, "loss": 0.546, "step": 46350 }, { "epoch": 1.63, "learning_rate": 1.7069000000000002e-05, "loss": 0.7151, "step": 46400 }, { "epoch": 1.64, "learning_rate": 1.7063444444444446e-05, "loss": 0.5314, "step": 46450 }, { "epoch": 1.64, "learning_rate": 1.705788888888889e-05, "loss": 0.5981, "step": 46500 }, { "epoch": 1.64, "learning_rate": 1.7052444444444445e-05, "loss": 0.5394, "step": 46550 }, { "epoch": 1.64, "learning_rate": 1.7046888888888892e-05, "loss": 0.5726, "step": 46600 }, { "epoch": 1.64, "learning_rate": 1.7041333333333336e-05, "loss": 0.5513, "step": 46650 }, { "epoch": 1.64, "learning_rate": 1.703577777777778e-05, "loss": 0.5392, "step": 46700 }, { "epoch": 1.65, "learning_rate": 1.7030222222222223e-05, "loss": 0.564, "step": 46750 }, { "epoch": 1.65, "learning_rate": 1.7024666666666666e-05, "loss": 0.5472, "step": 46800 }, { "epoch": 1.65, "learning_rate": 1.7019111111111113e-05, "loss": 0.6365, "step": 46850 }, { "epoch": 1.65, "learning_rate": 1.7013555555555557e-05, "loss": 0.684, "step": 46900 }, { "epoch": 1.65, "learning_rate": 1.7008000000000004e-05, "loss": 0.5901, "step": 46950 }, { "epoch": 1.65, "learning_rate": 1.7002444444444447e-05, "loss": 0.5984, "step": 47000 }, { "epoch": 1.66, "learning_rate": 1.699688888888889e-05, "loss": 0.5443, "step": 47050 }, { "epoch": 1.66, "learning_rate": 1.6991333333333335e-05, "loss": 0.5464, "step": 47100 }, { "epoch": 1.66, "learning_rate": 1.6985777777777778e-05, "loss": 0.6189, "step": 47150 }, { "epoch": 1.66, "learning_rate": 1.6980222222222225e-05, "loss": 0.6035, "step": 47200 }, { "epoch": 1.66, "learning_rate": 1.697466666666667e-05, "loss": 0.5518, "step": 47250 }, { "epoch": 1.67, "learning_rate": 1.6969111111111112e-05, "loss": 0.7211, "step": 47300 }, { "epoch": 1.67, "learning_rate": 1.696355555555556e-05, "loss": 0.5759, "step": 47350 }, { "epoch": 1.67, "learning_rate": 1.6958000000000003e-05, "loss": 0.5575, "step": 47400 }, { "epoch": 1.67, "learning_rate": 1.6952444444444446e-05, "loss": 0.5782, "step": 47450 }, { "epoch": 1.67, "learning_rate": 1.694688888888889e-05, "loss": 0.544, "step": 47500 }, { "epoch": 1.67, "eval_loss": 0.32071319222450256, "eval_runtime": 13.5602, "eval_samples_per_second": 104.718, "eval_steps_per_second": 6.563, "eval_wer": 0.24897885086684216, "step": 47500 }, { "epoch": 1.67, "learning_rate": 1.6941333333333333e-05, "loss": 0.5724, "step": 47550 }, { "epoch": 1.68, "learning_rate": 1.693577777777778e-05, "loss": 0.683, "step": 47600 }, { "epoch": 1.68, "learning_rate": 1.6930222222222224e-05, "loss": 0.6379, "step": 47650 }, { "epoch": 1.68, "learning_rate": 1.6924666666666667e-05, "loss": 0.5754, "step": 47700 }, { "epoch": 1.68, "learning_rate": 1.6919111111111114e-05, "loss": 0.5727, "step": 47750 }, { "epoch": 1.68, "learning_rate": 1.6913555555555558e-05, "loss": 0.5912, "step": 47800 }, { "epoch": 1.68, "learning_rate": 1.6908e-05, "loss": 0.6104, "step": 47850 }, { "epoch": 1.69, "learning_rate": 1.6902444444444445e-05, "loss": 0.564, "step": 47900 }, { "epoch": 1.69, "learning_rate": 1.6897e-05, "loss": 0.5144, "step": 47950 }, { "epoch": 1.69, "learning_rate": 1.6891444444444445e-05, "loss": 0.5751, "step": 48000 }, { "epoch": 1.69, "learning_rate": 1.688588888888889e-05, "loss": 0.5761, "step": 48050 }, { "epoch": 1.69, "learning_rate": 1.6880333333333335e-05, "loss": 0.5385, "step": 48100 }, { "epoch": 1.7, "learning_rate": 1.687477777777778e-05, "loss": 0.5492, "step": 48150 }, { "epoch": 1.7, "learning_rate": 1.6869222222222222e-05, "loss": 0.6261, "step": 48200 }, { "epoch": 1.7, "learning_rate": 1.6863666666666666e-05, "loss": 0.545, "step": 48250 }, { "epoch": 1.7, "learning_rate": 1.6858111111111113e-05, "loss": 0.552, "step": 48300 }, { "epoch": 1.7, "learning_rate": 1.6852555555555556e-05, "loss": 0.5746, "step": 48350 }, { "epoch": 1.7, "learning_rate": 1.6847000000000003e-05, "loss": 0.5326, "step": 48400 }, { "epoch": 1.71, "learning_rate": 1.6841444444444447e-05, "loss": 0.6293, "step": 48450 }, { "epoch": 1.71, "learning_rate": 1.683588888888889e-05, "loss": 0.6511, "step": 48500 }, { "epoch": 1.71, "learning_rate": 1.6830333333333334e-05, "loss": 0.8434, "step": 48550 }, { "epoch": 1.71, "learning_rate": 1.6824777777777777e-05, "loss": 0.5357, "step": 48600 }, { "epoch": 1.71, "learning_rate": 1.6819222222222224e-05, "loss": 0.5562, "step": 48650 }, { "epoch": 1.71, "learning_rate": 1.6813666666666668e-05, "loss": 0.58, "step": 48700 }, { "epoch": 1.72, "learning_rate": 1.680811111111111e-05, "loss": 0.5324, "step": 48750 }, { "epoch": 1.72, "learning_rate": 1.680255555555556e-05, "loss": 0.5419, "step": 48800 }, { "epoch": 1.72, "learning_rate": 1.6797000000000002e-05, "loss": 0.5469, "step": 48850 }, { "epoch": 1.72, "learning_rate": 1.6791444444444446e-05, "loss": 0.5348, "step": 48900 }, { "epoch": 1.72, "learning_rate": 1.678588888888889e-05, "loss": 0.5359, "step": 48950 }, { "epoch": 1.73, "learning_rate": 1.6780333333333333e-05, "loss": 0.5418, "step": 49000 }, { "epoch": 1.73, "learning_rate": 1.677477777777778e-05, "loss": 0.55, "step": 49050 }, { "epoch": 1.73, "learning_rate": 1.6769222222222223e-05, "loss": 0.5817, "step": 49100 }, { "epoch": 1.73, "learning_rate": 1.6763666666666667e-05, "loss": 0.5542, "step": 49150 }, { "epoch": 1.73, "learning_rate": 1.6758111111111114e-05, "loss": 0.6008, "step": 49200 }, { "epoch": 1.73, "learning_rate": 1.6752555555555557e-05, "loss": 0.5671, "step": 49250 }, { "epoch": 1.74, "learning_rate": 1.6747e-05, "loss": 0.7473, "step": 49300 }, { "epoch": 1.74, "learning_rate": 1.6741444444444444e-05, "loss": 0.5608, "step": 49350 }, { "epoch": 1.74, "learning_rate": 1.6735888888888888e-05, "loss": 0.5401, "step": 49400 }, { "epoch": 1.74, "learning_rate": 1.6730333333333335e-05, "loss": 0.5483, "step": 49450 }, { "epoch": 1.74, "learning_rate": 1.672477777777778e-05, "loss": 0.5964, "step": 49500 }, { "epoch": 1.74, "learning_rate": 1.6719222222222225e-05, "loss": 0.5701, "step": 49550 }, { "epoch": 1.75, "learning_rate": 1.671366666666667e-05, "loss": 0.6102, "step": 49600 }, { "epoch": 1.75, "learning_rate": 1.6708111111111112e-05, "loss": 0.5593, "step": 49650 }, { "epoch": 1.75, "learning_rate": 1.6702555555555556e-05, "loss": 0.5305, "step": 49700 }, { "epoch": 1.75, "learning_rate": 1.6697e-05, "loss": 0.5501, "step": 49750 }, { "epoch": 1.75, "learning_rate": 1.6691444444444446e-05, "loss": 0.551, "step": 49800 }, { "epoch": 1.76, "learning_rate": 1.668588888888889e-05, "loss": 0.5912, "step": 49850 }, { "epoch": 1.76, "learning_rate": 1.6680333333333334e-05, "loss": 0.5757, "step": 49900 }, { "epoch": 1.76, "learning_rate": 1.667477777777778e-05, "loss": 0.5762, "step": 49950 }, { "epoch": 1.76, "learning_rate": 1.6669222222222224e-05, "loss": 0.5283, "step": 50000 }, { "epoch": 1.76, "eval_loss": 0.3202364444732666, "eval_runtime": 10.1336, "eval_samples_per_second": 140.128, "eval_steps_per_second": 8.783, "eval_wer": 0.2423527276027957, "step": 50000 }, { "epoch": 1.76, "learning_rate": 1.6663666666666668e-05, "loss": 0.6171, "step": 50050 }, { "epoch": 1.76, "learning_rate": 1.665811111111111e-05, "loss": 0.5526, "step": 50100 }, { "epoch": 1.77, "learning_rate": 1.6652555555555555e-05, "loss": 0.5467, "step": 50150 }, { "epoch": 1.77, "learning_rate": 1.6647000000000002e-05, "loss": 0.7412, "step": 50200 }, { "epoch": 1.77, "learning_rate": 1.6641444444444445e-05, "loss": 0.5582, "step": 50250 }, { "epoch": 1.77, "learning_rate": 1.663588888888889e-05, "loss": 0.5511, "step": 50300 }, { "epoch": 1.77, "learning_rate": 1.6630333333333336e-05, "loss": 0.5511, "step": 50350 }, { "epoch": 1.77, "learning_rate": 1.662477777777778e-05, "loss": 0.5604, "step": 50400 }, { "epoch": 1.78, "learning_rate": 1.6619222222222223e-05, "loss": 0.5505, "step": 50450 }, { "epoch": 1.78, "learning_rate": 1.6613666666666666e-05, "loss": 0.5654, "step": 50500 }, { "epoch": 1.78, "learning_rate": 1.660811111111111e-05, "loss": 0.5476, "step": 50550 }, { "epoch": 1.78, "learning_rate": 1.6602555555555557e-05, "loss": 0.5652, "step": 50600 }, { "epoch": 1.78, "learning_rate": 1.6597e-05, "loss": 0.6549, "step": 50650 }, { "epoch": 1.79, "learning_rate": 1.6591444444444447e-05, "loss": 0.5258, "step": 50700 }, { "epoch": 1.79, "learning_rate": 1.658588888888889e-05, "loss": 0.5808, "step": 50750 }, { "epoch": 1.79, "learning_rate": 1.6580333333333335e-05, "loss": 0.5448, "step": 50800 }, { "epoch": 1.79, "learning_rate": 1.6574777777777778e-05, "loss": 0.551, "step": 50850 }, { "epoch": 1.79, "learning_rate": 1.656922222222222e-05, "loss": 0.6163, "step": 50900 }, { "epoch": 1.79, "learning_rate": 1.656366666666667e-05, "loss": 0.5508, "step": 50950 }, { "epoch": 1.8, "learning_rate": 1.6558111111111112e-05, "loss": 0.5076, "step": 51000 }, { "epoch": 1.8, "learning_rate": 1.6552555555555556e-05, "loss": 0.6085, "step": 51050 }, { "epoch": 1.8, "learning_rate": 1.6547000000000003e-05, "loss": 0.5306, "step": 51100 }, { "epoch": 1.8, "learning_rate": 1.6541444444444446e-05, "loss": 0.6092, "step": 51150 }, { "epoch": 1.8, "learning_rate": 1.653588888888889e-05, "loss": 0.5386, "step": 51200 }, { "epoch": 1.8, "learning_rate": 1.6530333333333333e-05, "loss": 0.5188, "step": 51250 }, { "epoch": 1.81, "learning_rate": 1.6524777777777777e-05, "loss": 0.5527, "step": 51300 }, { "epoch": 1.81, "learning_rate": 1.6519222222222224e-05, "loss": 0.5686, "step": 51350 }, { "epoch": 1.81, "learning_rate": 1.6513666666666667e-05, "loss": 0.5419, "step": 51400 }, { "epoch": 1.81, "learning_rate": 1.650811111111111e-05, "loss": 0.5639, "step": 51450 }, { "epoch": 1.81, "learning_rate": 1.6502555555555558e-05, "loss": 0.6296, "step": 51500 }, { "epoch": 1.82, "learning_rate": 1.6497e-05, "loss": 0.5084, "step": 51550 }, { "epoch": 1.82, "learning_rate": 1.6491444444444445e-05, "loss": 0.5637, "step": 51600 }, { "epoch": 1.82, "learning_rate": 1.648588888888889e-05, "loss": 0.5285, "step": 51650 }, { "epoch": 1.82, "learning_rate": 1.6480333333333332e-05, "loss": 0.5963, "step": 51700 }, { "epoch": 1.82, "learning_rate": 1.647477777777778e-05, "loss": 0.5745, "step": 51750 }, { "epoch": 1.82, "learning_rate": 1.6469222222222223e-05, "loss": 0.6812, "step": 51800 }, { "epoch": 1.83, "learning_rate": 1.646366666666667e-05, "loss": 0.5354, "step": 51850 }, { "epoch": 1.83, "learning_rate": 1.6458111111111113e-05, "loss": 0.5434, "step": 51900 }, { "epoch": 1.83, "learning_rate": 1.6452555555555557e-05, "loss": 0.54, "step": 51950 }, { "epoch": 1.83, "learning_rate": 1.6447e-05, "loss": 0.5354, "step": 52000 }, { "epoch": 1.83, "learning_rate": 1.6441444444444444e-05, "loss": 0.5201, "step": 52050 }, { "epoch": 1.83, "learning_rate": 1.643588888888889e-05, "loss": 0.5274, "step": 52100 }, { "epoch": 1.84, "learning_rate": 1.6430333333333334e-05, "loss": 0.5458, "step": 52150 }, { "epoch": 1.84, "learning_rate": 1.6424777777777778e-05, "loss": 0.7196, "step": 52200 }, { "epoch": 1.84, "learning_rate": 1.6419222222222225e-05, "loss": 0.5242, "step": 52250 }, { "epoch": 1.84, "learning_rate": 1.641366666666667e-05, "loss": 0.5836, "step": 52300 }, { "epoch": 1.84, "learning_rate": 1.6408222222222224e-05, "loss": 0.7041, "step": 52350 }, { "epoch": 1.84, "learning_rate": 1.6402666666666668e-05, "loss": 0.5657, "step": 52400 }, { "epoch": 1.85, "learning_rate": 1.639711111111111e-05, "loss": 0.6842, "step": 52450 }, { "epoch": 1.85, "learning_rate": 1.6391555555555555e-05, "loss": 0.5552, "step": 52500 }, { "epoch": 1.85, "eval_loss": 0.31867992877960205, "eval_runtime": 17.7892, "eval_samples_per_second": 79.824, "eval_steps_per_second": 5.003, "eval_wer": 0.2379050558228193, "step": 52500 }, { "epoch": 1.85, "learning_rate": 1.6386000000000002e-05, "loss": 0.538, "step": 52550 }, { "epoch": 1.85, "learning_rate": 1.6380444444444446e-05, "loss": 0.5821, "step": 52600 }, { "epoch": 1.85, "learning_rate": 1.6374888888888893e-05, "loss": 0.7099, "step": 52650 }, { "epoch": 1.86, "learning_rate": 1.6369333333333336e-05, "loss": 0.5301, "step": 52700 }, { "epoch": 1.86, "learning_rate": 1.636377777777778e-05, "loss": 0.624, "step": 52750 }, { "epoch": 1.86, "learning_rate": 1.6358222222222223e-05, "loss": 0.5183, "step": 52800 }, { "epoch": 1.86, "learning_rate": 1.6352666666666667e-05, "loss": 0.5477, "step": 52850 }, { "epoch": 1.86, "learning_rate": 1.634711111111111e-05, "loss": 0.6519, "step": 52900 }, { "epoch": 1.86, "learning_rate": 1.6341555555555557e-05, "loss": 0.5497, "step": 52950 }, { "epoch": 1.87, "learning_rate": 1.6336e-05, "loss": 0.5563, "step": 53000 }, { "epoch": 1.87, "learning_rate": 1.6330444444444448e-05, "loss": 0.5055, "step": 53050 }, { "epoch": 1.87, "learning_rate": 1.632488888888889e-05, "loss": 0.5682, "step": 53100 }, { "epoch": 1.87, "learning_rate": 1.6319333333333335e-05, "loss": 0.5174, "step": 53150 }, { "epoch": 1.87, "learning_rate": 1.631377777777778e-05, "loss": 0.5932, "step": 53200 }, { "epoch": 1.87, "learning_rate": 1.6308222222222222e-05, "loss": 0.5349, "step": 53250 }, { "epoch": 1.88, "learning_rate": 1.630266666666667e-05, "loss": 0.522, "step": 53300 }, { "epoch": 1.88, "learning_rate": 1.6297111111111112e-05, "loss": 0.5621, "step": 53350 }, { "epoch": 1.88, "learning_rate": 1.6291555555555556e-05, "loss": 0.5548, "step": 53400 }, { "epoch": 1.88, "learning_rate": 1.6286000000000003e-05, "loss": 0.5709, "step": 53450 }, { "epoch": 1.88, "learning_rate": 1.6280444444444447e-05, "loss": 0.5436, "step": 53500 }, { "epoch": 1.89, "learning_rate": 1.627488888888889e-05, "loss": 0.5496, "step": 53550 }, { "epoch": 1.89, "learning_rate": 1.6269333333333334e-05, "loss": 0.5904, "step": 53600 }, { "epoch": 1.89, "learning_rate": 1.6263777777777777e-05, "loss": 0.521, "step": 53650 }, { "epoch": 1.89, "learning_rate": 1.6258222222222224e-05, "loss": 0.5418, "step": 53700 }, { "epoch": 1.89, "learning_rate": 1.6252666666666668e-05, "loss": 0.5381, "step": 53750 }, { "epoch": 1.89, "learning_rate": 1.6247111111111115e-05, "loss": 0.5472, "step": 53800 }, { "epoch": 1.9, "learning_rate": 1.6241555555555558e-05, "loss": 0.5566, "step": 53850 }, { "epoch": 1.9, "learning_rate": 1.6236000000000002e-05, "loss": 0.5026, "step": 53900 }, { "epoch": 1.9, "learning_rate": 1.6230444444444445e-05, "loss": 0.8364, "step": 53950 }, { "epoch": 1.9, "learning_rate": 1.622488888888889e-05, "loss": 0.5266, "step": 54000 }, { "epoch": 1.9, "learning_rate": 1.6219333333333332e-05, "loss": 0.5065, "step": 54050 }, { "epoch": 1.9, "learning_rate": 1.621377777777778e-05, "loss": 0.5534, "step": 54100 }, { "epoch": 1.91, "learning_rate": 1.6208222222222223e-05, "loss": 0.5064, "step": 54150 }, { "epoch": 1.91, "learning_rate": 1.620266666666667e-05, "loss": 0.5284, "step": 54200 }, { "epoch": 1.91, "learning_rate": 1.6197111111111113e-05, "loss": 0.6143, "step": 54250 }, { "epoch": 1.91, "learning_rate": 1.6191555555555557e-05, "loss": 0.5244, "step": 54300 }, { "epoch": 1.91, "learning_rate": 1.6186e-05, "loss": 0.5841, "step": 54350 }, { "epoch": 1.92, "learning_rate": 1.6180444444444444e-05, "loss": 0.5268, "step": 54400 }, { "epoch": 1.92, "learning_rate": 1.617488888888889e-05, "loss": 0.5505, "step": 54450 }, { "epoch": 1.92, "learning_rate": 1.6169333333333335e-05, "loss": 0.51, "step": 54500 }, { "epoch": 1.92, "learning_rate": 1.6163777777777778e-05, "loss": 0.5129, "step": 54550 }, { "epoch": 1.92, "learning_rate": 1.6158222222222225e-05, "loss": 0.4919, "step": 54600 }, { "epoch": 1.92, "learning_rate": 1.615266666666667e-05, "loss": 0.7325, "step": 54650 }, { "epoch": 1.93, "learning_rate": 1.6147111111111112e-05, "loss": 0.6419, "step": 54700 }, { "epoch": 1.93, "learning_rate": 1.6141555555555556e-05, "loss": 0.5212, "step": 54750 }, { "epoch": 1.93, "learning_rate": 1.6136e-05, "loss": 0.5155, "step": 54800 }, { "epoch": 1.93, "learning_rate": 1.6130444444444446e-05, "loss": 0.5238, "step": 54850 }, { "epoch": 1.93, "learning_rate": 1.612488888888889e-05, "loss": 0.5501, "step": 54900 }, { "epoch": 1.93, "learning_rate": 1.6119333333333337e-05, "loss": 0.5893, "step": 54950 }, { "epoch": 1.94, "learning_rate": 1.611377777777778e-05, "loss": 0.5218, "step": 55000 }, { "epoch": 1.94, "eval_loss": 0.32421165704727173, "eval_runtime": 10.3587, "eval_samples_per_second": 137.083, "eval_steps_per_second": 8.592, "eval_wer": 0.23826813107016429, "step": 55000 }, { "epoch": 1.94, "learning_rate": 1.6108222222222224e-05, "loss": 0.5497, "step": 55050 }, { "epoch": 1.94, "learning_rate": 1.6102666666666667e-05, "loss": 0.515, "step": 55100 }, { "epoch": 1.94, "learning_rate": 1.609711111111111e-05, "loss": 0.5276, "step": 55150 }, { "epoch": 1.94, "learning_rate": 1.6091555555555555e-05, "loss": 0.551, "step": 55200 }, { "epoch": 1.95, "learning_rate": 1.6086e-05, "loss": 0.5593, "step": 55250 }, { "epoch": 1.95, "learning_rate": 1.6080444444444445e-05, "loss": 0.5727, "step": 55300 }, { "epoch": 1.95, "learning_rate": 1.6074888888888892e-05, "loss": 0.5224, "step": 55350 }, { "epoch": 1.95, "learning_rate": 1.6069333333333336e-05, "loss": 0.5184, "step": 55400 }, { "epoch": 1.95, "learning_rate": 1.606377777777778e-05, "loss": 0.5468, "step": 55450 }, { "epoch": 1.95, "learning_rate": 1.6058222222222223e-05, "loss": 0.552, "step": 55500 }, { "epoch": 1.96, "learning_rate": 1.6052666666666666e-05, "loss": 0.5243, "step": 55550 }, { "epoch": 1.96, "learning_rate": 1.6047222222222222e-05, "loss": 0.6817, "step": 55600 }, { "epoch": 1.96, "learning_rate": 1.604166666666667e-05, "loss": 0.5353, "step": 55650 }, { "epoch": 1.96, "learning_rate": 1.6036111111111113e-05, "loss": 0.5242, "step": 55700 }, { "epoch": 1.96, "learning_rate": 1.6030555555555556e-05, "loss": 0.5514, "step": 55750 }, { "epoch": 1.96, "learning_rate": 1.6025000000000003e-05, "loss": 0.5133, "step": 55800 }, { "epoch": 1.97, "learning_rate": 1.6019444444444447e-05, "loss": 0.5157, "step": 55850 }, { "epoch": 1.97, "learning_rate": 1.601388888888889e-05, "loss": 0.5301, "step": 55900 }, { "epoch": 1.97, "learning_rate": 1.6008333333333334e-05, "loss": 0.5682, "step": 55950 }, { "epoch": 1.97, "learning_rate": 1.6002777777777777e-05, "loss": 0.5058, "step": 56000 }, { "epoch": 1.97, "learning_rate": 1.5997222222222224e-05, "loss": 0.5998, "step": 56050 }, { "epoch": 1.98, "learning_rate": 1.5991666666666668e-05, "loss": 0.5852, "step": 56100 }, { "epoch": 1.98, "learning_rate": 1.5986111111111115e-05, "loss": 0.4885, "step": 56150 }, { "epoch": 1.98, "learning_rate": 1.598055555555556e-05, "loss": 0.5215, "step": 56200 }, { "epoch": 1.98, "learning_rate": 1.5975000000000002e-05, "loss": 0.5291, "step": 56250 }, { "epoch": 1.98, "learning_rate": 1.5969444444444446e-05, "loss": 0.515, "step": 56300 }, { "epoch": 1.98, "learning_rate": 1.596388888888889e-05, "loss": 0.5319, "step": 56350 }, { "epoch": 1.99, "learning_rate": 1.5958333333333336e-05, "loss": 0.5858, "step": 56400 }, { "epoch": 1.99, "learning_rate": 1.595277777777778e-05, "loss": 0.5509, "step": 56450 }, { "epoch": 1.99, "learning_rate": 1.5947222222222223e-05, "loss": 0.5303, "step": 56500 }, { "epoch": 1.99, "learning_rate": 1.594166666666667e-05, "loss": 0.5727, "step": 56550 }, { "epoch": 1.99, "learning_rate": 1.5936111111111114e-05, "loss": 0.5412, "step": 56600 }, { "epoch": 1.99, "learning_rate": 1.5930555555555557e-05, "loss": 0.5197, "step": 56650 }, { "epoch": 2.0, "learning_rate": 1.5925e-05, "loss": 0.4933, "step": 56700 }, { "epoch": 2.0, "learning_rate": 1.5919444444444444e-05, "loss": 0.5301, "step": 56750 }, { "epoch": 2.0, "learning_rate": 1.591388888888889e-05, "loss": 0.5633, "step": 56800 }, { "epoch": 2.0, "learning_rate": 1.5908333333333335e-05, "loss": 0.5735, "step": 56850 }, { "epoch": 2.0, "learning_rate": 1.590277777777778e-05, "loss": 0.5179, "step": 56900 }, { "epoch": 2.01, "learning_rate": 1.5897222222222225e-05, "loss": 0.5011, "step": 56950 }, { "epoch": 2.01, "learning_rate": 1.589166666666667e-05, "loss": 0.6647, "step": 57000 }, { "epoch": 2.01, "learning_rate": 1.5886111111111113e-05, "loss": 0.5428, "step": 57050 }, { "epoch": 2.01, "learning_rate": 1.5880555555555556e-05, "loss": 0.5449, "step": 57100 }, { "epoch": 2.01, "learning_rate": 1.5875e-05, "loss": 0.5115, "step": 57150 }, { "epoch": 2.01, "learning_rate": 1.5869444444444447e-05, "loss": 0.5046, "step": 57200 }, { "epoch": 2.02, "learning_rate": 1.586388888888889e-05, "loss": 0.5417, "step": 57250 }, { "epoch": 2.02, "learning_rate": 1.5858333333333337e-05, "loss": 0.6466, "step": 57300 }, { "epoch": 2.02, "learning_rate": 1.585277777777778e-05, "loss": 0.5625, "step": 57350 }, { "epoch": 2.02, "learning_rate": 1.5847222222222224e-05, "loss": 0.5536, "step": 57400 }, { "epoch": 2.02, "learning_rate": 1.5841666666666668e-05, "loss": 0.5098, "step": 57450 }, { "epoch": 2.02, "learning_rate": 1.583611111111111e-05, "loss": 0.4939, "step": 57500 }, { "epoch": 2.02, "eval_loss": 0.3277219235897064, "eval_runtime": 10.0298, "eval_samples_per_second": 141.578, "eval_steps_per_second": 8.874, "eval_wer": 0.24180811473177816, "step": 57500 }, { "epoch": 2.03, "learning_rate": 1.5830555555555558e-05, "loss": 0.5079, "step": 57550 }, { "epoch": 2.03, "learning_rate": 1.5825000000000002e-05, "loss": 0.5303, "step": 57600 }, { "epoch": 2.03, "learning_rate": 1.5819444444444445e-05, "loss": 0.4911, "step": 57650 }, { "epoch": 2.03, "learning_rate": 1.5813888888888892e-05, "loss": 0.5412, "step": 57700 }, { "epoch": 2.03, "learning_rate": 1.5808333333333336e-05, "loss": 0.5741, "step": 57750 }, { "epoch": 2.04, "learning_rate": 1.580277777777778e-05, "loss": 0.4949, "step": 57800 }, { "epoch": 2.04, "learning_rate": 1.5797222222222223e-05, "loss": 0.5304, "step": 57850 }, { "epoch": 2.04, "learning_rate": 1.5791666666666667e-05, "loss": 0.5292, "step": 57900 }, { "epoch": 2.04, "learning_rate": 1.5786111111111113e-05, "loss": 0.4999, "step": 57950 }, { "epoch": 2.04, "learning_rate": 1.5780555555555557e-05, "loss": 0.5226, "step": 58000 }, { "epoch": 2.04, "learning_rate": 1.5775e-05, "loss": 0.5617, "step": 58050 }, { "epoch": 2.05, "learning_rate": 1.5769444444444448e-05, "loss": 0.5479, "step": 58100 }, { "epoch": 2.05, "learning_rate": 1.576388888888889e-05, "loss": 0.4858, "step": 58150 }, { "epoch": 2.05, "learning_rate": 1.5758333333333335e-05, "loss": 0.5223, "step": 58200 }, { "epoch": 2.05, "learning_rate": 1.5752777777777778e-05, "loss": 0.515, "step": 58250 }, { "epoch": 2.05, "learning_rate": 1.5747222222222222e-05, "loss": 0.5318, "step": 58300 }, { "epoch": 2.05, "learning_rate": 1.574166666666667e-05, "loss": 0.5223, "step": 58350 }, { "epoch": 2.06, "learning_rate": 1.5736111111111112e-05, "loss": 0.5245, "step": 58400 }, { "epoch": 2.06, "learning_rate": 1.573055555555556e-05, "loss": 0.5438, "step": 58450 }, { "epoch": 2.06, "learning_rate": 1.5725000000000003e-05, "loss": 0.5155, "step": 58500 }, { "epoch": 2.06, "learning_rate": 1.5719444444444446e-05, "loss": 0.5434, "step": 58550 }, { "epoch": 2.06, "learning_rate": 1.571388888888889e-05, "loss": 0.5322, "step": 58600 }, { "epoch": 2.06, "learning_rate": 1.5708333333333333e-05, "loss": 0.5132, "step": 58650 }, { "epoch": 2.07, "learning_rate": 1.570277777777778e-05, "loss": 0.5128, "step": 58700 }, { "epoch": 2.07, "learning_rate": 1.5697222222222224e-05, "loss": 0.5776, "step": 58750 }, { "epoch": 2.07, "learning_rate": 1.5691666666666667e-05, "loss": 0.5161, "step": 58800 }, { "epoch": 2.07, "learning_rate": 1.5686111111111114e-05, "loss": 0.501, "step": 58850 }, { "epoch": 2.07, "learning_rate": 1.5680555555555558e-05, "loss": 0.506, "step": 58900 }, { "epoch": 2.08, "learning_rate": 1.5675e-05, "loss": 0.5314, "step": 58950 }, { "epoch": 2.08, "learning_rate": 1.5669444444444445e-05, "loss": 0.5432, "step": 59000 }, { "epoch": 2.08, "learning_rate": 1.566388888888889e-05, "loss": 0.4975, "step": 59050 }, { "epoch": 2.08, "learning_rate": 1.5658333333333336e-05, "loss": 0.5064, "step": 59100 }, { "epoch": 2.08, "learning_rate": 1.565288888888889e-05, "loss": 0.5153, "step": 59150 }, { "epoch": 2.08, "learning_rate": 1.5647333333333335e-05, "loss": 0.5147, "step": 59200 }, { "epoch": 2.09, "learning_rate": 1.564177777777778e-05, "loss": 0.5079, "step": 59250 }, { "epoch": 2.09, "learning_rate": 1.5636222222222222e-05, "loss": 0.5381, "step": 59300 }, { "epoch": 2.09, "learning_rate": 1.5630666666666666e-05, "loss": 0.5113, "step": 59350 }, { "epoch": 2.09, "learning_rate": 1.5625111111111113e-05, "loss": 0.6247, "step": 59400 }, { "epoch": 2.09, "learning_rate": 1.5619555555555556e-05, "loss": 0.5446, "step": 59450 }, { "epoch": 2.09, "learning_rate": 1.5614e-05, "loss": 0.5206, "step": 59500 }, { "epoch": 2.1, "learning_rate": 1.5608444444444447e-05, "loss": 0.4945, "step": 59550 }, { "epoch": 2.1, "learning_rate": 1.560288888888889e-05, "loss": 0.5786, "step": 59600 }, { "epoch": 2.1, "learning_rate": 1.5597333333333334e-05, "loss": 0.4999, "step": 59650 }, { "epoch": 2.1, "learning_rate": 1.5591777777777778e-05, "loss": 0.5409, "step": 59700 }, { "epoch": 2.1, "learning_rate": 1.558622222222222e-05, "loss": 0.5468, "step": 59750 }, { "epoch": 2.11, "learning_rate": 1.5580666666666668e-05, "loss": 0.5235, "step": 59800 }, { "epoch": 2.11, "learning_rate": 1.557511111111111e-05, "loss": 0.4865, "step": 59850 }, { "epoch": 2.11, "learning_rate": 1.556955555555556e-05, "loss": 0.5163, "step": 59900 }, { "epoch": 2.11, "learning_rate": 1.5564000000000002e-05, "loss": 0.5255, "step": 59950 }, { "epoch": 2.11, "learning_rate": 1.5558444444444446e-05, "loss": 0.5141, "step": 60000 }, { "epoch": 2.11, "eval_loss": 0.30582571029663086, "eval_runtime": 49.1181, "eval_samples_per_second": 28.91, "eval_steps_per_second": 1.812, "eval_wer": 0.23291277117182535, "step": 60000 }, { "epoch": 2.11, "learning_rate": 1.555288888888889e-05, "loss": 0.5569, "step": 60050 }, { "epoch": 2.12, "learning_rate": 1.5547333333333333e-05, "loss": 0.5624, "step": 60100 }, { "epoch": 2.12, "learning_rate": 1.554177777777778e-05, "loss": 0.5086, "step": 60150 }, { "epoch": 2.12, "learning_rate": 1.5536222222222223e-05, "loss": 0.5266, "step": 60200 }, { "epoch": 2.12, "learning_rate": 1.5530666666666667e-05, "loss": 0.5445, "step": 60250 }, { "epoch": 2.12, "learning_rate": 1.5525111111111114e-05, "loss": 0.524, "step": 60300 }, { "epoch": 2.12, "learning_rate": 1.5519555555555557e-05, "loss": 0.4945, "step": 60350 }, { "epoch": 2.13, "learning_rate": 1.5514e-05, "loss": 0.4995, "step": 60400 }, { "epoch": 2.13, "learning_rate": 1.5508444444444444e-05, "loss": 0.5097, "step": 60450 }, { "epoch": 2.13, "learning_rate": 1.5502888888888888e-05, "loss": 0.506, "step": 60500 }, { "epoch": 2.13, "learning_rate": 1.5497333333333335e-05, "loss": 0.5127, "step": 60550 }, { "epoch": 2.13, "learning_rate": 1.549177777777778e-05, "loss": 0.528, "step": 60600 }, { "epoch": 2.14, "learning_rate": 1.5486222222222222e-05, "loss": 0.5173, "step": 60650 }, { "epoch": 2.14, "learning_rate": 1.548066666666667e-05, "loss": 0.5461, "step": 60700 }, { "epoch": 2.14, "learning_rate": 1.5475111111111113e-05, "loss": 0.5025, "step": 60750 }, { "epoch": 2.14, "learning_rate": 1.5469555555555556e-05, "loss": 0.5041, "step": 60800 }, { "epoch": 2.14, "learning_rate": 1.5464e-05, "loss": 0.5699, "step": 60850 }, { "epoch": 2.14, "learning_rate": 1.5458444444444443e-05, "loss": 0.5449, "step": 60900 }, { "epoch": 2.15, "learning_rate": 1.545288888888889e-05, "loss": 0.5013, "step": 60950 }, { "epoch": 2.15, "learning_rate": 1.5447333333333334e-05, "loss": 0.521, "step": 61000 }, { "epoch": 2.15, "learning_rate": 1.544177777777778e-05, "loss": 0.5076, "step": 61050 }, { "epoch": 2.15, "learning_rate": 1.5436222222222224e-05, "loss": 0.4838, "step": 61100 }, { "epoch": 2.15, "learning_rate": 1.5430666666666668e-05, "loss": 0.5127, "step": 61150 }, { "epoch": 2.15, "learning_rate": 1.542511111111111e-05, "loss": 0.4675, "step": 61200 }, { "epoch": 2.16, "learning_rate": 1.5419555555555555e-05, "loss": 0.5204, "step": 61250 }, { "epoch": 2.16, "learning_rate": 1.5414000000000002e-05, "loss": 0.5482, "step": 61300 }, { "epoch": 2.16, "learning_rate": 1.5408444444444445e-05, "loss": 0.4813, "step": 61350 }, { "epoch": 2.16, "learning_rate": 1.540288888888889e-05, "loss": 0.5614, "step": 61400 }, { "epoch": 2.16, "learning_rate": 1.5397333333333336e-05, "loss": 0.501, "step": 61450 }, { "epoch": 2.17, "learning_rate": 1.539177777777778e-05, "loss": 0.5015, "step": 61500 }, { "epoch": 2.17, "learning_rate": 1.5386222222222223e-05, "loss": 0.5323, "step": 61550 }, { "epoch": 2.17, "learning_rate": 1.5380666666666667e-05, "loss": 0.522, "step": 61600 }, { "epoch": 2.17, "learning_rate": 1.537511111111111e-05, "loss": 0.4968, "step": 61650 }, { "epoch": 2.17, "learning_rate": 1.5369555555555557e-05, "loss": 0.5109, "step": 61700 }, { "epoch": 2.17, "learning_rate": 1.5364e-05, "loss": 0.5074, "step": 61750 }, { "epoch": 2.18, "learning_rate": 1.5358444444444444e-05, "loss": 0.5037, "step": 61800 }, { "epoch": 2.18, "learning_rate": 1.535288888888889e-05, "loss": 0.5544, "step": 61850 }, { "epoch": 2.18, "learning_rate": 1.5347333333333335e-05, "loss": 0.532, "step": 61900 }, { "epoch": 2.18, "learning_rate": 1.5341777777777778e-05, "loss": 0.5018, "step": 61950 }, { "epoch": 2.18, "learning_rate": 1.5336222222222222e-05, "loss": 0.5023, "step": 62000 }, { "epoch": 2.18, "learning_rate": 1.5330666666666665e-05, "loss": 0.4937, "step": 62050 }, { "epoch": 2.19, "learning_rate": 1.5325111111111112e-05, "loss": 0.5127, "step": 62100 }, { "epoch": 2.19, "learning_rate": 1.5319555555555556e-05, "loss": 0.5116, "step": 62150 }, { "epoch": 2.19, "learning_rate": 1.5314000000000003e-05, "loss": 0.5205, "step": 62200 }, { "epoch": 2.19, "learning_rate": 1.5308444444444446e-05, "loss": 0.553, "step": 62250 }, { "epoch": 2.19, "learning_rate": 1.530288888888889e-05, "loss": 0.4693, "step": 62300 }, { "epoch": 2.2, "learning_rate": 1.5297333333333333e-05, "loss": 0.5314, "step": 62350 }, { "epoch": 2.2, "learning_rate": 1.529177777777778e-05, "loss": 0.492, "step": 62400 }, { "epoch": 2.2, "learning_rate": 1.5286222222222224e-05, "loss": 0.5389, "step": 62450 }, { "epoch": 2.2, "learning_rate": 1.5280666666666668e-05, "loss": 0.5189, "step": 62500 }, { "epoch": 2.2, "eval_loss": 0.30855029821395874, "eval_runtime": 17.827, "eval_samples_per_second": 79.655, "eval_steps_per_second": 4.992, "eval_wer": 0.22728510483797768, "step": 62500 }, { "epoch": 2.2, "learning_rate": 1.527511111111111e-05, "loss": 0.5279, "step": 62550 }, { "epoch": 2.2, "learning_rate": 1.5269555555555558e-05, "loss": 0.5, "step": 62600 }, { "epoch": 2.21, "learning_rate": 1.5264e-05, "loss": 0.4906, "step": 62650 }, { "epoch": 2.21, "learning_rate": 1.5258444444444445e-05, "loss": 0.5271, "step": 62700 }, { "epoch": 2.21, "learning_rate": 1.525288888888889e-05, "loss": 0.5663, "step": 62750 }, { "epoch": 2.21, "learning_rate": 1.5247333333333334e-05, "loss": 0.5153, "step": 62800 }, { "epoch": 2.21, "learning_rate": 1.524177777777778e-05, "loss": 0.5254, "step": 62850 }, { "epoch": 2.21, "learning_rate": 1.5236222222222223e-05, "loss": 0.4774, "step": 62900 }, { "epoch": 2.22, "learning_rate": 1.5230666666666666e-05, "loss": 0.517, "step": 62950 }, { "epoch": 2.22, "learning_rate": 1.5225111111111113e-05, "loss": 0.5256, "step": 63000 }, { "epoch": 2.22, "learning_rate": 1.5219555555555557e-05, "loss": 0.4851, "step": 63050 }, { "epoch": 2.22, "learning_rate": 1.5214000000000002e-05, "loss": 0.6529, "step": 63100 }, { "epoch": 2.22, "learning_rate": 1.5208444444444446e-05, "loss": 0.6696, "step": 63150 }, { "epoch": 2.23, "learning_rate": 1.520288888888889e-05, "loss": 0.513, "step": 63200 }, { "epoch": 2.23, "learning_rate": 1.5197333333333334e-05, "loss": 0.4848, "step": 63250 }, { "epoch": 2.23, "learning_rate": 1.519188888888889e-05, "loss": 0.5197, "step": 63300 }, { "epoch": 2.23, "learning_rate": 1.5186333333333334e-05, "loss": 0.4979, "step": 63350 }, { "epoch": 2.23, "learning_rate": 1.518077777777778e-05, "loss": 0.5077, "step": 63400 }, { "epoch": 2.23, "learning_rate": 1.5175222222222223e-05, "loss": 0.5273, "step": 63450 }, { "epoch": 2.24, "learning_rate": 1.5169666666666666e-05, "loss": 0.5514, "step": 63500 }, { "epoch": 2.24, "learning_rate": 1.5164111111111113e-05, "loss": 0.516, "step": 63550 }, { "epoch": 2.24, "learning_rate": 1.5158555555555557e-05, "loss": 0.5337, "step": 63600 }, { "epoch": 2.24, "learning_rate": 1.5153000000000002e-05, "loss": 0.5544, "step": 63650 }, { "epoch": 2.24, "learning_rate": 1.5147444444444446e-05, "loss": 0.5044, "step": 63700 }, { "epoch": 2.24, "learning_rate": 1.514188888888889e-05, "loss": 0.5137, "step": 63750 }, { "epoch": 2.25, "learning_rate": 1.5136333333333334e-05, "loss": 0.4702, "step": 63800 }, { "epoch": 2.25, "learning_rate": 1.5130777777777778e-05, "loss": 0.4631, "step": 63850 }, { "epoch": 2.25, "learning_rate": 1.5125222222222225e-05, "loss": 0.5794, "step": 63900 }, { "epoch": 2.25, "learning_rate": 1.5119666666666669e-05, "loss": 0.5355, "step": 63950 }, { "epoch": 2.25, "learning_rate": 1.5114111111111112e-05, "loss": 0.4866, "step": 64000 }, { "epoch": 2.26, "learning_rate": 1.5108555555555557e-05, "loss": 0.5323, "step": 64050 }, { "epoch": 2.26, "learning_rate": 1.5103000000000001e-05, "loss": 0.5234, "step": 64100 }, { "epoch": 2.26, "learning_rate": 1.5097444444444444e-05, "loss": 0.5186, "step": 64150 }, { "epoch": 2.26, "learning_rate": 1.509188888888889e-05, "loss": 0.5033, "step": 64200 }, { "epoch": 2.26, "learning_rate": 1.5086333333333333e-05, "loss": 0.5094, "step": 64250 }, { "epoch": 2.26, "learning_rate": 1.508077777777778e-05, "loss": 0.5175, "step": 64300 }, { "epoch": 2.27, "learning_rate": 1.5075222222222224e-05, "loss": 0.5219, "step": 64350 }, { "epoch": 2.27, "learning_rate": 1.5069666666666667e-05, "loss": 0.4876, "step": 64400 }, { "epoch": 2.27, "learning_rate": 1.5064111111111113e-05, "loss": 0.5355, "step": 64450 }, { "epoch": 2.27, "learning_rate": 1.5058555555555556e-05, "loss": 0.5126, "step": 64500 }, { "epoch": 2.27, "learning_rate": 1.5053000000000001e-05, "loss": 0.505, "step": 64550 }, { "epoch": 2.27, "learning_rate": 1.5047444444444445e-05, "loss": 0.5651, "step": 64600 }, { "epoch": 2.28, "learning_rate": 1.5041888888888889e-05, "loss": 0.489, "step": 64650 }, { "epoch": 2.28, "learning_rate": 1.5036333333333335e-05, "loss": 0.4957, "step": 64700 }, { "epoch": 2.28, "learning_rate": 1.5030777777777779e-05, "loss": 0.6336, "step": 64750 }, { "epoch": 2.28, "learning_rate": 1.5025222222222224e-05, "loss": 0.5196, "step": 64800 }, { "epoch": 2.28, "learning_rate": 1.5019666666666668e-05, "loss": 0.4723, "step": 64850 }, { "epoch": 2.29, "learning_rate": 1.5014111111111111e-05, "loss": 0.5317, "step": 64900 }, { "epoch": 2.29, "learning_rate": 1.5008555555555557e-05, "loss": 0.5426, "step": 64950 }, { "epoch": 2.29, "learning_rate": 1.5003e-05, "loss": 0.4993, "step": 65000 }, { "epoch": 2.29, "eval_loss": 0.30048081278800964, "eval_runtime": 27.17, "eval_samples_per_second": 52.264, "eval_steps_per_second": 3.276, "eval_wer": 0.22447127167105382, "step": 65000 }, { "epoch": 2.29, "learning_rate": 1.4997444444444447e-05, "loss": 0.5427, "step": 65050 }, { "epoch": 2.29, "learning_rate": 1.499188888888889e-05, "loss": 0.4956, "step": 65100 }, { "epoch": 2.29, "learning_rate": 1.4986333333333334e-05, "loss": 0.513, "step": 65150 }, { "epoch": 2.3, "learning_rate": 1.498077777777778e-05, "loss": 0.4675, "step": 65200 }, { "epoch": 2.3, "learning_rate": 1.4975222222222223e-05, "loss": 0.5054, "step": 65250 }, { "epoch": 2.3, "learning_rate": 1.4969666666666667e-05, "loss": 0.528, "step": 65300 }, { "epoch": 2.3, "learning_rate": 1.4964111111111112e-05, "loss": 0.5178, "step": 65350 }, { "epoch": 2.3, "learning_rate": 1.4958555555555555e-05, "loss": 0.4871, "step": 65400 }, { "epoch": 2.3, "learning_rate": 1.4953000000000002e-05, "loss": 0.4835, "step": 65450 }, { "epoch": 2.31, "learning_rate": 1.4947444444444446e-05, "loss": 0.5237, "step": 65500 }, { "epoch": 2.31, "learning_rate": 1.494188888888889e-05, "loss": 0.481, "step": 65550 }, { "epoch": 2.31, "learning_rate": 1.4936333333333335e-05, "loss": 0.5751, "step": 65600 }, { "epoch": 2.31, "learning_rate": 1.4930777777777778e-05, "loss": 0.5079, "step": 65650 }, { "epoch": 2.31, "learning_rate": 1.4925222222222224e-05, "loss": 0.489, "step": 65700 }, { "epoch": 2.31, "learning_rate": 1.4919666666666667e-05, "loss": 0.4996, "step": 65750 }, { "epoch": 2.32, "learning_rate": 1.491411111111111e-05, "loss": 0.4889, "step": 65800 }, { "epoch": 2.32, "learning_rate": 1.4908555555555558e-05, "loss": 0.4452, "step": 65850 }, { "epoch": 2.32, "learning_rate": 1.4903000000000001e-05, "loss": 0.4923, "step": 65900 }, { "epoch": 2.32, "learning_rate": 1.4897444444444446e-05, "loss": 0.5002, "step": 65950 }, { "epoch": 2.32, "learning_rate": 1.489188888888889e-05, "loss": 0.5052, "step": 66000 }, { "epoch": 2.33, "learning_rate": 1.4886333333333334e-05, "loss": 0.4834, "step": 66050 }, { "epoch": 2.33, "learning_rate": 1.4880777777777779e-05, "loss": 0.544, "step": 66100 }, { "epoch": 2.33, "learning_rate": 1.4875222222222222e-05, "loss": 0.5031, "step": 66150 }, { "epoch": 2.33, "learning_rate": 1.486966666666667e-05, "loss": 0.5012, "step": 66200 }, { "epoch": 2.33, "learning_rate": 1.4864111111111113e-05, "loss": 0.542, "step": 66250 }, { "epoch": 2.33, "learning_rate": 1.4858555555555556e-05, "loss": 0.5163, "step": 66300 }, { "epoch": 2.34, "learning_rate": 1.4853000000000002e-05, "loss": 0.5318, "step": 66350 }, { "epoch": 2.34, "learning_rate": 1.4847666666666667e-05, "loss": 0.8092, "step": 66400 }, { "epoch": 2.34, "learning_rate": 1.4842111111111112e-05, "loss": 0.5349, "step": 66450 }, { "epoch": 2.34, "learning_rate": 1.4836555555555556e-05, "loss": 0.5643, "step": 66500 }, { "epoch": 2.34, "learning_rate": 1.4831000000000003e-05, "loss": 0.5056, "step": 66550 }, { "epoch": 2.34, "learning_rate": 1.4825444444444446e-05, "loss": 0.56, "step": 66600 }, { "epoch": 2.35, "learning_rate": 1.481988888888889e-05, "loss": 0.519, "step": 66650 }, { "epoch": 2.35, "learning_rate": 1.4814333333333335e-05, "loss": 0.4727, "step": 66700 }, { "epoch": 2.35, "learning_rate": 1.4808777777777778e-05, "loss": 0.481, "step": 66750 }, { "epoch": 2.35, "learning_rate": 1.4803222222222224e-05, "loss": 0.4731, "step": 66800 }, { "epoch": 2.35, "learning_rate": 1.4797666666666667e-05, "loss": 0.6271, "step": 66850 }, { "epoch": 2.36, "learning_rate": 1.479211111111111e-05, "loss": 0.5222, "step": 66900 }, { "epoch": 2.36, "learning_rate": 1.4786555555555558e-05, "loss": 0.5272, "step": 66950 }, { "epoch": 2.36, "learning_rate": 1.4781000000000001e-05, "loss": 0.4851, "step": 67000 }, { "epoch": 2.36, "learning_rate": 1.4775444444444447e-05, "loss": 0.5465, "step": 67050 }, { "epoch": 2.36, "learning_rate": 1.476988888888889e-05, "loss": 0.5764, "step": 67100 }, { "epoch": 2.36, "learning_rate": 1.4764333333333334e-05, "loss": 0.5382, "step": 67150 }, { "epoch": 2.37, "learning_rate": 1.475888888888889e-05, "loss": 0.5516, "step": 67200 }, { "epoch": 2.37, "learning_rate": 1.4753333333333335e-05, "loss": 0.5642, "step": 67250 }, { "epoch": 2.37, "learning_rate": 1.4747777777777779e-05, "loss": 0.5138, "step": 67300 }, { "epoch": 2.37, "learning_rate": 1.4742222222222224e-05, "loss": 0.4901, "step": 67350 }, { "epoch": 2.37, "learning_rate": 1.4736666666666667e-05, "loss": 0.5497, "step": 67400 }, { "epoch": 2.37, "learning_rate": 1.4731111111111111e-05, "loss": 0.5167, "step": 67450 }, { "epoch": 2.38, "learning_rate": 1.4725555555555558e-05, "loss": 0.5156, "step": 67500 }, { "epoch": 2.38, "eval_loss": 0.29976242780685425, "eval_runtime": 11.8857, "eval_samples_per_second": 119.472, "eval_steps_per_second": 7.488, "eval_wer": 0.22229282018698376, "step": 67500 }, { "epoch": 2.38, "learning_rate": 1.4720000000000001e-05, "loss": 0.5023, "step": 67550 }, { "epoch": 2.38, "learning_rate": 1.4714444444444447e-05, "loss": 0.5064, "step": 67600 }, { "epoch": 2.38, "learning_rate": 1.470888888888889e-05, "loss": 0.5769, "step": 67650 }, { "epoch": 2.38, "learning_rate": 1.4703333333333334e-05, "loss": 0.4776, "step": 67700 }, { "epoch": 2.39, "learning_rate": 1.4697777777777779e-05, "loss": 0.5187, "step": 67750 }, { "epoch": 2.39, "learning_rate": 1.4692222222222223e-05, "loss": 0.4884, "step": 67800 }, { "epoch": 2.39, "learning_rate": 1.4686666666666666e-05, "loss": 0.4971, "step": 67850 }, { "epoch": 2.39, "learning_rate": 1.4681111111111113e-05, "loss": 0.5041, "step": 67900 }, { "epoch": 2.39, "learning_rate": 1.4675555555555557e-05, "loss": 0.5033, "step": 67950 }, { "epoch": 2.39, "learning_rate": 1.4670000000000002e-05, "loss": 0.4824, "step": 68000 }, { "epoch": 2.4, "learning_rate": 1.4664444444444445e-05, "loss": 0.6615, "step": 68050 }, { "epoch": 2.4, "learning_rate": 1.4658888888888889e-05, "loss": 0.4916, "step": 68100 }, { "epoch": 2.4, "learning_rate": 1.4653333333333334e-05, "loss": 0.5595, "step": 68150 }, { "epoch": 2.4, "learning_rate": 1.4647777777777778e-05, "loss": 0.504, "step": 68200 }, { "epoch": 2.4, "learning_rate": 1.4642222222222225e-05, "loss": 0.4777, "step": 68250 }, { "epoch": 2.4, "learning_rate": 1.4636666666666668e-05, "loss": 0.5201, "step": 68300 }, { "epoch": 2.41, "learning_rate": 1.4631111111111112e-05, "loss": 0.5932, "step": 68350 }, { "epoch": 2.41, "learning_rate": 1.4625555555555557e-05, "loss": 0.4799, "step": 68400 }, { "epoch": 2.41, "learning_rate": 1.462e-05, "loss": 0.4508, "step": 68450 }, { "epoch": 2.41, "learning_rate": 1.4614444444444446e-05, "loss": 0.4984, "step": 68500 }, { "epoch": 2.41, "learning_rate": 1.460888888888889e-05, "loss": 0.4788, "step": 68550 }, { "epoch": 2.42, "learning_rate": 1.4603333333333333e-05, "loss": 0.6557, "step": 68600 }, { "epoch": 2.42, "learning_rate": 1.459777777777778e-05, "loss": 0.6037, "step": 68650 }, { "epoch": 2.42, "learning_rate": 1.4592222222222223e-05, "loss": 0.5046, "step": 68700 }, { "epoch": 2.42, "learning_rate": 1.4586666666666667e-05, "loss": 0.4739, "step": 68750 }, { "epoch": 2.42, "learning_rate": 1.4581111111111112e-05, "loss": 0.5983, "step": 68800 }, { "epoch": 2.42, "learning_rate": 1.4575555555555556e-05, "loss": 0.5119, "step": 68850 }, { "epoch": 2.43, "learning_rate": 1.4570000000000001e-05, "loss": 0.545, "step": 68900 }, { "epoch": 2.43, "learning_rate": 1.4564444444444445e-05, "loss": 0.4929, "step": 68950 }, { "epoch": 2.43, "learning_rate": 1.455888888888889e-05, "loss": 0.5099, "step": 69000 }, { "epoch": 2.43, "learning_rate": 1.4553333333333335e-05, "loss": 0.4977, "step": 69050 }, { "epoch": 2.43, "learning_rate": 1.4547777777777779e-05, "loss": 0.601, "step": 69100 }, { "epoch": 2.43, "learning_rate": 1.4542222222222224e-05, "loss": 0.4997, "step": 69150 }, { "epoch": 2.44, "learning_rate": 1.4536666666666668e-05, "loss": 0.4976, "step": 69200 }, { "epoch": 2.44, "learning_rate": 1.4531111111111111e-05, "loss": 0.4833, "step": 69250 }, { "epoch": 2.44, "learning_rate": 1.4525555555555558e-05, "loss": 0.5333, "step": 69300 }, { "epoch": 2.44, "learning_rate": 1.4520000000000002e-05, "loss": 0.4947, "step": 69350 }, { "epoch": 2.44, "learning_rate": 1.4514444444444447e-05, "loss": 0.4949, "step": 69400 }, { "epoch": 2.45, "learning_rate": 1.450888888888889e-05, "loss": 0.4751, "step": 69450 }, { "epoch": 2.45, "learning_rate": 1.4503333333333334e-05, "loss": 0.4843, "step": 69500 }, { "epoch": 2.45, "learning_rate": 1.449777777777778e-05, "loss": 0.5145, "step": 69550 }, { "epoch": 2.45, "learning_rate": 1.4492222222222223e-05, "loss": 0.5, "step": 69600 }, { "epoch": 2.45, "learning_rate": 1.448666666666667e-05, "loss": 0.5081, "step": 69650 }, { "epoch": 2.45, "learning_rate": 1.4481111111111113e-05, "loss": 0.4867, "step": 69700 }, { "epoch": 2.46, "learning_rate": 1.4475555555555557e-05, "loss": 0.4912, "step": 69750 }, { "epoch": 2.46, "learning_rate": 1.4470000000000002e-05, "loss": 0.5019, "step": 69800 }, { "epoch": 2.46, "learning_rate": 1.4464444444444446e-05, "loss": 0.5059, "step": 69850 }, { "epoch": 2.46, "learning_rate": 1.445888888888889e-05, "loss": 0.51, "step": 69900 }, { "epoch": 2.46, "learning_rate": 1.4453333333333334e-05, "loss": 0.506, "step": 69950 }, { "epoch": 2.46, "learning_rate": 1.4447777777777778e-05, "loss": 0.4787, "step": 70000 }, { "epoch": 2.46, "eval_loss": 0.29399725794792175, "eval_runtime": 20.3488, "eval_samples_per_second": 69.783, "eval_steps_per_second": 4.374, "eval_wer": 0.21730053553598982, "step": 70000 }, { "epoch": 2.47, "learning_rate": 1.4442222222222225e-05, "loss": 0.5145, "step": 70050 }, { "epoch": 2.47, "learning_rate": 1.4436666666666668e-05, "loss": 0.4893, "step": 70100 }, { "epoch": 2.47, "learning_rate": 1.4431111111111112e-05, "loss": 0.4683, "step": 70150 }, { "epoch": 2.47, "learning_rate": 1.4425555555555557e-05, "loss": 0.4993, "step": 70200 }, { "epoch": 2.47, "learning_rate": 1.4420000000000001e-05, "loss": 0.5134, "step": 70250 }, { "epoch": 2.48, "learning_rate": 1.4414444444444446e-05, "loss": 0.545, "step": 70300 }, { "epoch": 2.48, "learning_rate": 1.440888888888889e-05, "loss": 0.5423, "step": 70350 }, { "epoch": 2.48, "learning_rate": 1.4403333333333333e-05, "loss": 0.4912, "step": 70400 }, { "epoch": 2.48, "learning_rate": 1.439777777777778e-05, "loss": 0.5026, "step": 70450 }, { "epoch": 2.48, "learning_rate": 1.4392222222222224e-05, "loss": 0.5025, "step": 70500 }, { "epoch": 2.48, "learning_rate": 1.4386666666666669e-05, "loss": 0.5125, "step": 70550 }, { "epoch": 2.49, "learning_rate": 1.4381111111111113e-05, "loss": 0.5165, "step": 70600 }, { "epoch": 2.49, "learning_rate": 1.4375555555555556e-05, "loss": 0.472, "step": 70650 }, { "epoch": 2.49, "learning_rate": 1.4370000000000001e-05, "loss": 0.5107, "step": 70700 }, { "epoch": 2.49, "learning_rate": 1.4364444444444445e-05, "loss": 0.5011, "step": 70750 }, { "epoch": 2.49, "learning_rate": 1.4358888888888892e-05, "loss": 0.4609, "step": 70800 }, { "epoch": 2.49, "learning_rate": 1.4353333333333335e-05, "loss": 0.5209, "step": 70850 }, { "epoch": 2.5, "learning_rate": 1.4347777777777779e-05, "loss": 0.4946, "step": 70900 }, { "epoch": 2.5, "learning_rate": 1.4342222222222224e-05, "loss": 0.531, "step": 70950 }, { "epoch": 2.5, "learning_rate": 1.4336666666666668e-05, "loss": 0.4813, "step": 71000 }, { "epoch": 2.5, "learning_rate": 1.4331111111111111e-05, "loss": 0.5104, "step": 71050 }, { "epoch": 2.5, "learning_rate": 1.4325555555555557e-05, "loss": 0.5025, "step": 71100 }, { "epoch": 2.51, "learning_rate": 1.432e-05, "loss": 0.4931, "step": 71150 }, { "epoch": 2.51, "learning_rate": 1.4314444444444447e-05, "loss": 0.4744, "step": 71200 }, { "epoch": 2.51, "learning_rate": 1.430888888888889e-05, "loss": 0.4829, "step": 71250 }, { "epoch": 2.51, "learning_rate": 1.4303333333333334e-05, "loss": 0.4585, "step": 71300 }, { "epoch": 2.51, "learning_rate": 1.429777777777778e-05, "loss": 0.498, "step": 71350 }, { "epoch": 2.51, "learning_rate": 1.4292222222222223e-05, "loss": 0.6953, "step": 71400 }, { "epoch": 2.52, "learning_rate": 1.4286666666666668e-05, "loss": 0.4883, "step": 71450 }, { "epoch": 2.52, "learning_rate": 1.4281111111111112e-05, "loss": 0.4842, "step": 71500 }, { "epoch": 2.52, "learning_rate": 1.4275555555555555e-05, "loss": 0.5308, "step": 71550 }, { "epoch": 2.52, "learning_rate": 1.4270111111111111e-05, "loss": 0.655, "step": 71600 }, { "epoch": 2.52, "learning_rate": 1.4264555555555557e-05, "loss": 0.5366, "step": 71650 }, { "epoch": 2.52, "learning_rate": 1.4259e-05, "loss": 0.4806, "step": 71700 }, { "epoch": 2.53, "learning_rate": 1.4253444444444447e-05, "loss": 0.4832, "step": 71750 }, { "epoch": 2.53, "learning_rate": 1.424788888888889e-05, "loss": 0.5365, "step": 71800 }, { "epoch": 2.53, "learning_rate": 1.4242333333333334e-05, "loss": 0.4717, "step": 71850 }, { "epoch": 2.53, "learning_rate": 1.423677777777778e-05, "loss": 0.4892, "step": 71900 }, { "epoch": 2.53, "learning_rate": 1.4231222222222223e-05, "loss": 0.4812, "step": 71950 }, { "epoch": 2.54, "learning_rate": 1.4225666666666668e-05, "loss": 0.5184, "step": 72000 }, { "epoch": 2.54, "learning_rate": 1.4220111111111112e-05, "loss": 0.485, "step": 72050 }, { "epoch": 2.54, "learning_rate": 1.4214555555555555e-05, "loss": 0.4744, "step": 72100 }, { "epoch": 2.54, "learning_rate": 1.4209000000000002e-05, "loss": 0.5018, "step": 72150 }, { "epoch": 2.54, "learning_rate": 1.4203444444444446e-05, "loss": 0.49, "step": 72200 }, { "epoch": 2.54, "learning_rate": 1.4198e-05, "loss": 0.8148, "step": 72250 }, { "epoch": 2.55, "learning_rate": 1.4192444444444447e-05, "loss": 0.4992, "step": 72300 }, { "epoch": 2.55, "learning_rate": 1.418688888888889e-05, "loss": 0.5138, "step": 72350 }, { "epoch": 2.55, "learning_rate": 1.4181333333333334e-05, "loss": 0.4772, "step": 72400 }, { "epoch": 2.55, "learning_rate": 1.417577777777778e-05, "loss": 0.5495, "step": 72450 }, { "epoch": 2.55, "learning_rate": 1.4170222222222223e-05, "loss": 0.5296, "step": 72500 }, { "epoch": 2.55, "eval_loss": 0.3003145456314087, "eval_runtime": 90.3862, "eval_samples_per_second": 15.71, "eval_steps_per_second": 0.985, "eval_wer": 0.22247435781065625, "step": 72500 }, { "epoch": 2.55, "learning_rate": 1.4164666666666668e-05, "loss": 0.4633, "step": 72550 }, { "epoch": 2.56, "learning_rate": 1.4159111111111112e-05, "loss": 0.5736, "step": 72600 }, { "epoch": 2.56, "learning_rate": 1.4153555555555555e-05, "loss": 0.5376, "step": 72650 }, { "epoch": 2.56, "learning_rate": 1.4148000000000002e-05, "loss": 0.4853, "step": 72700 }, { "epoch": 2.56, "learning_rate": 1.4142444444444446e-05, "loss": 0.4798, "step": 72750 }, { "epoch": 2.56, "learning_rate": 1.4136888888888891e-05, "loss": 0.5108, "step": 72800 }, { "epoch": 2.56, "learning_rate": 1.4131333333333335e-05, "loss": 0.4903, "step": 72850 }, { "epoch": 2.57, "learning_rate": 1.4125777777777778e-05, "loss": 0.4925, "step": 72900 }, { "epoch": 2.57, "learning_rate": 1.4120222222222224e-05, "loss": 0.4871, "step": 72950 }, { "epoch": 2.57, "learning_rate": 1.4114666666666667e-05, "loss": 0.5103, "step": 73000 }, { "epoch": 2.57, "learning_rate": 1.410911111111111e-05, "loss": 0.4777, "step": 73050 }, { "epoch": 2.57, "learning_rate": 1.4103555555555558e-05, "loss": 0.559, "step": 73100 }, { "epoch": 2.58, "learning_rate": 1.4098000000000001e-05, "loss": 0.4943, "step": 73150 }, { "epoch": 2.58, "learning_rate": 1.4092444444444446e-05, "loss": 0.4791, "step": 73200 }, { "epoch": 2.58, "learning_rate": 1.408688888888889e-05, "loss": 0.5141, "step": 73250 }, { "epoch": 2.58, "learning_rate": 1.4081333333333334e-05, "loss": 0.5165, "step": 73300 }, { "epoch": 2.58, "learning_rate": 1.4075777777777779e-05, "loss": 0.4746, "step": 73350 }, { "epoch": 2.58, "learning_rate": 1.4070222222222222e-05, "loss": 0.4637, "step": 73400 }, { "epoch": 2.59, "learning_rate": 1.406466666666667e-05, "loss": 0.6618, "step": 73450 }, { "epoch": 2.59, "learning_rate": 1.4059111111111113e-05, "loss": 0.4839, "step": 73500 }, { "epoch": 2.59, "learning_rate": 1.4053555555555556e-05, "loss": 0.482, "step": 73550 }, { "epoch": 2.59, "learning_rate": 1.4048000000000002e-05, "loss": 0.5254, "step": 73600 }, { "epoch": 2.59, "learning_rate": 1.4042444444444445e-05, "loss": 0.5462, "step": 73650 }, { "epoch": 2.59, "learning_rate": 1.403688888888889e-05, "loss": 0.5094, "step": 73700 }, { "epoch": 2.6, "learning_rate": 1.4031333333333334e-05, "loss": 0.4562, "step": 73750 }, { "epoch": 2.6, "learning_rate": 1.4025777777777778e-05, "loss": 0.4994, "step": 73800 }, { "epoch": 2.6, "learning_rate": 1.4020222222222225e-05, "loss": 0.4718, "step": 73850 }, { "epoch": 2.6, "learning_rate": 1.4014666666666668e-05, "loss": 0.6079, "step": 73900 }, { "epoch": 2.6, "learning_rate": 1.4009111111111113e-05, "loss": 0.477, "step": 73950 }, { "epoch": 2.61, "learning_rate": 1.4003555555555557e-05, "loss": 0.4692, "step": 74000 }, { "epoch": 2.61, "learning_rate": 1.3998e-05, "loss": 0.484, "step": 74050 }, { "epoch": 2.61, "learning_rate": 1.3992444444444446e-05, "loss": 0.5277, "step": 74100 }, { "epoch": 2.61, "learning_rate": 1.398688888888889e-05, "loss": 0.4875, "step": 74150 }, { "epoch": 2.61, "learning_rate": 1.3981333333333333e-05, "loss": 0.495, "step": 74200 }, { "epoch": 2.61, "learning_rate": 1.397577777777778e-05, "loss": 0.4925, "step": 74250 }, { "epoch": 2.62, "learning_rate": 1.3970222222222223e-05, "loss": 0.4855, "step": 74300 }, { "epoch": 2.62, "learning_rate": 1.3964666666666669e-05, "loss": 0.4916, "step": 74350 }, { "epoch": 2.62, "learning_rate": 1.3959111111111112e-05, "loss": 0.5297, "step": 74400 }, { "epoch": 2.62, "learning_rate": 1.3953555555555556e-05, "loss": 0.4743, "step": 74450 }, { "epoch": 2.62, "learning_rate": 1.3948000000000001e-05, "loss": 0.4746, "step": 74500 }, { "epoch": 2.62, "learning_rate": 1.3942444444444445e-05, "loss": 0.5209, "step": 74550 }, { "epoch": 2.63, "learning_rate": 1.3936888888888891e-05, "loss": 0.4979, "step": 74600 }, { "epoch": 2.63, "learning_rate": 1.3931333333333335e-05, "loss": 0.4853, "step": 74650 }, { "epoch": 2.63, "learning_rate": 1.3925777777777779e-05, "loss": 0.5162, "step": 74700 }, { "epoch": 2.63, "learning_rate": 1.3920222222222224e-05, "loss": 0.4694, "step": 74750 }, { "epoch": 2.63, "learning_rate": 1.3914666666666667e-05, "loss": 0.5476, "step": 74800 }, { "epoch": 2.64, "learning_rate": 1.3909111111111113e-05, "loss": 0.4958, "step": 74850 }, { "epoch": 2.64, "learning_rate": 1.3903555555555556e-05, "loss": 0.4663, "step": 74900 }, { "epoch": 2.64, "learning_rate": 1.3898e-05, "loss": 0.5113, "step": 74950 }, { "epoch": 2.64, "learning_rate": 1.3892444444444447e-05, "loss": 0.4759, "step": 75000 }, { "epoch": 2.64, "eval_loss": 0.29953446984291077, "eval_runtime": 13.9664, "eval_samples_per_second": 101.673, "eval_steps_per_second": 6.372, "eval_wer": 0.21439593355722975, "step": 75000 }, { "epoch": 2.64, "learning_rate": 1.388688888888889e-05, "loss": 0.474, "step": 75050 }, { "epoch": 2.64, "learning_rate": 1.3881333333333336e-05, "loss": 0.5201, "step": 75100 }, { "epoch": 2.65, "learning_rate": 1.3875777777777779e-05, "loss": 0.5118, "step": 75150 }, { "epoch": 2.65, "learning_rate": 1.3870222222222223e-05, "loss": 0.4705, "step": 75200 }, { "epoch": 2.65, "learning_rate": 1.3864666666666668e-05, "loss": 0.4749, "step": 75250 }, { "epoch": 2.65, "learning_rate": 1.3859111111111111e-05, "loss": 0.4649, "step": 75300 }, { "epoch": 2.65, "learning_rate": 1.3853555555555555e-05, "loss": 0.4632, "step": 75350 }, { "epoch": 2.65, "learning_rate": 1.3848000000000002e-05, "loss": 0.4704, "step": 75400 }, { "epoch": 2.66, "learning_rate": 1.3842444444444445e-05, "loss": 0.5032, "step": 75450 }, { "epoch": 2.66, "learning_rate": 1.383688888888889e-05, "loss": 0.5307, "step": 75500 }, { "epoch": 2.66, "learning_rate": 1.3831333333333334e-05, "loss": 0.507, "step": 75550 }, { "epoch": 2.66, "learning_rate": 1.3825777777777778e-05, "loss": 0.4901, "step": 75600 }, { "epoch": 2.66, "learning_rate": 1.3820222222222223e-05, "loss": 0.4719, "step": 75650 }, { "epoch": 2.67, "learning_rate": 1.3814666666666667e-05, "loss": 0.4888, "step": 75700 }, { "epoch": 2.67, "learning_rate": 1.3809111111111114e-05, "loss": 0.4815, "step": 75750 }, { "epoch": 2.67, "learning_rate": 1.3803555555555557e-05, "loss": 0.4854, "step": 75800 }, { "epoch": 2.67, "learning_rate": 1.3798e-05, "loss": 0.468, "step": 75850 }, { "epoch": 2.67, "learning_rate": 1.3792444444444446e-05, "loss": 0.4611, "step": 75900 }, { "epoch": 2.67, "learning_rate": 1.3787000000000002e-05, "loss": 0.5973, "step": 75950 }, { "epoch": 2.68, "learning_rate": 1.3781444444444446e-05, "loss": 0.4777, "step": 76000 }, { "epoch": 2.68, "learning_rate": 1.377588888888889e-05, "loss": 0.4753, "step": 76050 }, { "epoch": 2.68, "learning_rate": 1.3770333333333334e-05, "loss": 0.4902, "step": 76100 }, { "epoch": 2.68, "learning_rate": 1.3764777777777778e-05, "loss": 0.4874, "step": 76150 }, { "epoch": 2.68, "learning_rate": 1.3759222222222223e-05, "loss": 0.4833, "step": 76200 }, { "epoch": 2.68, "learning_rate": 1.3753666666666667e-05, "loss": 0.4725, "step": 76250 }, { "epoch": 2.69, "learning_rate": 1.3748111111111114e-05, "loss": 0.5042, "step": 76300 }, { "epoch": 2.69, "learning_rate": 1.3742555555555557e-05, "loss": 0.5115, "step": 76350 }, { "epoch": 2.69, "learning_rate": 1.3737e-05, "loss": 0.5192, "step": 76400 }, { "epoch": 2.69, "learning_rate": 1.3731444444444446e-05, "loss": 0.4587, "step": 76450 }, { "epoch": 2.69, "learning_rate": 1.372588888888889e-05, "loss": 0.4528, "step": 76500 }, { "epoch": 2.7, "learning_rate": 1.3720333333333335e-05, "loss": 0.4936, "step": 76550 }, { "epoch": 2.7, "learning_rate": 1.3714777777777778e-05, "loss": 0.4834, "step": 76600 }, { "epoch": 2.7, "learning_rate": 1.3709222222222222e-05, "loss": 0.4947, "step": 76650 }, { "epoch": 2.7, "learning_rate": 1.3703666666666669e-05, "loss": 0.4982, "step": 76700 }, { "epoch": 2.7, "learning_rate": 1.3698111111111112e-05, "loss": 0.4869, "step": 76750 }, { "epoch": 2.7, "learning_rate": 1.3692555555555556e-05, "loss": 0.4838, "step": 76800 }, { "epoch": 2.71, "learning_rate": 1.3687000000000001e-05, "loss": 0.4959, "step": 76850 }, { "epoch": 2.71, "learning_rate": 1.3681444444444445e-05, "loss": 0.4362, "step": 76900 }, { "epoch": 2.71, "learning_rate": 1.367588888888889e-05, "loss": 0.4858, "step": 76950 }, { "epoch": 2.71, "learning_rate": 1.3670333333333334e-05, "loss": 0.4937, "step": 77000 }, { "epoch": 2.71, "learning_rate": 1.3664777777777777e-05, "loss": 0.4549, "step": 77050 }, { "epoch": 2.71, "learning_rate": 1.3659222222222224e-05, "loss": 0.4661, "step": 77100 }, { "epoch": 2.72, "learning_rate": 1.3653666666666668e-05, "loss": 0.4878, "step": 77150 }, { "epoch": 2.72, "learning_rate": 1.3648111111111113e-05, "loss": 0.4567, "step": 77200 }, { "epoch": 2.72, "learning_rate": 1.3642555555555556e-05, "loss": 0.4606, "step": 77250 }, { "epoch": 2.72, "learning_rate": 1.3637e-05, "loss": 0.4966, "step": 77300 }, { "epoch": 2.72, "learning_rate": 1.3631444444444445e-05, "loss": 0.4548, "step": 77350 }, { "epoch": 2.73, "learning_rate": 1.3625888888888889e-05, "loss": 0.5026, "step": 77400 }, { "epoch": 2.73, "learning_rate": 1.3620333333333336e-05, "loss": 0.4965, "step": 77450 }, { "epoch": 2.73, "learning_rate": 1.361477777777778e-05, "loss": 0.485, "step": 77500 }, { "epoch": 2.73, "eval_loss": 0.28823402523994446, "eval_runtime": 7.853, "eval_samples_per_second": 180.823, "eval_steps_per_second": 11.333, "eval_wer": 0.21258055732050468, "step": 77500 }, { "epoch": 2.73, "learning_rate": 1.3609222222222223e-05, "loss": 0.4713, "step": 77550 }, { "epoch": 2.73, "learning_rate": 1.3603666666666668e-05, "loss": 0.4984, "step": 77600 }, { "epoch": 2.73, "learning_rate": 1.3598111111111112e-05, "loss": 0.4938, "step": 77650 }, { "epoch": 2.74, "learning_rate": 1.3592555555555557e-05, "loss": 0.5119, "step": 77700 }, { "epoch": 2.74, "learning_rate": 1.3587e-05, "loss": 0.477, "step": 77750 }, { "epoch": 2.74, "learning_rate": 1.3581444444444444e-05, "loss": 0.485, "step": 77800 }, { "epoch": 2.74, "learning_rate": 1.3575888888888891e-05, "loss": 0.5134, "step": 77850 }, { "epoch": 2.74, "learning_rate": 1.3570333333333335e-05, "loss": 0.4837, "step": 77900 }, { "epoch": 2.74, "learning_rate": 1.3564777777777778e-05, "loss": 0.5264, "step": 77950 }, { "epoch": 2.75, "learning_rate": 1.3559222222222223e-05, "loss": 0.5039, "step": 78000 }, { "epoch": 2.75, "learning_rate": 1.3553666666666667e-05, "loss": 0.4825, "step": 78050 }, { "epoch": 2.75, "learning_rate": 1.3548111111111112e-05, "loss": 0.4906, "step": 78100 }, { "epoch": 2.75, "learning_rate": 1.3542555555555556e-05, "loss": 0.4511, "step": 78150 }, { "epoch": 2.75, "learning_rate": 1.3537e-05, "loss": 0.4852, "step": 78200 }, { "epoch": 2.76, "learning_rate": 1.3531444444444446e-05, "loss": 0.4615, "step": 78250 }, { "epoch": 2.76, "learning_rate": 1.352588888888889e-05, "loss": 0.4497, "step": 78300 }, { "epoch": 2.76, "learning_rate": 1.3520333333333335e-05, "loss": 0.4958, "step": 78350 }, { "epoch": 2.76, "learning_rate": 1.3514777777777779e-05, "loss": 0.5124, "step": 78400 }, { "epoch": 2.76, "learning_rate": 1.3509222222222222e-05, "loss": 0.4755, "step": 78450 }, { "epoch": 2.76, "learning_rate": 1.3503666666666667e-05, "loss": 0.4973, "step": 78500 }, { "epoch": 2.77, "learning_rate": 1.3498111111111113e-05, "loss": 0.4657, "step": 78550 }, { "epoch": 2.77, "learning_rate": 1.3492555555555558e-05, "loss": 0.4751, "step": 78600 }, { "epoch": 2.77, "learning_rate": 1.3487000000000001e-05, "loss": 0.4909, "step": 78650 }, { "epoch": 2.77, "learning_rate": 1.3481444444444445e-05, "loss": 0.4831, "step": 78700 }, { "epoch": 2.77, "learning_rate": 1.347588888888889e-05, "loss": 0.5733, "step": 78750 }, { "epoch": 2.77, "learning_rate": 1.3470333333333334e-05, "loss": 0.4674, "step": 78800 }, { "epoch": 2.78, "learning_rate": 1.346477777777778e-05, "loss": 0.5188, "step": 78850 }, { "epoch": 2.78, "learning_rate": 1.3459222222222224e-05, "loss": 0.4778, "step": 78900 }, { "epoch": 2.78, "learning_rate": 1.3453666666666668e-05, "loss": 0.4544, "step": 78950 }, { "epoch": 2.78, "learning_rate": 1.3448111111111113e-05, "loss": 0.453, "step": 79000 }, { "epoch": 2.78, "learning_rate": 1.3442555555555557e-05, "loss": 0.4664, "step": 79050 }, { "epoch": 2.79, "learning_rate": 1.3437e-05, "loss": 0.4759, "step": 79100 }, { "epoch": 2.79, "learning_rate": 1.3431444444444446e-05, "loss": 0.4725, "step": 79150 }, { "epoch": 2.79, "learning_rate": 1.3425888888888889e-05, "loss": 0.4832, "step": 79200 }, { "epoch": 2.79, "learning_rate": 1.3420333333333336e-05, "loss": 0.4699, "step": 79250 }, { "epoch": 2.79, "learning_rate": 1.341477777777778e-05, "loss": 0.4687, "step": 79300 }, { "epoch": 2.79, "learning_rate": 1.3409222222222223e-05, "loss": 0.4713, "step": 79350 }, { "epoch": 2.8, "learning_rate": 1.3403666666666668e-05, "loss": 0.4507, "step": 79400 }, { "epoch": 2.8, "learning_rate": 1.3398111111111112e-05, "loss": 0.4884, "step": 79450 }, { "epoch": 2.8, "learning_rate": 1.3392555555555557e-05, "loss": 0.5252, "step": 79500 }, { "epoch": 2.8, "learning_rate": 1.3387e-05, "loss": 0.5134, "step": 79550 }, { "epoch": 2.8, "learning_rate": 1.3381444444444444e-05, "loss": 0.4883, "step": 79600 }, { "epoch": 2.8, "learning_rate": 1.3375888888888891e-05, "loss": 0.457, "step": 79650 }, { "epoch": 2.81, "learning_rate": 1.3370333333333335e-05, "loss": 0.4726, "step": 79700 }, { "epoch": 2.81, "learning_rate": 1.336477777777778e-05, "loss": 0.5077, "step": 79750 }, { "epoch": 2.81, "learning_rate": 1.3359222222222224e-05, "loss": 0.516, "step": 79800 }, { "epoch": 2.81, "learning_rate": 1.3353666666666667e-05, "loss": 0.5268, "step": 79850 }, { "epoch": 2.81, "learning_rate": 1.3348111111111112e-05, "loss": 0.4333, "step": 79900 }, { "epoch": 2.81, "learning_rate": 1.3342555555555556e-05, "loss": 0.4619, "step": 79950 }, { "epoch": 2.82, "learning_rate": 1.3337000000000003e-05, "loss": 0.4888, "step": 80000 }, { "epoch": 2.82, "eval_loss": 0.2892592251300812, "eval_runtime": 108.0657, "eval_samples_per_second": 13.14, "eval_steps_per_second": 0.824, "eval_wer": 0.21893437414904238, "step": 80000 }, { "epoch": 2.82, "learning_rate": 1.3331444444444446e-05, "loss": 0.5044, "step": 80050 }, { "epoch": 2.82, "learning_rate": 1.332588888888889e-05, "loss": 0.47, "step": 80100 }, { "epoch": 2.82, "learning_rate": 1.3320333333333335e-05, "loss": 0.5046, "step": 80150 }, { "epoch": 2.82, "learning_rate": 1.3314777777777779e-05, "loss": 0.4819, "step": 80200 }, { "epoch": 2.83, "learning_rate": 1.3309222222222222e-05, "loss": 0.4707, "step": 80250 }, { "epoch": 2.83, "learning_rate": 1.3303666666666668e-05, "loss": 0.4536, "step": 80300 }, { "epoch": 2.83, "learning_rate": 1.3298111111111111e-05, "loss": 0.4946, "step": 80350 }, { "epoch": 2.83, "learning_rate": 1.3292555555555558e-05, "loss": 0.474, "step": 80400 }, { "epoch": 2.83, "learning_rate": 1.3287000000000002e-05, "loss": 0.5379, "step": 80450 }, { "epoch": 2.83, "learning_rate": 1.3281444444444445e-05, "loss": 0.4889, "step": 80500 }, { "epoch": 2.84, "learning_rate": 1.327588888888889e-05, "loss": 0.4749, "step": 80550 }, { "epoch": 2.84, "learning_rate": 1.3270333333333334e-05, "loss": 0.5886, "step": 80600 }, { "epoch": 2.84, "learning_rate": 1.326477777777778e-05, "loss": 0.4787, "step": 80650 }, { "epoch": 2.84, "learning_rate": 1.3259222222222223e-05, "loss": 0.4808, "step": 80700 }, { "epoch": 2.84, "learning_rate": 1.3253666666666666e-05, "loss": 0.46, "step": 80750 }, { "epoch": 2.84, "learning_rate": 1.3248111111111113e-05, "loss": 0.4797, "step": 80800 }, { "epoch": 2.85, "learning_rate": 1.3242555555555557e-05, "loss": 0.5124, "step": 80850 }, { "epoch": 2.85, "learning_rate": 1.3237000000000002e-05, "loss": 0.5898, "step": 80900 }, { "epoch": 2.85, "learning_rate": 1.3231444444444446e-05, "loss": 0.503, "step": 80950 }, { "epoch": 2.85, "learning_rate": 1.322588888888889e-05, "loss": 0.4533, "step": 81000 }, { "epoch": 2.85, "learning_rate": 1.3220333333333335e-05, "loss": 0.4745, "step": 81050 }, { "epoch": 2.86, "learning_rate": 1.3214777777777778e-05, "loss": 0.4597, "step": 81100 }, { "epoch": 2.86, "learning_rate": 1.3209222222222225e-05, "loss": 0.455, "step": 81150 }, { "epoch": 2.86, "learning_rate": 1.3203666666666669e-05, "loss": 0.4871, "step": 81200 }, { "epoch": 2.86, "learning_rate": 1.3198111111111112e-05, "loss": 0.4642, "step": 81250 }, { "epoch": 2.86, "learning_rate": 1.3192555555555557e-05, "loss": 0.4756, "step": 81300 }, { "epoch": 2.86, "learning_rate": 1.3187000000000001e-05, "loss": 0.5523, "step": 81350 }, { "epoch": 2.87, "learning_rate": 1.3181444444444445e-05, "loss": 0.5078, "step": 81400 }, { "epoch": 2.87, "learning_rate": 1.317588888888889e-05, "loss": 0.4863, "step": 81450 }, { "epoch": 2.87, "learning_rate": 1.3170333333333333e-05, "loss": 0.4988, "step": 81500 }, { "epoch": 2.87, "learning_rate": 1.316477777777778e-05, "loss": 0.4821, "step": 81550 }, { "epoch": 2.87, "learning_rate": 1.3159222222222224e-05, "loss": 0.472, "step": 81600 }, { "epoch": 2.87, "learning_rate": 1.3153666666666667e-05, "loss": 0.4556, "step": 81650 }, { "epoch": 2.88, "learning_rate": 1.3148111111111113e-05, "loss": 0.4408, "step": 81700 }, { "epoch": 2.88, "learning_rate": 1.3142555555555556e-05, "loss": 0.4908, "step": 81750 }, { "epoch": 2.88, "learning_rate": 1.3137000000000001e-05, "loss": 0.5055, "step": 81800 }, { "epoch": 2.88, "learning_rate": 1.3131444444444445e-05, "loss": 0.5399, "step": 81850 }, { "epoch": 2.88, "learning_rate": 1.3125888888888889e-05, "loss": 0.534, "step": 81900 }, { "epoch": 2.89, "learning_rate": 1.3120333333333336e-05, "loss": 0.4656, "step": 81950 }, { "epoch": 2.89, "learning_rate": 1.3114777777777779e-05, "loss": 0.4512, "step": 82000 }, { "epoch": 2.89, "learning_rate": 1.3109222222222224e-05, "loss": 0.4813, "step": 82050 }, { "epoch": 2.89, "learning_rate": 1.3103666666666668e-05, "loss": 0.4523, "step": 82100 }, { "epoch": 2.89, "learning_rate": 1.3098111111111111e-05, "loss": 0.4848, "step": 82150 }, { "epoch": 2.89, "learning_rate": 1.3092666666666667e-05, "loss": 0.4811, "step": 82200 }, { "epoch": 2.9, "learning_rate": 1.3087111111111113e-05, "loss": 0.6556, "step": 82250 }, { "epoch": 2.9, "learning_rate": 1.3081555555555556e-05, "loss": 0.4524, "step": 82300 }, { "epoch": 2.9, "learning_rate": 1.3076000000000002e-05, "loss": 0.5052, "step": 82350 }, { "epoch": 2.9, "learning_rate": 1.3070444444444445e-05, "loss": 0.4908, "step": 82400 }, { "epoch": 2.9, "learning_rate": 1.3064888888888889e-05, "loss": 0.5298, "step": 82450 }, { "epoch": 2.9, "learning_rate": 1.3059333333333336e-05, "loss": 0.51, "step": 82500 }, { "epoch": 2.9, "eval_loss": 0.2767323851585388, "eval_runtime": 192.9105, "eval_samples_per_second": 7.361, "eval_steps_per_second": 0.461, "eval_wer": 0.2045929018789144, "step": 82500 }, { "epoch": 2.91, "learning_rate": 1.3053777777777779e-05, "loss": 0.4743, "step": 82550 }, { "epoch": 2.91, "learning_rate": 1.3048222222222224e-05, "loss": 0.4488, "step": 82600 }, { "epoch": 2.91, "learning_rate": 1.3042666666666668e-05, "loss": 0.4978, "step": 82650 }, { "epoch": 2.91, "learning_rate": 1.3037111111111111e-05, "loss": 0.4763, "step": 82700 }, { "epoch": 2.91, "learning_rate": 1.3031555555555557e-05, "loss": 0.4606, "step": 82750 }, { "epoch": 2.92, "learning_rate": 1.3026e-05, "loss": 0.4852, "step": 82800 }, { "epoch": 2.92, "learning_rate": 1.3020444444444444e-05, "loss": 0.4407, "step": 82850 }, { "epoch": 2.92, "learning_rate": 1.301488888888889e-05, "loss": 0.6662, "step": 82900 }, { "epoch": 2.92, "learning_rate": 1.3009333333333334e-05, "loss": 0.4731, "step": 82950 }, { "epoch": 2.92, "learning_rate": 1.300377777777778e-05, "loss": 0.5279, "step": 83000 }, { "epoch": 2.92, "learning_rate": 1.2998222222222223e-05, "loss": 0.4856, "step": 83050 }, { "epoch": 2.93, "learning_rate": 1.2992666666666667e-05, "loss": 0.5333, "step": 83100 }, { "epoch": 2.93, "learning_rate": 1.2987111111111112e-05, "loss": 0.4949, "step": 83150 }, { "epoch": 2.93, "learning_rate": 1.2981555555555556e-05, "loss": 0.4592, "step": 83200 }, { "epoch": 2.93, "learning_rate": 1.2976000000000002e-05, "loss": 0.469, "step": 83250 }, { "epoch": 2.93, "learning_rate": 1.2970555555555557e-05, "loss": 0.4921, "step": 83300 }, { "epoch": 2.93, "learning_rate": 1.2965e-05, "loss": 0.4934, "step": 83350 }, { "epoch": 2.94, "learning_rate": 1.2959444444444444e-05, "loss": 0.4678, "step": 83400 }, { "epoch": 2.94, "learning_rate": 1.2953888888888891e-05, "loss": 0.5091, "step": 83450 }, { "epoch": 2.94, "learning_rate": 1.2948333333333334e-05, "loss": 0.4548, "step": 83500 }, { "epoch": 2.94, "learning_rate": 1.294277777777778e-05, "loss": 0.457, "step": 83550 }, { "epoch": 2.94, "learning_rate": 1.2937222222222223e-05, "loss": 0.4836, "step": 83600 }, { "epoch": 2.95, "learning_rate": 1.2931666666666667e-05, "loss": 0.4687, "step": 83650 }, { "epoch": 2.95, "learning_rate": 1.2926111111111112e-05, "loss": 0.4975, "step": 83700 }, { "epoch": 2.95, "learning_rate": 1.2920555555555556e-05, "loss": 0.4679, "step": 83750 }, { "epoch": 2.95, "learning_rate": 1.2915000000000003e-05, "loss": 0.4676, "step": 83800 }, { "epoch": 2.95, "learning_rate": 1.2909444444444446e-05, "loss": 0.4448, "step": 83850 }, { "epoch": 2.95, "learning_rate": 1.290388888888889e-05, "loss": 0.4938, "step": 83900 }, { "epoch": 2.96, "learning_rate": 1.2898333333333335e-05, "loss": 0.469, "step": 83950 }, { "epoch": 2.96, "learning_rate": 1.2892777777777778e-05, "loss": 0.4657, "step": 84000 }, { "epoch": 2.96, "learning_rate": 1.2887222222222224e-05, "loss": 0.4559, "step": 84050 }, { "epoch": 2.96, "learning_rate": 1.2881666666666667e-05, "loss": 0.4587, "step": 84100 }, { "epoch": 2.96, "learning_rate": 1.2876222222222223e-05, "loss": 0.4358, "step": 84150 }, { "epoch": 2.96, "learning_rate": 1.2870666666666667e-05, "loss": 0.4313, "step": 84200 }, { "epoch": 2.97, "learning_rate": 1.2865111111111112e-05, "loss": 0.4871, "step": 84250 }, { "epoch": 2.97, "learning_rate": 1.2859555555555556e-05, "loss": 0.4552, "step": 84300 }, { "epoch": 2.97, "learning_rate": 1.2854000000000003e-05, "loss": 0.4798, "step": 84350 }, { "epoch": 2.97, "learning_rate": 1.2848444444444446e-05, "loss": 0.4702, "step": 84400 }, { "epoch": 2.97, "learning_rate": 1.284288888888889e-05, "loss": 0.483, "step": 84450 }, { "epoch": 2.98, "learning_rate": 1.2837333333333335e-05, "loss": 0.4963, "step": 84500 }, { "epoch": 2.98, "learning_rate": 1.2831777777777779e-05, "loss": 0.4553, "step": 84550 }, { "epoch": 2.98, "learning_rate": 1.2826222222222224e-05, "loss": 0.4795, "step": 84600 }, { "epoch": 2.98, "learning_rate": 1.2820666666666667e-05, "loss": 0.4835, "step": 84650 }, { "epoch": 2.98, "learning_rate": 1.2815111111111111e-05, "loss": 0.536, "step": 84700 }, { "epoch": 2.98, "learning_rate": 1.2809555555555558e-05, "loss": 0.468, "step": 84750 }, { "epoch": 2.99, "learning_rate": 1.2804000000000001e-05, "loss": 0.5001, "step": 84800 }, { "epoch": 2.99, "learning_rate": 1.2798444444444445e-05, "loss": 0.4494, "step": 84850 }, { "epoch": 2.99, "learning_rate": 1.279288888888889e-05, "loss": 0.5469, "step": 84900 }, { "epoch": 2.99, "learning_rate": 1.2787333333333334e-05, "loss": 0.4692, "step": 84950 }, { "epoch": 2.99, "learning_rate": 1.2781777777777779e-05, "loss": 0.4703, "step": 85000 }, { "epoch": 2.99, "eval_loss": 0.28990375995635986, "eval_runtime": 6.4799, "eval_samples_per_second": 219.14, "eval_steps_per_second": 13.735, "eval_wer": 0.21239901969683217, "step": 85000 }, { "epoch": 2.99, "learning_rate": 1.2776222222222223e-05, "loss": 0.481, "step": 85050 }, { "epoch": 3.0, "learning_rate": 1.2770666666666666e-05, "loss": 0.4613, "step": 85100 }, { "epoch": 3.0, "learning_rate": 1.2765111111111113e-05, "loss": 0.5013, "step": 85150 }, { "epoch": 3.0, "learning_rate": 1.2759555555555557e-05, "loss": 0.4639, "step": 85200 }, { "epoch": 3.0, "learning_rate": 1.2754000000000002e-05, "loss": 0.4834, "step": 85250 }, { "epoch": 3.0, "learning_rate": 1.2748444444444445e-05, "loss": 0.4931, "step": 85300 }, { "epoch": 3.01, "learning_rate": 1.2742888888888889e-05, "loss": 0.4702, "step": 85350 }, { "epoch": 3.01, "learning_rate": 1.2737333333333334e-05, "loss": 0.4486, "step": 85400 }, { "epoch": 3.01, "learning_rate": 1.2731777777777778e-05, "loss": 0.4782, "step": 85450 }, { "epoch": 3.01, "learning_rate": 1.2726222222222225e-05, "loss": 0.4818, "step": 85500 }, { "epoch": 3.01, "learning_rate": 1.2720666666666668e-05, "loss": 0.4725, "step": 85550 }, { "epoch": 3.01, "learning_rate": 1.2715111111111112e-05, "loss": 0.4723, "step": 85600 }, { "epoch": 3.02, "learning_rate": 1.2709555555555557e-05, "loss": 0.4871, "step": 85650 }, { "epoch": 3.02, "learning_rate": 1.2704e-05, "loss": 0.4535, "step": 85700 }, { "epoch": 3.02, "learning_rate": 1.2698444444444446e-05, "loss": 0.4609, "step": 85750 }, { "epoch": 3.02, "learning_rate": 1.269288888888889e-05, "loss": 0.5877, "step": 85800 }, { "epoch": 3.02, "learning_rate": 1.2687333333333333e-05, "loss": 0.4592, "step": 85850 }, { "epoch": 3.02, "learning_rate": 1.268177777777778e-05, "loss": 0.4604, "step": 85900 }, { "epoch": 3.03, "learning_rate": 1.2676222222222224e-05, "loss": 0.4754, "step": 85950 }, { "epoch": 3.03, "learning_rate": 1.2670666666666667e-05, "loss": 0.4439, "step": 86000 }, { "epoch": 3.03, "learning_rate": 1.2665111111111112e-05, "loss": 0.494, "step": 86050 }, { "epoch": 3.03, "learning_rate": 1.2659555555555556e-05, "loss": 0.4835, "step": 86100 }, { "epoch": 3.03, "learning_rate": 1.2654000000000001e-05, "loss": 0.4709, "step": 86150 }, { "epoch": 3.03, "learning_rate": 1.2648444444444445e-05, "loss": 0.5342, "step": 86200 }, { "epoch": 3.04, "learning_rate": 1.2642888888888888e-05, "loss": 0.5081, "step": 86250 }, { "epoch": 3.04, "learning_rate": 1.2637333333333335e-05, "loss": 0.4571, "step": 86300 }, { "epoch": 3.04, "learning_rate": 1.2631777777777779e-05, "loss": 0.4627, "step": 86350 }, { "epoch": 3.04, "learning_rate": 1.2626222222222224e-05, "loss": 0.4583, "step": 86400 }, { "epoch": 3.04, "learning_rate": 1.2620666666666668e-05, "loss": 0.4655, "step": 86450 }, { "epoch": 3.05, "learning_rate": 1.2615111111111111e-05, "loss": 0.4903, "step": 86500 }, { "epoch": 3.05, "learning_rate": 1.2609555555555556e-05, "loss": 0.5361, "step": 86550 }, { "epoch": 3.05, "learning_rate": 1.2604e-05, "loss": 0.495, "step": 86600 }, { "epoch": 3.05, "learning_rate": 1.2598444444444447e-05, "loss": 0.4586, "step": 86650 }, { "epoch": 3.05, "learning_rate": 1.259288888888889e-05, "loss": 0.4813, "step": 86700 }, { "epoch": 3.05, "learning_rate": 1.2587333333333334e-05, "loss": 0.4722, "step": 86750 }, { "epoch": 3.06, "learning_rate": 1.258177777777778e-05, "loss": 0.4824, "step": 86800 }, { "epoch": 3.06, "learning_rate": 1.2576222222222223e-05, "loss": 0.4411, "step": 86850 }, { "epoch": 3.06, "learning_rate": 1.2570666666666668e-05, "loss": 0.4585, "step": 86900 }, { "epoch": 3.06, "learning_rate": 1.2565111111111112e-05, "loss": 0.4716, "step": 86950 }, { "epoch": 3.06, "learning_rate": 1.2559555555555555e-05, "loss": 0.4646, "step": 87000 }, { "epoch": 3.06, "learning_rate": 1.2554000000000002e-05, "loss": 0.6259, "step": 87050 }, { "epoch": 3.07, "learning_rate": 1.2548444444444446e-05, "loss": 0.4555, "step": 87100 }, { "epoch": 3.07, "learning_rate": 1.254288888888889e-05, "loss": 0.4359, "step": 87150 }, { "epoch": 3.07, "learning_rate": 1.2537333333333334e-05, "loss": 0.4617, "step": 87200 }, { "epoch": 3.07, "learning_rate": 1.2531777777777778e-05, "loss": 0.4929, "step": 87250 }, { "epoch": 3.07, "learning_rate": 1.2526222222222223e-05, "loss": 0.4587, "step": 87300 }, { "epoch": 3.08, "learning_rate": 1.2520666666666667e-05, "loss": 0.5065, "step": 87350 }, { "epoch": 3.08, "learning_rate": 1.251511111111111e-05, "loss": 0.4911, "step": 87400 }, { "epoch": 3.08, "learning_rate": 1.2509555555555557e-05, "loss": 0.4398, "step": 87450 }, { "epoch": 3.08, "learning_rate": 1.2504000000000001e-05, "loss": 0.4406, "step": 87500 }, { "epoch": 3.08, "eval_loss": 0.2786855399608612, "eval_runtime": 33.2311, "eval_samples_per_second": 42.731, "eval_steps_per_second": 2.678, "eval_wer": 0.20677135336298447, "step": 87500 }, { "epoch": 3.08, "learning_rate": 1.2498444444444446e-05, "loss": 0.4437, "step": 87550 }, { "epoch": 3.08, "learning_rate": 1.249288888888889e-05, "loss": 0.4972, "step": 87600 }, { "epoch": 3.09, "learning_rate": 1.2487333333333333e-05, "loss": 0.4606, "step": 87650 }, { "epoch": 3.09, "learning_rate": 1.2481777777777779e-05, "loss": 0.5049, "step": 87700 }, { "epoch": 3.09, "learning_rate": 1.2476222222222222e-05, "loss": 0.4714, "step": 87750 }, { "epoch": 3.09, "learning_rate": 1.2470666666666669e-05, "loss": 0.5037, "step": 87800 }, { "epoch": 3.09, "learning_rate": 1.2465111111111113e-05, "loss": 0.5244, "step": 87850 }, { "epoch": 3.09, "learning_rate": 1.2459555555555556e-05, "loss": 0.4877, "step": 87900 }, { "epoch": 3.1, "learning_rate": 1.2454000000000001e-05, "loss": 0.4725, "step": 87950 }, { "epoch": 3.1, "learning_rate": 1.2448444444444445e-05, "loss": 0.4503, "step": 88000 }, { "epoch": 3.1, "learning_rate": 1.244288888888889e-05, "loss": 0.4812, "step": 88050 }, { "epoch": 3.1, "learning_rate": 1.2437333333333335e-05, "loss": 0.4552, "step": 88100 }, { "epoch": 3.1, "learning_rate": 1.2431777777777779e-05, "loss": 0.4801, "step": 88150 }, { "epoch": 3.11, "learning_rate": 1.2426222222222224e-05, "loss": 0.4854, "step": 88200 }, { "epoch": 3.11, "learning_rate": 1.2420666666666668e-05, "loss": 0.494, "step": 88250 }, { "epoch": 3.11, "learning_rate": 1.2415222222222222e-05, "loss": 0.6009, "step": 88300 }, { "epoch": 3.11, "learning_rate": 1.2409666666666669e-05, "loss": 0.438, "step": 88350 }, { "epoch": 3.11, "learning_rate": 1.2404111111111113e-05, "loss": 0.4636, "step": 88400 }, { "epoch": 3.11, "learning_rate": 1.2398555555555556e-05, "loss": 0.4701, "step": 88450 }, { "epoch": 3.12, "learning_rate": 1.2393000000000001e-05, "loss": 0.4491, "step": 88500 }, { "epoch": 3.12, "learning_rate": 1.2387444444444445e-05, "loss": 0.469, "step": 88550 }, { "epoch": 3.12, "learning_rate": 1.2381888888888889e-05, "loss": 0.4729, "step": 88600 }, { "epoch": 3.12, "learning_rate": 1.2376333333333334e-05, "loss": 0.471, "step": 88650 }, { "epoch": 3.12, "learning_rate": 1.2370777777777777e-05, "loss": 0.4787, "step": 88700 }, { "epoch": 3.12, "learning_rate": 1.2365222222222224e-05, "loss": 0.4569, "step": 88750 }, { "epoch": 3.13, "learning_rate": 1.2359666666666668e-05, "loss": 0.4787, "step": 88800 }, { "epoch": 3.13, "learning_rate": 1.2354111111111111e-05, "loss": 0.4534, "step": 88850 }, { "epoch": 3.13, "learning_rate": 1.2348555555555557e-05, "loss": 0.4884, "step": 88900 }, { "epoch": 3.13, "learning_rate": 1.2343e-05, "loss": 0.4638, "step": 88950 }, { "epoch": 3.13, "learning_rate": 1.2337444444444445e-05, "loss": 0.4636, "step": 89000 }, { "epoch": 3.14, "learning_rate": 1.233188888888889e-05, "loss": 0.4799, "step": 89050 }, { "epoch": 3.14, "learning_rate": 1.2326444444444445e-05, "loss": 0.4665, "step": 89100 }, { "epoch": 3.14, "learning_rate": 1.2320888888888889e-05, "loss": 0.4556, "step": 89150 }, { "epoch": 3.14, "learning_rate": 1.2315333333333334e-05, "loss": 0.5512, "step": 89200 }, { "epoch": 3.14, "learning_rate": 1.2309777777777777e-05, "loss": 0.4629, "step": 89250 }, { "epoch": 3.14, "learning_rate": 1.2304222222222224e-05, "loss": 0.4732, "step": 89300 }, { "epoch": 3.15, "learning_rate": 1.2298666666666668e-05, "loss": 0.4386, "step": 89350 }, { "epoch": 3.15, "learning_rate": 1.2293111111111112e-05, "loss": 0.473, "step": 89400 }, { "epoch": 3.15, "learning_rate": 1.2287555555555557e-05, "loss": 0.5243, "step": 89450 }, { "epoch": 3.15, "learning_rate": 1.2282e-05, "loss": 0.4517, "step": 89500 }, { "epoch": 3.15, "learning_rate": 1.2276444444444446e-05, "loss": 0.476, "step": 89550 }, { "epoch": 3.15, "learning_rate": 1.2270888888888889e-05, "loss": 0.4694, "step": 89600 }, { "epoch": 3.16, "learning_rate": 1.2265333333333334e-05, "loss": 0.4644, "step": 89650 }, { "epoch": 3.16, "learning_rate": 1.225977777777778e-05, "loss": 0.4456, "step": 89700 }, { "epoch": 3.16, "learning_rate": 1.2254222222222223e-05, "loss": 0.4485, "step": 89750 }, { "epoch": 3.16, "learning_rate": 1.2248666666666668e-05, "loss": 0.4441, "step": 89800 }, { "epoch": 3.16, "learning_rate": 1.2243111111111112e-05, "loss": 0.4653, "step": 89850 }, { "epoch": 3.17, "learning_rate": 1.2237555555555556e-05, "loss": 0.4612, "step": 89900 }, { "epoch": 3.17, "learning_rate": 1.2232000000000002e-05, "loss": 0.4813, "step": 89950 }, { "epoch": 3.17, "learning_rate": 1.2226444444444446e-05, "loss": 0.4328, "step": 90000 }, { "epoch": 3.17, "eval_loss": 0.28234174847602844, "eval_runtime": 40.4271, "eval_samples_per_second": 35.125, "eval_steps_per_second": 2.201, "eval_wer": 0.20704365979849323, "step": 90000 }, { "epoch": 3.17, "learning_rate": 1.222088888888889e-05, "loss": 0.479, "step": 90050 }, { "epoch": 3.17, "learning_rate": 1.2215333333333335e-05, "loss": 0.4662, "step": 90100 }, { "epoch": 3.17, "learning_rate": 1.2209777777777778e-05, "loss": 0.4389, "step": 90150 }, { "epoch": 3.18, "learning_rate": 1.2204222222222224e-05, "loss": 0.467, "step": 90200 }, { "epoch": 3.18, "learning_rate": 1.2198666666666667e-05, "loss": 0.4652, "step": 90250 }, { "epoch": 3.18, "learning_rate": 1.219311111111111e-05, "loss": 0.4457, "step": 90300 }, { "epoch": 3.18, "learning_rate": 1.2187555555555558e-05, "loss": 0.8314, "step": 90350 }, { "epoch": 3.18, "learning_rate": 1.2182000000000001e-05, "loss": 0.452, "step": 90400 }, { "epoch": 3.18, "learning_rate": 1.2176444444444447e-05, "loss": 0.4832, "step": 90450 }, { "epoch": 3.19, "learning_rate": 1.217088888888889e-05, "loss": 0.4486, "step": 90500 }, { "epoch": 3.19, "learning_rate": 1.2165333333333334e-05, "loss": 0.4692, "step": 90550 }, { "epoch": 3.19, "learning_rate": 1.2159777777777779e-05, "loss": 0.4664, "step": 90600 }, { "epoch": 3.19, "learning_rate": 1.2154222222222222e-05, "loss": 0.4481, "step": 90650 }, { "epoch": 3.19, "learning_rate": 1.214866666666667e-05, "loss": 0.4999, "step": 90700 }, { "epoch": 3.2, "learning_rate": 1.2143111111111113e-05, "loss": 0.4351, "step": 90750 }, { "epoch": 3.2, "learning_rate": 1.2137555555555557e-05, "loss": 0.4391, "step": 90800 }, { "epoch": 3.2, "learning_rate": 1.2132000000000002e-05, "loss": 0.4689, "step": 90850 }, { "epoch": 3.2, "learning_rate": 1.2126444444444445e-05, "loss": 0.4652, "step": 90900 }, { "epoch": 3.2, "learning_rate": 1.212088888888889e-05, "loss": 0.4621, "step": 90950 }, { "epoch": 3.2, "learning_rate": 1.2115333333333334e-05, "loss": 0.4382, "step": 91000 }, { "epoch": 3.21, "learning_rate": 1.2109777777777778e-05, "loss": 0.5006, "step": 91050 }, { "epoch": 3.21, "learning_rate": 1.2104222222222225e-05, "loss": 0.5159, "step": 91100 }, { "epoch": 3.21, "learning_rate": 1.2098666666666668e-05, "loss": 0.5437, "step": 91150 }, { "epoch": 3.21, "learning_rate": 1.2093111111111112e-05, "loss": 0.5102, "step": 91200 }, { "epoch": 3.21, "learning_rate": 1.2087555555555557e-05, "loss": 0.4441, "step": 91250 }, { "epoch": 3.21, "learning_rate": 1.2082e-05, "loss": 0.486, "step": 91300 }, { "epoch": 3.22, "learning_rate": 1.2076444444444446e-05, "loss": 0.4513, "step": 91350 }, { "epoch": 3.22, "learning_rate": 1.207088888888889e-05, "loss": 0.4512, "step": 91400 }, { "epoch": 3.22, "learning_rate": 1.2065333333333333e-05, "loss": 0.4618, "step": 91450 }, { "epoch": 3.22, "learning_rate": 1.205977777777778e-05, "loss": 0.4563, "step": 91500 }, { "epoch": 3.22, "learning_rate": 1.2054222222222223e-05, "loss": 0.463, "step": 91550 }, { "epoch": 3.23, "learning_rate": 1.2048666666666669e-05, "loss": 0.4343, "step": 91600 }, { "epoch": 3.23, "learning_rate": 1.2043111111111112e-05, "loss": 0.4804, "step": 91650 }, { "epoch": 3.23, "learning_rate": 1.2037555555555556e-05, "loss": 0.5541, "step": 91700 }, { "epoch": 3.23, "learning_rate": 1.2032000000000001e-05, "loss": 0.4487, "step": 91750 }, { "epoch": 3.23, "learning_rate": 1.2026444444444445e-05, "loss": 0.4579, "step": 91800 }, { "epoch": 3.23, "learning_rate": 1.2020888888888892e-05, "loss": 0.4567, "step": 91850 }, { "epoch": 3.24, "learning_rate": 1.2015333333333335e-05, "loss": 0.4628, "step": 91900 }, { "epoch": 3.24, "learning_rate": 1.2009777777777779e-05, "loss": 0.4574, "step": 91950 }, { "epoch": 3.24, "learning_rate": 1.2004222222222224e-05, "loss": 0.4445, "step": 92000 }, { "epoch": 3.24, "learning_rate": 1.1998666666666667e-05, "loss": 0.5173, "step": 92050 }, { "epoch": 3.24, "learning_rate": 1.1993111111111113e-05, "loss": 0.4681, "step": 92100 }, { "epoch": 3.24, "learning_rate": 1.1987555555555556e-05, "loss": 0.4461, "step": 92150 }, { "epoch": 3.25, "learning_rate": 1.1982e-05, "loss": 0.4567, "step": 92200 }, { "epoch": 3.25, "learning_rate": 1.1976444444444447e-05, "loss": 0.4566, "step": 92250 }, { "epoch": 3.25, "learning_rate": 1.197088888888889e-05, "loss": 0.4324, "step": 92300 }, { "epoch": 3.25, "learning_rate": 1.1965333333333334e-05, "loss": 0.4596, "step": 92350 }, { "epoch": 3.25, "learning_rate": 1.1959777777777779e-05, "loss": 0.4426, "step": 92400 }, { "epoch": 3.26, "learning_rate": 1.1954222222222223e-05, "loss": 0.4613, "step": 92450 }, { "epoch": 3.26, "learning_rate": 1.1948666666666668e-05, "loss": 0.4399, "step": 92500 }, { "epoch": 3.26, "eval_loss": 0.2802058160305023, "eval_runtime": 39.1528, "eval_samples_per_second": 36.268, "eval_steps_per_second": 2.273, "eval_wer": 0.2057728964327857, "step": 92500 }, { "epoch": 3.26, "learning_rate": 1.1943111111111111e-05, "loss": 0.483, "step": 92550 }, { "epoch": 3.26, "learning_rate": 1.1937555555555555e-05, "loss": 0.4663, "step": 92600 }, { "epoch": 3.26, "learning_rate": 1.1932000000000002e-05, "loss": 0.4367, "step": 92650 }, { "epoch": 3.26, "learning_rate": 1.1926444444444446e-05, "loss": 0.46, "step": 92700 }, { "epoch": 3.27, "learning_rate": 1.192088888888889e-05, "loss": 0.441, "step": 92750 }, { "epoch": 3.27, "learning_rate": 1.1915333333333334e-05, "loss": 0.4935, "step": 92800 }, { "epoch": 3.27, "learning_rate": 1.1909777777777778e-05, "loss": 0.4729, "step": 92850 }, { "epoch": 3.27, "learning_rate": 1.1904222222222223e-05, "loss": 0.5525, "step": 92900 }, { "epoch": 3.27, "learning_rate": 1.1898666666666667e-05, "loss": 0.453, "step": 92950 }, { "epoch": 3.27, "learning_rate": 1.1893111111111114e-05, "loss": 0.4847, "step": 93000 }, { "epoch": 3.28, "learning_rate": 1.1887555555555557e-05, "loss": 0.4559, "step": 93050 }, { "epoch": 3.28, "learning_rate": 1.1882e-05, "loss": 0.4839, "step": 93100 }, { "epoch": 3.28, "learning_rate": 1.1876444444444446e-05, "loss": 0.4634, "step": 93150 }, { "epoch": 3.28, "learning_rate": 1.187088888888889e-05, "loss": 0.5046, "step": 93200 }, { "epoch": 3.28, "learning_rate": 1.1865333333333335e-05, "loss": 0.4928, "step": 93250 }, { "epoch": 3.28, "learning_rate": 1.1859777777777778e-05, "loss": 0.4844, "step": 93300 }, { "epoch": 3.29, "learning_rate": 1.1854222222222222e-05, "loss": 0.4674, "step": 93350 }, { "epoch": 3.29, "learning_rate": 1.1848666666666669e-05, "loss": 0.4289, "step": 93400 }, { "epoch": 3.29, "learning_rate": 1.1843111111111112e-05, "loss": 0.4458, "step": 93450 }, { "epoch": 3.29, "learning_rate": 1.1837555555555556e-05, "loss": 0.4868, "step": 93500 }, { "epoch": 3.29, "learning_rate": 1.1832000000000001e-05, "loss": 0.4585, "step": 93550 }, { "epoch": 3.3, "learning_rate": 1.1826444444444445e-05, "loss": 0.4786, "step": 93600 }, { "epoch": 3.3, "learning_rate": 1.182088888888889e-05, "loss": 0.45, "step": 93650 }, { "epoch": 3.3, "learning_rate": 1.1815333333333334e-05, "loss": 0.4725, "step": 93700 }, { "epoch": 3.3, "learning_rate": 1.1809777777777777e-05, "loss": 0.5266, "step": 93750 }, { "epoch": 3.3, "learning_rate": 1.1804222222222224e-05, "loss": 0.4718, "step": 93800 }, { "epoch": 3.3, "learning_rate": 1.1798666666666668e-05, "loss": 0.4529, "step": 93850 }, { "epoch": 3.31, "learning_rate": 1.1793111111111113e-05, "loss": 0.4406, "step": 93900 }, { "epoch": 3.31, "learning_rate": 1.1787555555555556e-05, "loss": 0.4486, "step": 93950 }, { "epoch": 3.31, "learning_rate": 1.1782e-05, "loss": 0.4564, "step": 94000 }, { "epoch": 3.31, "learning_rate": 1.1776444444444445e-05, "loss": 0.4583, "step": 94050 }, { "epoch": 3.31, "learning_rate": 1.1770888888888889e-05, "loss": 0.442, "step": 94100 }, { "epoch": 3.31, "learning_rate": 1.1765333333333336e-05, "loss": 0.4438, "step": 94150 }, { "epoch": 3.32, "learning_rate": 1.175977777777778e-05, "loss": 0.4548, "step": 94200 }, { "epoch": 3.32, "learning_rate": 1.1754222222222223e-05, "loss": 0.5067, "step": 94250 }, { "epoch": 3.32, "learning_rate": 1.1748666666666668e-05, "loss": 0.4432, "step": 94300 }, { "epoch": 3.32, "learning_rate": 1.1743111111111112e-05, "loss": 0.4445, "step": 94350 }, { "epoch": 3.32, "learning_rate": 1.1737555555555557e-05, "loss": 0.4557, "step": 94400 }, { "epoch": 3.33, "learning_rate": 1.1732e-05, "loss": 0.4297, "step": 94450 }, { "epoch": 3.33, "learning_rate": 1.1726444444444444e-05, "loss": 0.4359, "step": 94500 }, { "epoch": 3.33, "learning_rate": 1.1720888888888891e-05, "loss": 0.4677, "step": 94550 }, { "epoch": 3.33, "learning_rate": 1.1715333333333335e-05, "loss": 0.4629, "step": 94600 }, { "epoch": 3.33, "learning_rate": 1.1709777777777778e-05, "loss": 0.479, "step": 94650 }, { "epoch": 3.33, "learning_rate": 1.1704222222222223e-05, "loss": 0.4528, "step": 94700 }, { "epoch": 3.34, "learning_rate": 1.1698666666666667e-05, "loss": 0.4502, "step": 94750 }, { "epoch": 3.34, "learning_rate": 1.1693111111111112e-05, "loss": 0.4279, "step": 94800 }, { "epoch": 3.34, "learning_rate": 1.1687555555555556e-05, "loss": 0.4528, "step": 94850 }, { "epoch": 3.34, "learning_rate": 1.1682e-05, "loss": 0.4642, "step": 94900 }, { "epoch": 3.34, "learning_rate": 1.1676444444444446e-05, "loss": 0.4557, "step": 94950 }, { "epoch": 3.34, "learning_rate": 1.167088888888889e-05, "loss": 0.4788, "step": 95000 }, { "epoch": 3.34, "eval_loss": 0.2741318345069885, "eval_runtime": 18.4914, "eval_samples_per_second": 76.793, "eval_steps_per_second": 4.813, "eval_wer": 0.20840519197603705, "step": 95000 }, { "epoch": 3.35, "learning_rate": 1.1665333333333335e-05, "loss": 0.4481, "step": 95050 }, { "epoch": 3.35, "learning_rate": 1.1659777777777779e-05, "loss": 0.4757, "step": 95100 }, { "epoch": 3.35, "learning_rate": 1.1654222222222222e-05, "loss": 0.532, "step": 95150 }, { "epoch": 3.35, "learning_rate": 1.1648666666666667e-05, "loss": 0.4371, "step": 95200 }, { "epoch": 3.35, "learning_rate": 1.1643111111111111e-05, "loss": 0.4492, "step": 95250 }, { "epoch": 3.36, "learning_rate": 1.1637555555555558e-05, "loss": 0.4517, "step": 95300 }, { "epoch": 3.36, "learning_rate": 1.1632000000000001e-05, "loss": 0.4459, "step": 95350 }, { "epoch": 3.36, "learning_rate": 1.1626444444444445e-05, "loss": 0.489, "step": 95400 }, { "epoch": 3.36, "learning_rate": 1.162088888888889e-05, "loss": 0.4852, "step": 95450 }, { "epoch": 3.36, "learning_rate": 1.1615333333333334e-05, "loss": 0.4342, "step": 95500 }, { "epoch": 3.36, "learning_rate": 1.1609777777777779e-05, "loss": 0.4422, "step": 95550 }, { "epoch": 3.37, "learning_rate": 1.1604222222222223e-05, "loss": 0.4299, "step": 95600 }, { "epoch": 3.37, "learning_rate": 1.1598666666666666e-05, "loss": 0.4616, "step": 95650 }, { "epoch": 3.37, "learning_rate": 1.1593111111111113e-05, "loss": 0.4277, "step": 95700 }, { "epoch": 3.37, "learning_rate": 1.1587666666666667e-05, "loss": 0.4512, "step": 95750 }, { "epoch": 3.37, "learning_rate": 1.1582111111111111e-05, "loss": 0.4357, "step": 95800 }, { "epoch": 3.37, "learning_rate": 1.1576555555555558e-05, "loss": 0.4301, "step": 95850 }, { "epoch": 3.38, "learning_rate": 1.1571000000000002e-05, "loss": 0.4509, "step": 95900 }, { "epoch": 3.38, "learning_rate": 1.1565444444444445e-05, "loss": 0.448, "step": 95950 }, { "epoch": 3.38, "learning_rate": 1.155988888888889e-05, "loss": 0.4908, "step": 96000 }, { "epoch": 3.38, "learning_rate": 1.1554333333333334e-05, "loss": 0.4401, "step": 96050 }, { "epoch": 3.38, "learning_rate": 1.1548777777777777e-05, "loss": 0.5636, "step": 96100 }, { "epoch": 3.39, "learning_rate": 1.1543222222222223e-05, "loss": 0.4918, "step": 96150 }, { "epoch": 3.39, "learning_rate": 1.1537666666666666e-05, "loss": 0.4364, "step": 96200 }, { "epoch": 3.39, "learning_rate": 1.1532111111111113e-05, "loss": 0.4424, "step": 96250 }, { "epoch": 3.39, "learning_rate": 1.1526555555555557e-05, "loss": 0.4185, "step": 96300 }, { "epoch": 3.39, "learning_rate": 1.1521e-05, "loss": 0.4677, "step": 96350 }, { "epoch": 3.39, "learning_rate": 1.1515444444444446e-05, "loss": 0.4423, "step": 96400 }, { "epoch": 3.4, "learning_rate": 1.1509888888888889e-05, "loss": 0.4513, "step": 96450 }, { "epoch": 3.4, "learning_rate": 1.1504333333333334e-05, "loss": 0.4423, "step": 96500 }, { "epoch": 3.4, "learning_rate": 1.1498777777777778e-05, "loss": 0.4579, "step": 96550 }, { "epoch": 3.4, "learning_rate": 1.1493222222222221e-05, "loss": 0.4877, "step": 96600 }, { "epoch": 3.4, "learning_rate": 1.1487666666666668e-05, "loss": 0.4173, "step": 96650 }, { "epoch": 3.4, "learning_rate": 1.1482111111111112e-05, "loss": 0.4364, "step": 96700 }, { "epoch": 3.41, "learning_rate": 1.1476555555555557e-05, "loss": 0.5784, "step": 96750 }, { "epoch": 3.41, "learning_rate": 1.1471e-05, "loss": 0.4639, "step": 96800 }, { "epoch": 3.41, "learning_rate": 1.1465444444444444e-05, "loss": 0.4447, "step": 96850 }, { "epoch": 3.41, "learning_rate": 1.145988888888889e-05, "loss": 0.4352, "step": 96900 }, { "epoch": 3.41, "learning_rate": 1.1454333333333333e-05, "loss": 0.4634, "step": 96950 }, { "epoch": 3.42, "learning_rate": 1.144877777777778e-05, "loss": 0.4469, "step": 97000 }, { "epoch": 3.42, "learning_rate": 1.1443222222222224e-05, "loss": 0.5037, "step": 97050 }, { "epoch": 3.42, "learning_rate": 1.1437666666666667e-05, "loss": 0.464, "step": 97100 }, { "epoch": 3.42, "learning_rate": 1.1432111111111112e-05, "loss": 0.4156, "step": 97150 }, { "epoch": 3.42, "learning_rate": 1.1426555555555556e-05, "loss": 0.4243, "step": 97200 }, { "epoch": 3.42, "learning_rate": 1.1421e-05, "loss": 0.4395, "step": 97250 }, { "epoch": 3.43, "learning_rate": 1.1415444444444445e-05, "loss": 0.4255, "step": 97300 }, { "epoch": 3.43, "learning_rate": 1.140988888888889e-05, "loss": 0.4609, "step": 97350 }, { "epoch": 3.43, "learning_rate": 1.1404333333333335e-05, "loss": 0.4392, "step": 97400 }, { "epoch": 3.43, "learning_rate": 1.1398777777777779e-05, "loss": 0.4451, "step": 97450 }, { "epoch": 3.43, "learning_rate": 1.1393222222222222e-05, "loss": 0.4621, "step": 97500 }, { "epoch": 3.43, "eval_loss": 0.2817385494709015, "eval_runtime": 38.8812, "eval_samples_per_second": 36.522, "eval_steps_per_second": 2.289, "eval_wer": 0.20377598257238813, "step": 97500 }, { "epoch": 3.43, "learning_rate": 1.1387666666666668e-05, "loss": 0.4464, "step": 97550 }, { "epoch": 3.44, "learning_rate": 1.1382111111111111e-05, "loss": 0.47, "step": 97600 }, { "epoch": 3.44, "learning_rate": 1.1376555555555558e-05, "loss": 0.4815, "step": 97650 }, { "epoch": 3.44, "learning_rate": 1.1371000000000002e-05, "loss": 0.4546, "step": 97700 }, { "epoch": 3.44, "learning_rate": 1.1365444444444445e-05, "loss": 0.489, "step": 97750 }, { "epoch": 3.44, "learning_rate": 1.135988888888889e-05, "loss": 0.4439, "step": 97800 }, { "epoch": 3.45, "learning_rate": 1.1354333333333334e-05, "loss": 0.4385, "step": 97850 }, { "epoch": 3.45, "learning_rate": 1.134877777777778e-05, "loss": 0.4341, "step": 97900 }, { "epoch": 3.45, "learning_rate": 1.1343222222222223e-05, "loss": 0.428, "step": 97950 }, { "epoch": 3.45, "learning_rate": 1.1337666666666666e-05, "loss": 0.4736, "step": 98000 }, { "epoch": 3.45, "learning_rate": 1.1332111111111113e-05, "loss": 0.4526, "step": 98050 }, { "epoch": 3.45, "learning_rate": 1.1326555555555557e-05, "loss": 0.437, "step": 98100 }, { "epoch": 3.46, "learning_rate": 1.1321000000000002e-05, "loss": 0.4374, "step": 98150 }, { "epoch": 3.46, "learning_rate": 1.1315444444444446e-05, "loss": 0.4566, "step": 98200 }, { "epoch": 3.46, "learning_rate": 1.131e-05, "loss": 0.7112, "step": 98250 }, { "epoch": 3.46, "learning_rate": 1.1304444444444445e-05, "loss": 0.4699, "step": 98300 }, { "epoch": 3.46, "learning_rate": 1.129888888888889e-05, "loss": 0.4354, "step": 98350 }, { "epoch": 3.46, "learning_rate": 1.1293333333333334e-05, "loss": 0.4285, "step": 98400 }, { "epoch": 3.47, "learning_rate": 1.128777777777778e-05, "loss": 0.4407, "step": 98450 }, { "epoch": 3.47, "learning_rate": 1.1282222222222223e-05, "loss": 0.4475, "step": 98500 }, { "epoch": 3.47, "learning_rate": 1.1276666666666667e-05, "loss": 0.4929, "step": 98550 }, { "epoch": 3.47, "learning_rate": 1.1271111111111113e-05, "loss": 0.4671, "step": 98600 }, { "epoch": 3.47, "learning_rate": 1.1265555555555557e-05, "loss": 0.4496, "step": 98650 }, { "epoch": 3.48, "learning_rate": 1.126e-05, "loss": 0.4265, "step": 98700 }, { "epoch": 3.48, "learning_rate": 1.1254444444444446e-05, "loss": 0.4526, "step": 98750 }, { "epoch": 3.48, "learning_rate": 1.124888888888889e-05, "loss": 0.4428, "step": 98800 }, { "epoch": 3.48, "learning_rate": 1.1243333333333335e-05, "loss": 0.4741, "step": 98850 }, { "epoch": 3.48, "learning_rate": 1.1237777777777778e-05, "loss": 0.4947, "step": 98900 }, { "epoch": 3.48, "learning_rate": 1.1232222222222222e-05, "loss": 0.4472, "step": 98950 }, { "epoch": 3.49, "learning_rate": 1.1226666666666669e-05, "loss": 0.4651, "step": 99000 }, { "epoch": 3.49, "learning_rate": 1.1221111111111112e-05, "loss": 0.4511, "step": 99050 }, { "epoch": 3.49, "learning_rate": 1.1215555555555558e-05, "loss": 0.455, "step": 99100 }, { "epoch": 3.49, "learning_rate": 1.1210000000000001e-05, "loss": 0.4677, "step": 99150 }, { "epoch": 3.49, "learning_rate": 1.1204444444444445e-05, "loss": 0.4331, "step": 99200 }, { "epoch": 3.49, "learning_rate": 1.119888888888889e-05, "loss": 0.4653, "step": 99250 }, { "epoch": 3.5, "learning_rate": 1.1193333333333333e-05, "loss": 0.4581, "step": 99300 }, { "epoch": 3.5, "learning_rate": 1.118777777777778e-05, "loss": 0.4894, "step": 99350 }, { "epoch": 3.5, "learning_rate": 1.1182222222222224e-05, "loss": 0.4667, "step": 99400 }, { "epoch": 3.5, "learning_rate": 1.1176666666666668e-05, "loss": 0.425, "step": 99450 }, { "epoch": 3.5, "learning_rate": 1.1171111111111113e-05, "loss": 0.454, "step": 99500 }, { "epoch": 3.51, "learning_rate": 1.1165555555555556e-05, "loss": 0.4352, "step": 99550 }, { "epoch": 3.51, "learning_rate": 1.1160000000000002e-05, "loss": 0.4814, "step": 99600 }, { "epoch": 3.51, "learning_rate": 1.1154444444444445e-05, "loss": 0.444, "step": 99650 }, { "epoch": 3.51, "learning_rate": 1.1148888888888889e-05, "loss": 0.461, "step": 99700 }, { "epoch": 3.51, "learning_rate": 1.1143333333333336e-05, "loss": 0.438, "step": 99750 }, { "epoch": 3.51, "learning_rate": 1.113777777777778e-05, "loss": 0.4307, "step": 99800 }, { "epoch": 3.52, "learning_rate": 1.1132222222222223e-05, "loss": 0.4267, "step": 99850 }, { "epoch": 3.52, "learning_rate": 1.1126666666666668e-05, "loss": 0.4471, "step": 99900 }, { "epoch": 3.52, "learning_rate": 1.1121111111111112e-05, "loss": 0.437, "step": 99950 }, { "epoch": 3.52, "learning_rate": 1.1115555555555557e-05, "loss": 0.523, "step": 100000 }, { "epoch": 3.52, "eval_loss": 0.2734874188899994, "eval_runtime": 23.7587, "eval_samples_per_second": 59.768, "eval_steps_per_second": 3.746, "eval_wer": 0.2015067622764818, "step": 100000 }, { "epoch": 3.52, "learning_rate": 1.111e-05, "loss": 0.4425, "step": 100050 }, { "epoch": 3.52, "learning_rate": 1.1104444444444444e-05, "loss": 0.5907, "step": 100100 }, { "epoch": 3.53, "learning_rate": 1.1098888888888891e-05, "loss": 0.4773, "step": 100150 }, { "epoch": 3.53, "learning_rate": 1.1093333333333334e-05, "loss": 0.449, "step": 100200 }, { "epoch": 3.53, "learning_rate": 1.108777777777778e-05, "loss": 0.471, "step": 100250 }, { "epoch": 3.53, "learning_rate": 1.1082222222222223e-05, "loss": 0.4276, "step": 100300 }, { "epoch": 3.53, "learning_rate": 1.1076666666666667e-05, "loss": 0.4976, "step": 100350 }, { "epoch": 3.53, "learning_rate": 1.1071111111111112e-05, "loss": 0.4428, "step": 100400 }, { "epoch": 3.54, "learning_rate": 1.1065666666666668e-05, "loss": 0.4837, "step": 100450 }, { "epoch": 3.54, "learning_rate": 1.1060111111111112e-05, "loss": 0.4538, "step": 100500 }, { "epoch": 3.54, "learning_rate": 1.1054555555555557e-05, "loss": 0.4185, "step": 100550 }, { "epoch": 3.54, "learning_rate": 1.1049e-05, "loss": 0.4813, "step": 100600 }, { "epoch": 3.54, "learning_rate": 1.1043444444444444e-05, "loss": 0.4508, "step": 100650 }, { "epoch": 3.55, "learning_rate": 1.1038e-05, "loss": 0.4866, "step": 100700 }, { "epoch": 3.55, "learning_rate": 1.1032444444444445e-05, "loss": 0.4645, "step": 100750 }, { "epoch": 3.55, "learning_rate": 1.1026888888888889e-05, "loss": 0.4645, "step": 100800 }, { "epoch": 3.55, "learning_rate": 1.1021333333333336e-05, "loss": 0.4523, "step": 100850 }, { "epoch": 3.55, "learning_rate": 1.101577777777778e-05, "loss": 0.4466, "step": 100900 }, { "epoch": 3.55, "learning_rate": 1.1010222222222223e-05, "loss": 0.489, "step": 100950 }, { "epoch": 3.56, "learning_rate": 1.1004666666666668e-05, "loss": 0.4386, "step": 101000 }, { "epoch": 3.56, "learning_rate": 1.0999111111111112e-05, "loss": 0.4912, "step": 101050 }, { "epoch": 3.56, "learning_rate": 1.0993555555555557e-05, "loss": 0.4324, "step": 101100 }, { "epoch": 3.56, "learning_rate": 1.0988e-05, "loss": 0.4622, "step": 101150 }, { "epoch": 3.56, "learning_rate": 1.0982444444444444e-05, "loss": 0.4603, "step": 101200 }, { "epoch": 3.56, "learning_rate": 1.0976888888888891e-05, "loss": 0.4164, "step": 101250 }, { "epoch": 3.57, "learning_rate": 1.0971333333333335e-05, "loss": 0.4127, "step": 101300 }, { "epoch": 3.57, "learning_rate": 1.096577777777778e-05, "loss": 0.4553, "step": 101350 }, { "epoch": 3.57, "learning_rate": 1.0960222222222223e-05, "loss": 0.4298, "step": 101400 }, { "epoch": 3.57, "learning_rate": 1.0954666666666667e-05, "loss": 0.4575, "step": 101450 }, { "epoch": 3.57, "learning_rate": 1.0949111111111112e-05, "loss": 0.4116, "step": 101500 }, { "epoch": 3.58, "learning_rate": 1.0943555555555556e-05, "loss": 0.4355, "step": 101550 }, { "epoch": 3.58, "learning_rate": 1.0938000000000003e-05, "loss": 0.48, "step": 101600 }, { "epoch": 3.58, "learning_rate": 1.0932444444444446e-05, "loss": 0.5111, "step": 101650 }, { "epoch": 3.58, "learning_rate": 1.092688888888889e-05, "loss": 0.4452, "step": 101700 }, { "epoch": 3.58, "learning_rate": 1.0921333333333335e-05, "loss": 0.4585, "step": 101750 }, { "epoch": 3.58, "learning_rate": 1.0915777777777779e-05, "loss": 0.4156, "step": 101800 }, { "epoch": 3.59, "learning_rate": 1.0910222222222222e-05, "loss": 0.4756, "step": 101850 }, { "epoch": 3.59, "learning_rate": 1.0904666666666667e-05, "loss": 0.4457, "step": 101900 }, { "epoch": 3.59, "learning_rate": 1.0899111111111111e-05, "loss": 0.427, "step": 101950 }, { "epoch": 3.59, "learning_rate": 1.0893555555555558e-05, "loss": 0.4762, "step": 102000 }, { "epoch": 3.59, "learning_rate": 1.0888000000000001e-05, "loss": 0.4694, "step": 102050 }, { "epoch": 3.59, "learning_rate": 1.0882444444444445e-05, "loss": 0.4348, "step": 102100 }, { "epoch": 3.6, "learning_rate": 1.087688888888889e-05, "loss": 0.4455, "step": 102150 }, { "epoch": 3.6, "learning_rate": 1.0871333333333334e-05, "loss": 0.4408, "step": 102200 }, { "epoch": 3.6, "learning_rate": 1.0865777777777779e-05, "loss": 0.4628, "step": 102250 }, { "epoch": 3.6, "learning_rate": 1.0860222222222223e-05, "loss": 0.4388, "step": 102300 }, { "epoch": 3.6, "learning_rate": 1.0854666666666666e-05, "loss": 0.4233, "step": 102350 }, { "epoch": 3.61, "learning_rate": 1.0849111111111113e-05, "loss": 0.4413, "step": 102400 }, { "epoch": 3.61, "learning_rate": 1.0843555555555557e-05, "loss": 0.4433, "step": 102450 }, { "epoch": 3.61, "learning_rate": 1.0838000000000002e-05, "loss": 0.4689, "step": 102500 }, { "epoch": 3.61, "eval_loss": 0.26310908794403076, "eval_runtime": 20.0328, "eval_samples_per_second": 70.884, "eval_steps_per_second": 4.443, "eval_wer": 0.19950984841608424, "step": 102500 }, { "epoch": 3.61, "learning_rate": 1.0832444444444445e-05, "loss": 0.4561, "step": 102550 }, { "epoch": 3.61, "learning_rate": 1.0826888888888889e-05, "loss": 0.4636, "step": 102600 }, { "epoch": 3.61, "learning_rate": 1.0821333333333334e-05, "loss": 0.4222, "step": 102650 }, { "epoch": 3.62, "learning_rate": 1.0815777777777778e-05, "loss": 0.4553, "step": 102700 }, { "epoch": 3.62, "learning_rate": 1.0810222222222225e-05, "loss": 0.4163, "step": 102750 }, { "epoch": 3.62, "learning_rate": 1.0804666666666668e-05, "loss": 0.4422, "step": 102800 }, { "epoch": 3.62, "learning_rate": 1.0799111111111112e-05, "loss": 0.4602, "step": 102850 }, { "epoch": 3.62, "learning_rate": 1.0793555555555557e-05, "loss": 0.4411, "step": 102900 }, { "epoch": 3.62, "learning_rate": 1.0788e-05, "loss": 0.4348, "step": 102950 }, { "epoch": 3.63, "learning_rate": 1.0782444444444444e-05, "loss": 0.4254, "step": 103000 }, { "epoch": 3.63, "learning_rate": 1.077688888888889e-05, "loss": 0.4604, "step": 103050 }, { "epoch": 3.63, "learning_rate": 1.0771333333333333e-05, "loss": 0.5076, "step": 103100 }, { "epoch": 3.63, "learning_rate": 1.076577777777778e-05, "loss": 0.4382, "step": 103150 }, { "epoch": 3.63, "learning_rate": 1.0760222222222224e-05, "loss": 0.453, "step": 103200 }, { "epoch": 3.64, "learning_rate": 1.0754666666666667e-05, "loss": 0.4488, "step": 103250 }, { "epoch": 3.64, "learning_rate": 1.0749111111111112e-05, "loss": 0.4468, "step": 103300 }, { "epoch": 3.64, "learning_rate": 1.0743555555555556e-05, "loss": 0.4433, "step": 103350 }, { "epoch": 3.64, "learning_rate": 1.0738000000000001e-05, "loss": 0.4463, "step": 103400 }, { "epoch": 3.64, "learning_rate": 1.0732444444444445e-05, "loss": 0.4553, "step": 103450 }, { "epoch": 3.64, "learning_rate": 1.0726888888888888e-05, "loss": 0.444, "step": 103500 }, { "epoch": 3.65, "learning_rate": 1.0721333333333335e-05, "loss": 0.5977, "step": 103550 }, { "epoch": 3.65, "learning_rate": 1.0715777777777779e-05, "loss": 0.4463, "step": 103600 }, { "epoch": 3.65, "learning_rate": 1.0710222222222224e-05, "loss": 0.451, "step": 103650 }, { "epoch": 3.65, "learning_rate": 1.070477777777778e-05, "loss": 0.4431, "step": 103700 }, { "epoch": 3.65, "learning_rate": 1.0699222222222224e-05, "loss": 0.4413, "step": 103750 }, { "epoch": 3.65, "learning_rate": 1.0693666666666667e-05, "loss": 0.4566, "step": 103800 }, { "epoch": 3.66, "learning_rate": 1.0688111111111112e-05, "loss": 0.4555, "step": 103850 }, { "epoch": 3.66, "learning_rate": 1.0682555555555556e-05, "loss": 0.4408, "step": 103900 }, { "epoch": 3.66, "learning_rate": 1.0677000000000001e-05, "loss": 0.4401, "step": 103950 }, { "epoch": 3.66, "learning_rate": 1.0671444444444445e-05, "loss": 0.4622, "step": 104000 }, { "epoch": 3.66, "learning_rate": 1.0665888888888888e-05, "loss": 0.4987, "step": 104050 }, { "epoch": 3.67, "learning_rate": 1.0660333333333335e-05, "loss": 0.4389, "step": 104100 }, { "epoch": 3.67, "learning_rate": 1.0654777777777779e-05, "loss": 0.5163, "step": 104150 }, { "epoch": 3.67, "learning_rate": 1.0649222222222224e-05, "loss": 0.4436, "step": 104200 }, { "epoch": 3.67, "learning_rate": 1.0643666666666668e-05, "loss": 0.432, "step": 104250 }, { "epoch": 3.67, "learning_rate": 1.0638111111111111e-05, "loss": 0.4451, "step": 104300 }, { "epoch": 3.67, "learning_rate": 1.0632555555555557e-05, "loss": 0.5093, "step": 104350 }, { "epoch": 3.68, "learning_rate": 1.0627e-05, "loss": 0.5062, "step": 104400 }, { "epoch": 3.68, "learning_rate": 1.0621444444444444e-05, "loss": 0.4409, "step": 104450 }, { "epoch": 3.68, "learning_rate": 1.061588888888889e-05, "loss": 0.4394, "step": 104500 }, { "epoch": 3.68, "learning_rate": 1.0610333333333334e-05, "loss": 0.457, "step": 104550 }, { "epoch": 3.68, "learning_rate": 1.060477777777778e-05, "loss": 0.429, "step": 104600 }, { "epoch": 3.68, "learning_rate": 1.0599222222222223e-05, "loss": 0.4847, "step": 104650 }, { "epoch": 3.69, "learning_rate": 1.0593666666666666e-05, "loss": 0.4821, "step": 104700 }, { "epoch": 3.69, "learning_rate": 1.0588111111111112e-05, "loss": 0.5837, "step": 104750 }, { "epoch": 3.69, "learning_rate": 1.0582555555555555e-05, "loss": 0.4297, "step": 104800 }, { "epoch": 3.69, "learning_rate": 1.0577000000000002e-05, "loss": 0.4336, "step": 104850 }, { "epoch": 3.69, "learning_rate": 1.0571444444444446e-05, "loss": 0.4425, "step": 104900 }, { "epoch": 3.7, "learning_rate": 1.056588888888889e-05, "loss": 0.5026, "step": 104950 }, { "epoch": 3.7, "learning_rate": 1.0560333333333335e-05, "loss": 0.4502, "step": 105000 }, { "epoch": 3.7, "eval_loss": 0.26892954111099243, "eval_runtime": 11.8114, "eval_samples_per_second": 120.223, "eval_steps_per_second": 7.535, "eval_wer": 0.1986021602977217, "step": 105000 }, { "epoch": 3.7, "learning_rate": 1.0554777777777778e-05, "loss": 0.4145, "step": 105050 }, { "epoch": 3.7, "learning_rate": 1.0549222222222223e-05, "loss": 0.517, "step": 105100 }, { "epoch": 3.7, "learning_rate": 1.0543666666666667e-05, "loss": 0.4447, "step": 105150 }, { "epoch": 3.7, "learning_rate": 1.053811111111111e-05, "loss": 0.4763, "step": 105200 }, { "epoch": 3.71, "learning_rate": 1.0532555555555557e-05, "loss": 0.4459, "step": 105250 }, { "epoch": 3.71, "learning_rate": 1.0527000000000001e-05, "loss": 0.4048, "step": 105300 }, { "epoch": 3.71, "learning_rate": 1.0521444444444446e-05, "loss": 0.4451, "step": 105350 }, { "epoch": 3.71, "learning_rate": 1.051588888888889e-05, "loss": 0.4286, "step": 105400 }, { "epoch": 3.71, "learning_rate": 1.0510333333333333e-05, "loss": 0.5862, "step": 105450 }, { "epoch": 3.71, "learning_rate": 1.0504777777777779e-05, "loss": 0.4896, "step": 105500 }, { "epoch": 3.72, "learning_rate": 1.0499222222222222e-05, "loss": 0.4689, "step": 105550 }, { "epoch": 3.72, "learning_rate": 1.0493666666666666e-05, "loss": 0.457, "step": 105600 }, { "epoch": 3.72, "learning_rate": 1.0488111111111113e-05, "loss": 0.435, "step": 105650 }, { "epoch": 3.72, "learning_rate": 1.0482555555555556e-05, "loss": 0.464, "step": 105700 }, { "epoch": 3.72, "learning_rate": 1.0477000000000002e-05, "loss": 0.4425, "step": 105750 }, { "epoch": 3.73, "learning_rate": 1.0471444444444445e-05, "loss": 0.467, "step": 105800 }, { "epoch": 3.73, "learning_rate": 1.0465888888888889e-05, "loss": 0.4526, "step": 105850 }, { "epoch": 3.73, "learning_rate": 1.0460333333333334e-05, "loss": 0.4294, "step": 105900 }, { "epoch": 3.73, "learning_rate": 1.0454777777777777e-05, "loss": 0.4832, "step": 105950 }, { "epoch": 3.73, "learning_rate": 1.0449222222222224e-05, "loss": 0.429, "step": 106000 }, { "epoch": 3.73, "learning_rate": 1.0443666666666668e-05, "loss": 0.4243, "step": 106050 }, { "epoch": 3.74, "learning_rate": 1.0438111111111111e-05, "loss": 0.4574, "step": 106100 }, { "epoch": 3.74, "learning_rate": 1.0432555555555557e-05, "loss": 0.4708, "step": 106150 }, { "epoch": 3.74, "learning_rate": 1.0427e-05, "loss": 0.429, "step": 106200 }, { "epoch": 3.74, "learning_rate": 1.0421444444444446e-05, "loss": 0.4328, "step": 106250 }, { "epoch": 3.74, "learning_rate": 1.0415888888888889e-05, "loss": 0.4413, "step": 106300 }, { "epoch": 3.74, "learning_rate": 1.0410333333333333e-05, "loss": 0.4647, "step": 106350 }, { "epoch": 3.75, "learning_rate": 1.040477777777778e-05, "loss": 0.4467, "step": 106400 }, { "epoch": 3.75, "learning_rate": 1.0399222222222223e-05, "loss": 0.5032, "step": 106450 }, { "epoch": 3.75, "learning_rate": 1.0393666666666668e-05, "loss": 0.4493, "step": 106500 }, { "epoch": 3.75, "learning_rate": 1.0388111111111112e-05, "loss": 0.4196, "step": 106550 }, { "epoch": 3.75, "learning_rate": 1.0382555555555556e-05, "loss": 0.4268, "step": 106600 }, { "epoch": 3.76, "learning_rate": 1.0377e-05, "loss": 0.4263, "step": 106650 }, { "epoch": 3.76, "learning_rate": 1.0371444444444444e-05, "loss": 0.4322, "step": 106700 }, { "epoch": 3.76, "learning_rate": 1.0365888888888888e-05, "loss": 0.4482, "step": 106750 }, { "epoch": 3.76, "learning_rate": 1.0360333333333335e-05, "loss": 0.4906, "step": 106800 }, { "epoch": 3.76, "learning_rate": 1.0354777777777778e-05, "loss": 0.444, "step": 106850 }, { "epoch": 3.76, "learning_rate": 1.0349222222222224e-05, "loss": 0.4468, "step": 106900 }, { "epoch": 3.77, "learning_rate": 1.0343666666666667e-05, "loss": 0.419, "step": 106950 }, { "epoch": 3.77, "learning_rate": 1.033811111111111e-05, "loss": 0.4494, "step": 107000 }, { "epoch": 3.77, "learning_rate": 1.0332555555555556e-05, "loss": 0.4474, "step": 107050 }, { "epoch": 3.77, "learning_rate": 1.0327e-05, "loss": 0.4505, "step": 107100 }, { "epoch": 3.77, "learning_rate": 1.0321444444444446e-05, "loss": 0.4514, "step": 107150 }, { "epoch": 3.77, "learning_rate": 1.031588888888889e-05, "loss": 0.4227, "step": 107200 }, { "epoch": 3.78, "learning_rate": 1.0310333333333334e-05, "loss": 0.4431, "step": 107250 }, { "epoch": 3.78, "learning_rate": 1.0304777777777779e-05, "loss": 0.4387, "step": 107300 }, { "epoch": 3.78, "learning_rate": 1.0299222222222222e-05, "loss": 0.4715, "step": 107350 }, { "epoch": 3.78, "learning_rate": 1.0293666666666668e-05, "loss": 0.449, "step": 107400 }, { "epoch": 3.78, "learning_rate": 1.0288111111111111e-05, "loss": 0.4406, "step": 107450 }, { "epoch": 3.78, "learning_rate": 1.0282555555555555e-05, "loss": 0.4402, "step": 107500 }, { "epoch": 3.78, "eval_loss": 0.27264848351478577, "eval_runtime": 31.4516, "eval_samples_per_second": 45.149, "eval_steps_per_second": 2.83, "eval_wer": 0.19869292910955796, "step": 107500 }, { "epoch": 3.79, "learning_rate": 1.0277000000000002e-05, "loss": 0.4826, "step": 107550 }, { "epoch": 3.79, "learning_rate": 1.0271444444444445e-05, "loss": 0.4321, "step": 107600 }, { "epoch": 3.79, "learning_rate": 1.026588888888889e-05, "loss": 0.4663, "step": 107650 }, { "epoch": 3.79, "learning_rate": 1.0260333333333334e-05, "loss": 0.4341, "step": 107700 }, { "epoch": 3.79, "learning_rate": 1.0254777777777778e-05, "loss": 0.4133, "step": 107750 }, { "epoch": 3.8, "learning_rate": 1.0249222222222223e-05, "loss": 0.4423, "step": 107800 }, { "epoch": 3.8, "learning_rate": 1.0243666666666668e-05, "loss": 0.4111, "step": 107850 }, { "epoch": 3.8, "learning_rate": 1.0238111111111112e-05, "loss": 0.4412, "step": 107900 }, { "epoch": 3.8, "learning_rate": 1.0232555555555557e-05, "loss": 0.4105, "step": 107950 }, { "epoch": 3.8, "learning_rate": 1.0227e-05, "loss": 0.4345, "step": 108000 }, { "epoch": 3.8, "learning_rate": 1.0221444444444446e-05, "loss": 0.4216, "step": 108050 }, { "epoch": 3.81, "learning_rate": 1.021588888888889e-05, "loss": 0.4287, "step": 108100 }, { "epoch": 3.81, "learning_rate": 1.0210444444444445e-05, "loss": 0.5731, "step": 108150 }, { "epoch": 3.81, "learning_rate": 1.0204888888888889e-05, "loss": 0.4498, "step": 108200 }, { "epoch": 3.81, "learning_rate": 1.0199333333333334e-05, "loss": 0.4439, "step": 108250 }, { "epoch": 3.81, "learning_rate": 1.0193777777777778e-05, "loss": 0.4461, "step": 108300 }, { "epoch": 3.81, "learning_rate": 1.0188222222222223e-05, "loss": 0.4418, "step": 108350 }, { "epoch": 3.82, "learning_rate": 1.0182666666666667e-05, "loss": 0.478, "step": 108400 }, { "epoch": 3.82, "learning_rate": 1.0177111111111112e-05, "loss": 0.4202, "step": 108450 }, { "epoch": 3.82, "learning_rate": 1.0171555555555557e-05, "loss": 0.4754, "step": 108500 }, { "epoch": 3.82, "learning_rate": 1.0166e-05, "loss": 0.4216, "step": 108550 }, { "epoch": 3.82, "learning_rate": 1.0160444444444446e-05, "loss": 0.4475, "step": 108600 }, { "epoch": 3.83, "learning_rate": 1.015488888888889e-05, "loss": 0.4294, "step": 108650 }, { "epoch": 3.83, "learning_rate": 1.0149333333333333e-05, "loss": 0.4586, "step": 108700 }, { "epoch": 3.83, "learning_rate": 1.014377777777778e-05, "loss": 0.4344, "step": 108750 }, { "epoch": 3.83, "learning_rate": 1.0138222222222223e-05, "loss": 0.4761, "step": 108800 }, { "epoch": 3.83, "learning_rate": 1.0132666666666669e-05, "loss": 0.4285, "step": 108850 }, { "epoch": 3.83, "learning_rate": 1.0127111111111112e-05, "loss": 0.4649, "step": 108900 }, { "epoch": 3.84, "learning_rate": 1.0121555555555556e-05, "loss": 0.4415, "step": 108950 }, { "epoch": 3.84, "learning_rate": 1.0116000000000001e-05, "loss": 0.4144, "step": 109000 }, { "epoch": 3.84, "learning_rate": 1.0110444444444445e-05, "loss": 0.4389, "step": 109050 }, { "epoch": 3.84, "learning_rate": 1.0104888888888892e-05, "loss": 0.5292, "step": 109100 }, { "epoch": 3.84, "learning_rate": 1.0099333333333335e-05, "loss": 0.4279, "step": 109150 }, { "epoch": 3.84, "learning_rate": 1.0093777777777779e-05, "loss": 0.4596, "step": 109200 }, { "epoch": 3.85, "learning_rate": 1.0088222222222224e-05, "loss": 0.4773, "step": 109250 }, { "epoch": 3.85, "learning_rate": 1.0082666666666667e-05, "loss": 0.4377, "step": 109300 }, { "epoch": 3.85, "learning_rate": 1.0077111111111111e-05, "loss": 0.4601, "step": 109350 }, { "epoch": 3.85, "learning_rate": 1.0071666666666669e-05, "loss": 0.5526, "step": 109400 }, { "epoch": 3.85, "learning_rate": 1.0066111111111112e-05, "loss": 0.4266, "step": 109450 }, { "epoch": 3.86, "learning_rate": 1.0060555555555556e-05, "loss": 0.4785, "step": 109500 }, { "epoch": 3.86, "learning_rate": 1.0055000000000001e-05, "loss": 0.4616, "step": 109550 }, { "epoch": 3.86, "learning_rate": 1.0049444444444445e-05, "loss": 0.4658, "step": 109600 }, { "epoch": 3.86, "learning_rate": 1.0043888888888892e-05, "loss": 0.4833, "step": 109650 }, { "epoch": 3.86, "learning_rate": 1.0038333333333335e-05, "loss": 0.4537, "step": 109700 }, { "epoch": 3.86, "learning_rate": 1.0032777777777779e-05, "loss": 0.4547, "step": 109750 }, { "epoch": 3.87, "learning_rate": 1.0027222222222224e-05, "loss": 0.4198, "step": 109800 }, { "epoch": 3.87, "learning_rate": 1.0021666666666668e-05, "loss": 0.4491, "step": 109850 }, { "epoch": 3.87, "learning_rate": 1.0016111111111111e-05, "loss": 0.4576, "step": 109900 }, { "epoch": 3.87, "learning_rate": 1.0010555555555556e-05, "loss": 0.4215, "step": 109950 }, { "epoch": 3.87, "learning_rate": 1.0005e-05, "loss": 0.4189, "step": 110000 }, { "epoch": 3.87, "eval_loss": 0.27238038182258606, "eval_runtime": 41.2531, "eval_samples_per_second": 34.422, "eval_steps_per_second": 2.157, "eval_wer": 0.19941907960424798, "step": 110000 }, { "epoch": 3.87, "learning_rate": 9.999444444444445e-06, "loss": 0.4601, "step": 110050 }, { "epoch": 3.88, "learning_rate": 9.99388888888889e-06, "loss": 0.4764, "step": 110100 }, { "epoch": 3.88, "learning_rate": 9.988333333333334e-06, "loss": 0.4198, "step": 110150 }, { "epoch": 3.88, "learning_rate": 9.98277777777778e-06, "loss": 0.4227, "step": 110200 }, { "epoch": 3.88, "learning_rate": 9.977222222222223e-06, "loss": 0.4299, "step": 110250 }, { "epoch": 3.88, "learning_rate": 9.971666666666668e-06, "loss": 0.4144, "step": 110300 }, { "epoch": 3.89, "learning_rate": 9.966111111111112e-06, "loss": 0.4433, "step": 110350 }, { "epoch": 3.89, "learning_rate": 9.960555555555557e-06, "loss": 0.4175, "step": 110400 }, { "epoch": 3.89, "learning_rate": 9.955000000000002e-06, "loss": 0.4434, "step": 110450 }, { "epoch": 3.89, "learning_rate": 9.949444444444446e-06, "loss": 0.4167, "step": 110500 }, { "epoch": 3.89, "learning_rate": 9.94388888888889e-06, "loss": 0.4373, "step": 110550 }, { "epoch": 3.89, "learning_rate": 9.938333333333334e-06, "loss": 0.4668, "step": 110600 }, { "epoch": 3.9, "learning_rate": 9.93277777777778e-06, "loss": 0.4319, "step": 110650 }, { "epoch": 3.9, "learning_rate": 9.927222222222223e-06, "loss": 0.4541, "step": 110700 }, { "epoch": 3.9, "learning_rate": 9.921666666666667e-06, "loss": 0.435, "step": 110750 }, { "epoch": 3.9, "learning_rate": 9.916111111111112e-06, "loss": 0.4288, "step": 110800 }, { "epoch": 3.9, "learning_rate": 9.910555555555557e-06, "loss": 0.4791, "step": 110850 }, { "epoch": 3.9, "learning_rate": 9.905000000000001e-06, "loss": 0.4394, "step": 110900 }, { "epoch": 3.91, "learning_rate": 9.899444444444444e-06, "loss": 0.4358, "step": 110950 }, { "epoch": 3.91, "learning_rate": 9.89388888888889e-06, "loss": 0.4305, "step": 111000 }, { "epoch": 3.91, "learning_rate": 9.888333333333335e-06, "loss": 0.4632, "step": 111050 }, { "epoch": 3.91, "learning_rate": 9.882777777777778e-06, "loss": 0.4121, "step": 111100 }, { "epoch": 3.91, "learning_rate": 9.877222222222222e-06, "loss": 0.4203, "step": 111150 }, { "epoch": 3.92, "learning_rate": 9.871666666666667e-06, "loss": 0.4407, "step": 111200 }, { "epoch": 3.92, "learning_rate": 9.866111111111113e-06, "loss": 0.4261, "step": 111250 }, { "epoch": 3.92, "learning_rate": 9.860555555555556e-06, "loss": 0.4626, "step": 111300 }, { "epoch": 3.92, "learning_rate": 9.855000000000001e-06, "loss": 0.4856, "step": 111350 }, { "epoch": 3.92, "learning_rate": 9.849444444444445e-06, "loss": 0.4507, "step": 111400 }, { "epoch": 3.92, "learning_rate": 9.84388888888889e-06, "loss": 0.4469, "step": 111450 }, { "epoch": 3.93, "learning_rate": 9.838333333333334e-06, "loss": 0.4458, "step": 111500 }, { "epoch": 3.93, "learning_rate": 9.832777777777779e-06, "loss": 0.4198, "step": 111550 }, { "epoch": 3.93, "learning_rate": 9.827222222222224e-06, "loss": 0.4967, "step": 111600 }, { "epoch": 3.93, "learning_rate": 9.821666666666668e-06, "loss": 0.4686, "step": 111650 }, { "epoch": 3.93, "learning_rate": 9.816111111111111e-06, "loss": 0.4457, "step": 111700 }, { "epoch": 3.93, "learning_rate": 9.810555555555557e-06, "loss": 0.4014, "step": 111750 }, { "epoch": 3.94, "learning_rate": 9.805000000000002e-06, "loss": 0.4368, "step": 111800 }, { "epoch": 3.94, "learning_rate": 9.799444444444445e-06, "loss": 0.4404, "step": 111850 }, { "epoch": 3.94, "learning_rate": 9.793888888888889e-06, "loss": 0.4167, "step": 111900 }, { "epoch": 3.94, "learning_rate": 9.788444444444445e-06, "loss": 0.4256, "step": 111950 }, { "epoch": 3.94, "learning_rate": 9.78288888888889e-06, "loss": 0.4452, "step": 112000 }, { "epoch": 3.95, "learning_rate": 9.777333333333334e-06, "loss": 0.4503, "step": 112050 }, { "epoch": 3.95, "learning_rate": 9.771777777777779e-06, "loss": 0.4329, "step": 112100 }, { "epoch": 3.95, "learning_rate": 9.766222222222223e-06, "loss": 0.4453, "step": 112150 }, { "epoch": 3.95, "learning_rate": 9.760666666666668e-06, "loss": 0.4257, "step": 112200 }, { "epoch": 3.95, "learning_rate": 9.755111111111111e-06, "loss": 0.4625, "step": 112250 }, { "epoch": 3.95, "learning_rate": 9.749555555555557e-06, "loss": 0.4129, "step": 112300 }, { "epoch": 3.96, "learning_rate": 9.744000000000002e-06, "loss": 0.4264, "step": 112350 }, { "epoch": 3.96, "learning_rate": 9.738444444444445e-06, "loss": 0.436, "step": 112400 }, { "epoch": 3.96, "learning_rate": 9.732888888888889e-06, "loss": 0.4045, "step": 112450 }, { "epoch": 3.96, "learning_rate": 9.727333333333334e-06, "loss": 0.4526, "step": 112500 }, { "epoch": 3.96, "eval_loss": 0.25956958532333374, "eval_runtime": 24.255, "eval_samples_per_second": 58.545, "eval_steps_per_second": 3.669, "eval_wer": 0.19179449941000273, "step": 112500 }, { "epoch": 3.96, "learning_rate": 9.72177777777778e-06, "loss": 0.6924, "step": 112550 }, { "epoch": 3.96, "learning_rate": 9.716222222222223e-06, "loss": 0.4805, "step": 112600 }, { "epoch": 3.97, "learning_rate": 9.710666666666667e-06, "loss": 0.4556, "step": 112650 }, { "epoch": 3.97, "learning_rate": 9.705111111111112e-06, "loss": 0.4293, "step": 112700 }, { "epoch": 3.97, "learning_rate": 9.699555555555557e-06, "loss": 0.446, "step": 112750 }, { "epoch": 3.97, "learning_rate": 9.694e-06, "loss": 0.4481, "step": 112800 }, { "epoch": 3.97, "learning_rate": 9.688444444444444e-06, "loss": 0.4372, "step": 112850 }, { "epoch": 3.98, "learning_rate": 9.68288888888889e-06, "loss": 0.4325, "step": 112900 }, { "epoch": 3.98, "learning_rate": 9.677333333333335e-06, "loss": 0.5179, "step": 112950 }, { "epoch": 3.98, "learning_rate": 9.671777777777778e-06, "loss": 0.4439, "step": 113000 }, { "epoch": 3.98, "learning_rate": 9.666222222222224e-06, "loss": 0.4547, "step": 113050 }, { "epoch": 3.98, "learning_rate": 9.660666666666667e-06, "loss": 0.4431, "step": 113100 }, { "epoch": 3.98, "learning_rate": 9.655111111111112e-06, "loss": 0.4366, "step": 113150 }, { "epoch": 3.99, "learning_rate": 9.649555555555556e-06, "loss": 0.5674, "step": 113200 }, { "epoch": 3.99, "learning_rate": 9.644000000000001e-06, "loss": 0.4573, "step": 113250 }, { "epoch": 3.99, "learning_rate": 9.638444444444445e-06, "loss": 0.4808, "step": 113300 }, { "epoch": 3.99, "learning_rate": 9.63288888888889e-06, "loss": 0.4201, "step": 113350 }, { "epoch": 3.99, "learning_rate": 9.627333333333334e-06, "loss": 0.4213, "step": 113400 }, { "epoch": 3.99, "learning_rate": 9.621777777777779e-06, "loss": 0.5612, "step": 113450 }, { "epoch": 4.0, "learning_rate": 9.616222222222224e-06, "loss": 0.4184, "step": 113500 }, { "epoch": 4.0, "learning_rate": 9.610666666666668e-06, "loss": 0.4402, "step": 113550 }, { "epoch": 4.0, "learning_rate": 9.605111111111111e-06, "loss": 0.5676, "step": 113600 }, { "epoch": 4.0, "learning_rate": 9.599555555555556e-06, "loss": 0.4413, "step": 113650 }, { "epoch": 4.0, "learning_rate": 9.594000000000002e-06, "loss": 0.4353, "step": 113700 }, { "epoch": 4.0, "learning_rate": 9.588444444444445e-06, "loss": 0.428, "step": 113750 }, { "epoch": 4.01, "learning_rate": 9.582888888888889e-06, "loss": 0.432, "step": 113800 }, { "epoch": 4.01, "learning_rate": 9.577333333333334e-06, "loss": 0.4249, "step": 113850 }, { "epoch": 4.01, "learning_rate": 9.57177777777778e-06, "loss": 0.4319, "step": 113900 }, { "epoch": 4.01, "learning_rate": 9.566222222222223e-06, "loss": 0.4262, "step": 113950 }, { "epoch": 4.01, "learning_rate": 9.560666666666666e-06, "loss": 0.4444, "step": 114000 }, { "epoch": 4.02, "learning_rate": 9.555111111111112e-06, "loss": 0.4353, "step": 114050 }, { "epoch": 4.02, "learning_rate": 9.549555555555557e-06, "loss": 0.4248, "step": 114100 }, { "epoch": 4.02, "learning_rate": 9.544e-06, "loss": 0.4213, "step": 114150 }, { "epoch": 4.02, "learning_rate": 9.538444444444446e-06, "loss": 0.4387, "step": 114200 }, { "epoch": 4.02, "learning_rate": 9.53288888888889e-06, "loss": 0.4388, "step": 114250 }, { "epoch": 4.02, "learning_rate": 9.527333333333334e-06, "loss": 0.4327, "step": 114300 }, { "epoch": 4.03, "learning_rate": 9.521777777777778e-06, "loss": 0.4367, "step": 114350 }, { "epoch": 4.03, "learning_rate": 9.516222222222223e-06, "loss": 0.4418, "step": 114400 }, { "epoch": 4.03, "learning_rate": 9.510666666666667e-06, "loss": 0.4205, "step": 114450 }, { "epoch": 4.03, "learning_rate": 9.505111111111112e-06, "loss": 0.4249, "step": 114500 }, { "epoch": 4.03, "learning_rate": 9.499555555555556e-06, "loss": 0.4448, "step": 114550 }, { "epoch": 4.03, "learning_rate": 9.494000000000001e-06, "loss": 0.4253, "step": 114600 }, { "epoch": 4.04, "learning_rate": 9.488444444444446e-06, "loss": 0.4156, "step": 114650 }, { "epoch": 4.04, "learning_rate": 9.48288888888889e-06, "loss": 0.4236, "step": 114700 }, { "epoch": 4.04, "learning_rate": 9.477333333333333e-06, "loss": 0.4381, "step": 114750 }, { "epoch": 4.04, "learning_rate": 9.471777777777779e-06, "loss": 0.4673, "step": 114800 }, { "epoch": 4.04, "learning_rate": 9.466222222222224e-06, "loss": 0.44, "step": 114850 }, { "epoch": 4.05, "learning_rate": 9.460666666666667e-06, "loss": 0.4183, "step": 114900 }, { "epoch": 4.05, "learning_rate": 9.455111111111111e-06, "loss": 0.4309, "step": 114950 }, { "epoch": 4.05, "learning_rate": 9.449555555555556e-06, "loss": 0.4755, "step": 115000 }, { "epoch": 4.05, "eval_loss": 0.258281409740448, "eval_runtime": 18.9345, "eval_samples_per_second": 74.996, "eval_steps_per_second": 4.7, "eval_wer": 0.18997912317327767, "step": 115000 }, { "epoch": 4.05, "learning_rate": 9.444000000000001e-06, "loss": 0.4251, "step": 115050 }, { "epoch": 4.05, "learning_rate": 9.438444444444445e-06, "loss": 0.4383, "step": 115100 }, { "epoch": 4.05, "learning_rate": 9.432888888888889e-06, "loss": 0.4304, "step": 115150 }, { "epoch": 4.06, "learning_rate": 9.427333333333334e-06, "loss": 0.4487, "step": 115200 }, { "epoch": 4.06, "learning_rate": 9.421777777777779e-06, "loss": 0.4276, "step": 115250 }, { "epoch": 4.06, "learning_rate": 9.416222222222223e-06, "loss": 0.4471, "step": 115300 }, { "epoch": 4.06, "learning_rate": 9.410666666666668e-06, "loss": 0.4368, "step": 115350 }, { "epoch": 4.06, "learning_rate": 9.405111111111111e-06, "loss": 0.43, "step": 115400 }, { "epoch": 4.06, "learning_rate": 9.399555555555557e-06, "loss": 0.4601, "step": 115450 }, { "epoch": 4.07, "learning_rate": 9.394e-06, "loss": 0.4203, "step": 115500 }, { "epoch": 4.07, "learning_rate": 9.388444444444445e-06, "loss": 0.4555, "step": 115550 }, { "epoch": 4.07, "learning_rate": 9.382888888888889e-06, "loss": 0.5295, "step": 115600 }, { "epoch": 4.07, "learning_rate": 9.377333333333334e-06, "loss": 0.4143, "step": 115650 }, { "epoch": 4.07, "learning_rate": 9.371777777777778e-06, "loss": 0.4206, "step": 115700 }, { "epoch": 4.08, "learning_rate": 9.366222222222223e-06, "loss": 0.4301, "step": 115750 }, { "epoch": 4.08, "learning_rate": 9.360666666666668e-06, "loss": 0.4565, "step": 115800 }, { "epoch": 4.08, "learning_rate": 9.355111111111112e-06, "loss": 0.4247, "step": 115850 }, { "epoch": 4.08, "learning_rate": 9.349555555555555e-06, "loss": 0.4238, "step": 115900 }, { "epoch": 4.08, "learning_rate": 9.344e-06, "loss": 0.4454, "step": 115950 }, { "epoch": 4.08, "learning_rate": 9.338444444444446e-06, "loss": 0.4674, "step": 116000 }, { "epoch": 4.09, "learning_rate": 9.33288888888889e-06, "loss": 0.4261, "step": 116050 }, { "epoch": 4.09, "learning_rate": 9.327333333333333e-06, "loss": 0.3913, "step": 116100 }, { "epoch": 4.09, "learning_rate": 9.321888888888889e-06, "loss": 0.4674, "step": 116150 }, { "epoch": 4.09, "learning_rate": 9.316333333333334e-06, "loss": 0.4377, "step": 116200 }, { "epoch": 4.09, "learning_rate": 9.310777777777778e-06, "loss": 0.4322, "step": 116250 }, { "epoch": 4.09, "learning_rate": 9.305222222222223e-06, "loss": 0.426, "step": 116300 }, { "epoch": 4.1, "learning_rate": 9.299666666666668e-06, "loss": 0.4402, "step": 116350 }, { "epoch": 4.1, "learning_rate": 9.294111111111112e-06, "loss": 0.4542, "step": 116400 }, { "epoch": 4.1, "learning_rate": 9.288555555555555e-06, "loss": 0.424, "step": 116450 }, { "epoch": 4.1, "learning_rate": 9.283e-06, "loss": 0.4426, "step": 116500 }, { "epoch": 4.1, "learning_rate": 9.277444444444446e-06, "loss": 0.4763, "step": 116550 }, { "epoch": 4.11, "learning_rate": 9.27188888888889e-06, "loss": 0.4433, "step": 116600 }, { "epoch": 4.11, "learning_rate": 9.266333333333333e-06, "loss": 0.4407, "step": 116650 }, { "epoch": 4.11, "learning_rate": 9.260777777777778e-06, "loss": 0.4103, "step": 116700 }, { "epoch": 4.11, "learning_rate": 9.255222222222224e-06, "loss": 0.4111, "step": 116750 }, { "epoch": 4.11, "learning_rate": 9.249666666666667e-06, "loss": 0.4128, "step": 116800 }, { "epoch": 4.11, "learning_rate": 9.24411111111111e-06, "loss": 0.4186, "step": 116850 }, { "epoch": 4.12, "learning_rate": 9.238555555555556e-06, "loss": 0.4351, "step": 116900 }, { "epoch": 4.12, "learning_rate": 9.233000000000001e-06, "loss": 0.4249, "step": 116950 }, { "epoch": 4.12, "learning_rate": 9.227444444444445e-06, "loss": 0.4947, "step": 117000 }, { "epoch": 4.12, "learning_rate": 9.221888888888888e-06, "loss": 0.4369, "step": 117050 }, { "epoch": 4.12, "learning_rate": 9.216333333333334e-06, "loss": 0.4118, "step": 117100 }, { "epoch": 4.12, "learning_rate": 9.210777777777779e-06, "loss": 0.4448, "step": 117150 }, { "epoch": 4.13, "learning_rate": 9.205222222222222e-06, "loss": 0.4371, "step": 117200 }, { "epoch": 4.13, "learning_rate": 9.199666666666668e-06, "loss": 0.4236, "step": 117250 }, { "epoch": 4.13, "learning_rate": 9.194111111111111e-06, "loss": 0.419, "step": 117300 }, { "epoch": 4.13, "learning_rate": 9.188555555555556e-06, "loss": 0.4259, "step": 117350 }, { "epoch": 4.13, "learning_rate": 9.183e-06, "loss": 0.4179, "step": 117400 }, { "epoch": 4.14, "learning_rate": 9.177444444444445e-06, "loss": 0.4235, "step": 117450 }, { "epoch": 4.14, "learning_rate": 9.17188888888889e-06, "loss": 0.4374, "step": 117500 }, { "epoch": 4.14, "eval_loss": 0.2589673399925232, "eval_runtime": 39.0454, "eval_samples_per_second": 36.368, "eval_steps_per_second": 2.279, "eval_wer": 0.19442679495325407, "step": 117500 }, { "epoch": 4.14, "learning_rate": 9.166333333333334e-06, "loss": 0.4416, "step": 117550 }, { "epoch": 4.14, "learning_rate": 9.160777777777778e-06, "loss": 0.4362, "step": 117600 }, { "epoch": 4.14, "learning_rate": 9.155222222222223e-06, "loss": 0.4043, "step": 117650 }, { "epoch": 4.14, "learning_rate": 9.149777777777779e-06, "loss": 0.6025, "step": 117700 }, { "epoch": 4.15, "learning_rate": 9.144222222222222e-06, "loss": 0.4304, "step": 117750 }, { "epoch": 4.15, "learning_rate": 9.138666666666668e-06, "loss": 0.5041, "step": 117800 }, { "epoch": 4.15, "learning_rate": 9.133111111111111e-06, "loss": 0.4548, "step": 117850 }, { "epoch": 4.15, "learning_rate": 9.127555555555557e-06, "loss": 0.4416, "step": 117900 }, { "epoch": 4.15, "learning_rate": 9.122e-06, "loss": 0.4303, "step": 117950 }, { "epoch": 4.15, "learning_rate": 9.116444444444445e-06, "loss": 0.4788, "step": 118000 }, { "epoch": 4.16, "learning_rate": 9.110888888888889e-06, "loss": 0.4082, "step": 118050 }, { "epoch": 4.16, "learning_rate": 9.105333333333334e-06, "loss": 0.4441, "step": 118100 }, { "epoch": 4.16, "learning_rate": 9.099777777777778e-06, "loss": 0.4429, "step": 118150 }, { "epoch": 4.16, "learning_rate": 9.094222222222223e-06, "loss": 0.4734, "step": 118200 }, { "epoch": 4.16, "learning_rate": 9.088666666666668e-06, "loss": 0.453, "step": 118250 }, { "epoch": 4.17, "learning_rate": 9.083111111111112e-06, "loss": 0.4298, "step": 118300 }, { "epoch": 4.17, "learning_rate": 9.077555555555555e-06, "loss": 0.4302, "step": 118350 }, { "epoch": 4.17, "learning_rate": 9.072e-06, "loss": 0.4255, "step": 118400 }, { "epoch": 4.17, "learning_rate": 9.066444444444446e-06, "loss": 0.4175, "step": 118450 }, { "epoch": 4.17, "learning_rate": 9.06088888888889e-06, "loss": 0.4251, "step": 118500 }, { "epoch": 4.17, "learning_rate": 9.055333333333333e-06, "loss": 0.4322, "step": 118550 }, { "epoch": 4.18, "learning_rate": 9.049777777777778e-06, "loss": 0.4239, "step": 118600 }, { "epoch": 4.18, "learning_rate": 9.044222222222223e-06, "loss": 0.4177, "step": 118650 }, { "epoch": 4.18, "learning_rate": 9.038666666666667e-06, "loss": 0.4972, "step": 118700 }, { "epoch": 4.18, "learning_rate": 9.033111111111112e-06, "loss": 0.4659, "step": 118750 }, { "epoch": 4.18, "learning_rate": 9.027555555555556e-06, "loss": 0.4127, "step": 118800 }, { "epoch": 4.18, "learning_rate": 9.022000000000001e-06, "loss": 0.4534, "step": 118850 }, { "epoch": 4.19, "learning_rate": 9.016444444444446e-06, "loss": 0.4222, "step": 118900 }, { "epoch": 4.19, "learning_rate": 9.01088888888889e-06, "loss": 0.4357, "step": 118950 }, { "epoch": 4.19, "learning_rate": 9.005333333333333e-06, "loss": 0.4237, "step": 119000 }, { "epoch": 4.19, "learning_rate": 8.999777777777779e-06, "loss": 0.4051, "step": 119050 }, { "epoch": 4.19, "learning_rate": 8.994222222222224e-06, "loss": 0.428, "step": 119100 }, { "epoch": 4.2, "learning_rate": 8.988666666666667e-06, "loss": 0.4602, "step": 119150 }, { "epoch": 4.2, "learning_rate": 8.983111111111111e-06, "loss": 0.4831, "step": 119200 }, { "epoch": 4.2, "learning_rate": 8.977555555555556e-06, "loss": 0.4238, "step": 119250 }, { "epoch": 4.2, "learning_rate": 8.972000000000002e-06, "loss": 0.4147, "step": 119300 }, { "epoch": 4.2, "learning_rate": 8.966444444444445e-06, "loss": 0.4164, "step": 119350 }, { "epoch": 4.2, "learning_rate": 8.96088888888889e-06, "loss": 0.4103, "step": 119400 }, { "epoch": 4.21, "learning_rate": 8.955333333333334e-06, "loss": 0.4108, "step": 119450 }, { "epoch": 4.21, "learning_rate": 8.949777777777779e-06, "loss": 0.4351, "step": 119500 }, { "epoch": 4.21, "learning_rate": 8.944222222222223e-06, "loss": 0.5185, "step": 119550 }, { "epoch": 4.21, "learning_rate": 8.938666666666668e-06, "loss": 0.4489, "step": 119600 }, { "epoch": 4.21, "learning_rate": 8.933111111111111e-06, "loss": 0.4219, "step": 119650 }, { "epoch": 4.21, "learning_rate": 8.927555555555557e-06, "loss": 0.4177, "step": 119700 }, { "epoch": 4.22, "learning_rate": 8.922e-06, "loss": 0.4416, "step": 119750 }, { "epoch": 4.22, "learning_rate": 8.916444444444446e-06, "loss": 0.5195, "step": 119800 }, { "epoch": 4.22, "learning_rate": 8.91088888888889e-06, "loss": 0.426, "step": 119850 }, { "epoch": 4.22, "learning_rate": 8.905333333333334e-06, "loss": 0.4407, "step": 119900 }, { "epoch": 4.22, "learning_rate": 8.899777777777778e-06, "loss": 0.4237, "step": 119950 }, { "epoch": 4.23, "learning_rate": 8.894222222222223e-06, "loss": 0.4155, "step": 120000 }, { "epoch": 4.23, "eval_loss": 0.26951727271080017, "eval_runtime": 24.9224, "eval_samples_per_second": 56.977, "eval_steps_per_second": 3.571, "eval_wer": 0.19606063356630662, "step": 120000 }, { "epoch": 4.23, "learning_rate": 8.888666666666668e-06, "loss": 0.4104, "step": 120050 }, { "epoch": 4.23, "learning_rate": 8.883111111111112e-06, "loss": 0.4126, "step": 120100 }, { "epoch": 4.23, "learning_rate": 8.877555555555556e-06, "loss": 0.4092, "step": 120150 }, { "epoch": 4.23, "learning_rate": 8.872e-06, "loss": 0.4253, "step": 120200 }, { "epoch": 4.23, "learning_rate": 8.866444444444446e-06, "loss": 0.4173, "step": 120250 }, { "epoch": 4.24, "learning_rate": 8.86088888888889e-06, "loss": 0.4167, "step": 120300 }, { "epoch": 4.24, "learning_rate": 8.855333333333333e-06, "loss": 0.437, "step": 120350 }, { "epoch": 4.24, "learning_rate": 8.849777777777778e-06, "loss": 0.4579, "step": 120400 }, { "epoch": 4.24, "learning_rate": 8.844222222222224e-06, "loss": 0.4462, "step": 120450 }, { "epoch": 4.24, "learning_rate": 8.838666666666667e-06, "loss": 0.4235, "step": 120500 }, { "epoch": 4.24, "learning_rate": 8.833111111111112e-06, "loss": 0.4218, "step": 120550 }, { "epoch": 4.25, "learning_rate": 8.827666666666668e-06, "loss": 0.456, "step": 120600 }, { "epoch": 4.25, "learning_rate": 8.822111111111112e-06, "loss": 0.4202, "step": 120650 }, { "epoch": 4.25, "learning_rate": 8.816555555555556e-06, "loss": 0.4381, "step": 120700 }, { "epoch": 4.25, "learning_rate": 8.811000000000001e-06, "loss": 0.4198, "step": 120750 }, { "epoch": 4.25, "learning_rate": 8.805444444444446e-06, "loss": 0.3988, "step": 120800 }, { "epoch": 4.25, "learning_rate": 8.79988888888889e-06, "loss": 0.491, "step": 120850 }, { "epoch": 4.26, "learning_rate": 8.794333333333333e-06, "loss": 0.5487, "step": 120900 }, { "epoch": 4.26, "learning_rate": 8.788777777777778e-06, "loss": 0.4352, "step": 120950 }, { "epoch": 4.26, "learning_rate": 8.783222222222224e-06, "loss": 0.4117, "step": 121000 }, { "epoch": 4.26, "learning_rate": 8.777666666666667e-06, "loss": 0.4183, "step": 121050 }, { "epoch": 4.26, "learning_rate": 8.772111111111113e-06, "loss": 0.4367, "step": 121100 }, { "epoch": 4.27, "learning_rate": 8.766555555555556e-06, "loss": 0.4219, "step": 121150 }, { "epoch": 4.27, "learning_rate": 8.761000000000001e-06, "loss": 0.4335, "step": 121200 }, { "epoch": 4.27, "learning_rate": 8.755444444444445e-06, "loss": 0.4408, "step": 121250 }, { "epoch": 4.27, "learning_rate": 8.74988888888889e-06, "loss": 0.3969, "step": 121300 }, { "epoch": 4.27, "learning_rate": 8.744333333333334e-06, "loss": 0.4182, "step": 121350 }, { "epoch": 4.27, "learning_rate": 8.738777777777779e-06, "loss": 0.4098, "step": 121400 }, { "epoch": 4.28, "learning_rate": 8.733222222222223e-06, "loss": 0.426, "step": 121450 }, { "epoch": 4.28, "learning_rate": 8.727666666666668e-06, "loss": 0.4341, "step": 121500 }, { "epoch": 4.28, "learning_rate": 8.722111111111113e-06, "loss": 0.4218, "step": 121550 }, { "epoch": 4.28, "learning_rate": 8.716555555555557e-06, "loss": 0.4353, "step": 121600 }, { "epoch": 4.28, "learning_rate": 8.711e-06, "loss": 0.4252, "step": 121650 }, { "epoch": 4.28, "learning_rate": 8.705444444444445e-06, "loss": 0.4307, "step": 121700 }, { "epoch": 4.29, "learning_rate": 8.69988888888889e-06, "loss": 0.4204, "step": 121750 }, { "epoch": 4.29, "learning_rate": 8.694333333333334e-06, "loss": 0.4307, "step": 121800 }, { "epoch": 4.29, "learning_rate": 8.688777777777778e-06, "loss": 0.401, "step": 121850 }, { "epoch": 4.29, "learning_rate": 8.683222222222223e-06, "loss": 0.4145, "step": 121900 }, { "epoch": 4.29, "learning_rate": 8.677666666666668e-06, "loss": 0.4519, "step": 121950 }, { "epoch": 4.3, "learning_rate": 8.672111111111112e-06, "loss": 0.4096, "step": 122000 }, { "epoch": 4.3, "learning_rate": 8.666555555555555e-06, "loss": 0.4577, "step": 122050 }, { "epoch": 4.3, "learning_rate": 8.661e-06, "loss": 0.4422, "step": 122100 }, { "epoch": 4.3, "learning_rate": 8.655444444444446e-06, "loss": 0.4524, "step": 122150 }, { "epoch": 4.3, "learning_rate": 8.64988888888889e-06, "loss": 0.4259, "step": 122200 }, { "epoch": 4.3, "learning_rate": 8.644333333333335e-06, "loss": 0.4715, "step": 122250 }, { "epoch": 4.31, "learning_rate": 8.638777777777778e-06, "loss": 0.4193, "step": 122300 }, { "epoch": 4.31, "learning_rate": 8.633222222222223e-06, "loss": 0.4365, "step": 122350 }, { "epoch": 4.31, "learning_rate": 8.627666666666667e-06, "loss": 0.4382, "step": 122400 }, { "epoch": 4.31, "learning_rate": 8.622111111111112e-06, "loss": 0.4023, "step": 122450 }, { "epoch": 4.31, "learning_rate": 8.616555555555556e-06, "loss": 0.4463, "step": 122500 }, { "epoch": 4.31, "eval_loss": 0.26047635078430176, "eval_runtime": 38.2142, "eval_samples_per_second": 37.159, "eval_steps_per_second": 2.329, "eval_wer": 0.1908868112916402, "step": 122500 }, { "epoch": 4.31, "learning_rate": 8.611000000000001e-06, "loss": 0.4438, "step": 122550 }, { "epoch": 4.32, "learning_rate": 8.605444444444445e-06, "loss": 0.411, "step": 122600 }, { "epoch": 4.32, "learning_rate": 8.59988888888889e-06, "loss": 0.483, "step": 122650 }, { "epoch": 4.32, "learning_rate": 8.594333333333335e-06, "loss": 0.4134, "step": 122700 }, { "epoch": 4.32, "learning_rate": 8.588777777777779e-06, "loss": 0.4147, "step": 122750 }, { "epoch": 4.32, "learning_rate": 8.583222222222222e-06, "loss": 0.4419, "step": 122800 }, { "epoch": 4.33, "learning_rate": 8.577666666666667e-06, "loss": 0.4296, "step": 122850 }, { "epoch": 4.33, "learning_rate": 8.572111111111113e-06, "loss": 0.4181, "step": 122900 }, { "epoch": 4.33, "learning_rate": 8.566555555555556e-06, "loss": 0.42, "step": 122950 }, { "epoch": 4.33, "learning_rate": 8.561e-06, "loss": 0.4156, "step": 123000 }, { "epoch": 4.33, "learning_rate": 8.555444444444445e-06, "loss": 0.439, "step": 123050 }, { "epoch": 4.33, "learning_rate": 8.54988888888889e-06, "loss": 0.4394, "step": 123100 }, { "epoch": 4.34, "learning_rate": 8.544333333333334e-06, "loss": 0.4242, "step": 123150 }, { "epoch": 4.34, "learning_rate": 8.538777777777777e-06, "loss": 0.4725, "step": 123200 }, { "epoch": 4.34, "learning_rate": 8.533222222222223e-06, "loss": 0.4143, "step": 123250 }, { "epoch": 4.34, "learning_rate": 8.527666666666668e-06, "loss": 0.4474, "step": 123300 }, { "epoch": 4.34, "learning_rate": 8.522111111111112e-06, "loss": 0.4137, "step": 123350 }, { "epoch": 4.34, "learning_rate": 8.516555555555557e-06, "loss": 0.4207, "step": 123400 }, { "epoch": 4.35, "learning_rate": 8.511e-06, "loss": 0.4154, "step": 123450 }, { "epoch": 4.35, "learning_rate": 8.505444444444446e-06, "loss": 0.4351, "step": 123500 }, { "epoch": 4.35, "learning_rate": 8.499888888888889e-06, "loss": 0.42, "step": 123550 }, { "epoch": 4.35, "learning_rate": 8.494333333333334e-06, "loss": 0.3893, "step": 123600 }, { "epoch": 4.35, "learning_rate": 8.488777777777778e-06, "loss": 0.4259, "step": 123650 }, { "epoch": 4.36, "learning_rate": 8.483222222222223e-06, "loss": 0.4115, "step": 123700 }, { "epoch": 4.36, "learning_rate": 8.477666666666667e-06, "loss": 0.4395, "step": 123750 }, { "epoch": 4.36, "learning_rate": 8.472111111111112e-06, "loss": 0.4023, "step": 123800 }, { "epoch": 4.36, "learning_rate": 8.466555555555557e-06, "loss": 0.4192, "step": 123850 }, { "epoch": 4.36, "learning_rate": 8.461e-06, "loss": 0.4525, "step": 123900 }, { "epoch": 4.36, "learning_rate": 8.455444444444444e-06, "loss": 0.4446, "step": 123950 }, { "epoch": 4.37, "learning_rate": 8.44988888888889e-06, "loss": 0.3942, "step": 124000 }, { "epoch": 4.37, "learning_rate": 8.444333333333335e-06, "loss": 0.4404, "step": 124050 }, { "epoch": 4.37, "learning_rate": 8.438777777777778e-06, "loss": 0.4633, "step": 124100 }, { "epoch": 4.37, "learning_rate": 8.433222222222222e-06, "loss": 0.4001, "step": 124150 }, { "epoch": 4.37, "learning_rate": 8.427666666666667e-06, "loss": 0.4, "step": 124200 }, { "epoch": 4.37, "learning_rate": 8.422111111111112e-06, "loss": 0.433, "step": 124250 }, { "epoch": 4.38, "learning_rate": 8.416555555555556e-06, "loss": 0.418, "step": 124300 }, { "epoch": 4.38, "learning_rate": 8.411e-06, "loss": 0.4291, "step": 124350 }, { "epoch": 4.38, "learning_rate": 8.405444444444445e-06, "loss": 0.413, "step": 124400 }, { "epoch": 4.38, "learning_rate": 8.39988888888889e-06, "loss": 0.4252, "step": 124450 }, { "epoch": 4.38, "learning_rate": 8.394333333333334e-06, "loss": 0.4484, "step": 124500 }, { "epoch": 4.39, "learning_rate": 8.38888888888889e-06, "loss": 0.6226, "step": 124550 }, { "epoch": 4.39, "learning_rate": 8.383333333333335e-06, "loss": 0.4139, "step": 124600 }, { "epoch": 4.39, "learning_rate": 8.377777777777779e-06, "loss": 0.4256, "step": 124650 }, { "epoch": 4.39, "learning_rate": 8.372222222222222e-06, "loss": 0.4212, "step": 124700 }, { "epoch": 4.39, "learning_rate": 8.366666666666667e-06, "loss": 0.4198, "step": 124750 }, { "epoch": 4.39, "learning_rate": 8.361111111111113e-06, "loss": 0.4221, "step": 124800 }, { "epoch": 4.4, "learning_rate": 8.355555555555556e-06, "loss": 0.4286, "step": 124850 }, { "epoch": 4.4, "learning_rate": 8.35e-06, "loss": 0.3963, "step": 124900 }, { "epoch": 4.4, "learning_rate": 8.344444444444445e-06, "loss": 0.4118, "step": 124950 }, { "epoch": 4.4, "learning_rate": 8.33888888888889e-06, "loss": 0.4007, "step": 125000 }, { "epoch": 4.4, "eval_loss": 0.25289013981819153, "eval_runtime": 23.8032, "eval_samples_per_second": 59.656, "eval_steps_per_second": 3.739, "eval_wer": 0.18907143505491514, "step": 125000 }, { "epoch": 4.4, "learning_rate": 8.333333333333334e-06, "loss": 0.4459, "step": 125050 }, { "epoch": 4.4, "learning_rate": 8.327777777777777e-06, "loss": 0.4174, "step": 125100 }, { "epoch": 4.41, "learning_rate": 8.322222222222223e-06, "loss": 0.4815, "step": 125150 }, { "epoch": 4.41, "learning_rate": 8.316666666666668e-06, "loss": 0.4469, "step": 125200 }, { "epoch": 4.41, "learning_rate": 8.311111111111111e-06, "loss": 0.4361, "step": 125250 }, { "epoch": 4.41, "learning_rate": 8.305555555555557e-06, "loss": 0.3834, "step": 125300 }, { "epoch": 4.41, "learning_rate": 8.3e-06, "loss": 0.4088, "step": 125350 }, { "epoch": 4.42, "learning_rate": 8.294444444444445e-06, "loss": 0.4328, "step": 125400 }, { "epoch": 4.42, "learning_rate": 8.288888888888889e-06, "loss": 0.4548, "step": 125450 }, { "epoch": 4.42, "learning_rate": 8.283333333333334e-06, "loss": 0.4313, "step": 125500 }, { "epoch": 4.42, "learning_rate": 8.277777777777778e-06, "loss": 0.4566, "step": 125550 }, { "epoch": 4.42, "learning_rate": 8.272222222222223e-06, "loss": 0.3875, "step": 125600 }, { "epoch": 4.42, "learning_rate": 8.266666666666667e-06, "loss": 0.421, "step": 125650 }, { "epoch": 4.43, "learning_rate": 8.261111111111112e-06, "loss": 0.4307, "step": 125700 }, { "epoch": 4.43, "learning_rate": 8.255555555555557e-06, "loss": 0.4198, "step": 125750 }, { "epoch": 4.43, "learning_rate": 8.25e-06, "loss": 0.4144, "step": 125800 }, { "epoch": 4.43, "learning_rate": 8.244444444444444e-06, "loss": 0.4036, "step": 125850 }, { "epoch": 4.43, "learning_rate": 8.23888888888889e-06, "loss": 0.5544, "step": 125900 }, { "epoch": 4.43, "learning_rate": 8.233333333333335e-06, "loss": 0.4207, "step": 125950 }, { "epoch": 4.44, "learning_rate": 8.227777777777778e-06, "loss": 0.4334, "step": 126000 }, { "epoch": 4.44, "learning_rate": 8.222222222222222e-06, "loss": 0.4333, "step": 126050 }, { "epoch": 4.44, "learning_rate": 8.216666666666667e-06, "loss": 0.4327, "step": 126100 }, { "epoch": 4.44, "learning_rate": 8.211111111111112e-06, "loss": 0.4389, "step": 126150 }, { "epoch": 4.44, "learning_rate": 8.205666666666667e-06, "loss": 0.4545, "step": 126200 }, { "epoch": 4.45, "learning_rate": 8.200111111111112e-06, "loss": 0.4123, "step": 126250 }, { "epoch": 4.45, "learning_rate": 8.194555555555557e-06, "loss": 0.4031, "step": 126300 }, { "epoch": 4.45, "learning_rate": 8.189e-06, "loss": 0.4163, "step": 126350 }, { "epoch": 4.45, "learning_rate": 8.183444444444444e-06, "loss": 0.4188, "step": 126400 }, { "epoch": 4.45, "learning_rate": 8.17788888888889e-06, "loss": 0.4294, "step": 126450 }, { "epoch": 4.45, "learning_rate": 8.172333333333335e-06, "loss": 0.4096, "step": 126500 }, { "epoch": 4.46, "learning_rate": 8.166777777777778e-06, "loss": 0.4238, "step": 126550 }, { "epoch": 4.46, "learning_rate": 8.161222222222222e-06, "loss": 0.4911, "step": 126600 }, { "epoch": 4.46, "learning_rate": 8.155666666666667e-06, "loss": 0.4127, "step": 126650 }, { "epoch": 4.46, "learning_rate": 8.150111111111112e-06, "loss": 0.4091, "step": 126700 }, { "epoch": 4.46, "learning_rate": 8.144555555555556e-06, "loss": 0.4582, "step": 126750 }, { "epoch": 4.46, "learning_rate": 8.139e-06, "loss": 0.437, "step": 126800 }, { "epoch": 4.47, "learning_rate": 8.133444444444445e-06, "loss": 0.4275, "step": 126850 }, { "epoch": 4.47, "learning_rate": 8.12788888888889e-06, "loss": 0.4271, "step": 126900 }, { "epoch": 4.47, "learning_rate": 8.122333333333334e-06, "loss": 0.4143, "step": 126950 }, { "epoch": 4.47, "learning_rate": 8.116777777777779e-06, "loss": 0.4273, "step": 127000 }, { "epoch": 4.47, "learning_rate": 8.111222222222222e-06, "loss": 0.422, "step": 127050 }, { "epoch": 4.48, "learning_rate": 8.105666666666668e-06, "loss": 0.4286, "step": 127100 }, { "epoch": 4.48, "learning_rate": 8.100111111111111e-06, "loss": 0.4087, "step": 127150 }, { "epoch": 4.48, "learning_rate": 8.094555555555556e-06, "loss": 0.48, "step": 127200 }, { "epoch": 4.48, "learning_rate": 8.089e-06, "loss": 0.4007, "step": 127250 }, { "epoch": 4.48, "learning_rate": 8.083444444444445e-06, "loss": 0.401, "step": 127300 }, { "epoch": 4.48, "learning_rate": 8.077888888888889e-06, "loss": 0.4747, "step": 127350 }, { "epoch": 4.49, "learning_rate": 8.072333333333334e-06, "loss": 0.4299, "step": 127400 }, { "epoch": 4.49, "learning_rate": 8.06677777777778e-06, "loss": 0.3924, "step": 127450 }, { "epoch": 4.49, "learning_rate": 8.061222222222223e-06, "loss": 0.4156, "step": 127500 }, { "epoch": 4.49, "eval_loss": 0.2567712068557739, "eval_runtime": 6.6995, "eval_samples_per_second": 211.957, "eval_steps_per_second": 13.285, "eval_wer": 0.19134065535082145, "step": 127500 }, { "epoch": 4.49, "learning_rate": 8.055666666666666e-06, "loss": 0.4249, "step": 127550 }, { "epoch": 4.49, "learning_rate": 8.050111111111112e-06, "loss": 0.4377, "step": 127600 }, { "epoch": 4.49, "learning_rate": 8.044555555555557e-06, "loss": 0.4069, "step": 127650 }, { "epoch": 4.5, "learning_rate": 8.039e-06, "loss": 0.4271, "step": 127700 }, { "epoch": 4.5, "learning_rate": 8.033444444444444e-06, "loss": 0.4011, "step": 127750 }, { "epoch": 4.5, "learning_rate": 8.02788888888889e-06, "loss": 0.473, "step": 127800 }, { "epoch": 4.5, "learning_rate": 8.022333333333335e-06, "loss": 0.4562, "step": 127850 }, { "epoch": 4.5, "learning_rate": 8.016777777777778e-06, "loss": 0.4099, "step": 127900 }, { "epoch": 4.5, "learning_rate": 8.011222222222222e-06, "loss": 0.4239, "step": 127950 }, { "epoch": 4.51, "learning_rate": 8.005666666666667e-06, "loss": 0.4282, "step": 128000 }, { "epoch": 4.51, "learning_rate": 8.000111111111112e-06, "loss": 0.3829, "step": 128050 }, { "epoch": 4.51, "learning_rate": 7.994555555555556e-06, "loss": 0.4724, "step": 128100 }, { "epoch": 4.51, "learning_rate": 7.989000000000001e-06, "loss": 0.4187, "step": 128150 }, { "epoch": 4.51, "learning_rate": 7.983444444444444e-06, "loss": 0.4611, "step": 128200 }, { "epoch": 4.52, "learning_rate": 7.97788888888889e-06, "loss": 0.4285, "step": 128250 }, { "epoch": 4.52, "learning_rate": 7.972333333333335e-06, "loss": 0.4482, "step": 128300 }, { "epoch": 4.52, "learning_rate": 7.966777777777779e-06, "loss": 0.4661, "step": 128350 }, { "epoch": 4.52, "learning_rate": 7.961222222222222e-06, "loss": 0.4221, "step": 128400 }, { "epoch": 4.52, "learning_rate": 7.955666666666667e-06, "loss": 0.4083, "step": 128450 }, { "epoch": 4.52, "learning_rate": 7.950111111111113e-06, "loss": 0.3883, "step": 128500 }, { "epoch": 4.53, "learning_rate": 7.944555555555556e-06, "loss": 0.4302, "step": 128550 }, { "epoch": 4.53, "learning_rate": 7.939000000000001e-06, "loss": 0.4398, "step": 128600 }, { "epoch": 4.53, "learning_rate": 7.933444444444445e-06, "loss": 0.4336, "step": 128650 }, { "epoch": 4.53, "learning_rate": 7.92788888888889e-06, "loss": 0.4262, "step": 128700 }, { "epoch": 4.53, "learning_rate": 7.922333333333334e-06, "loss": 0.397, "step": 128750 }, { "epoch": 4.53, "learning_rate": 7.916777777777779e-06, "loss": 0.4435, "step": 128800 }, { "epoch": 4.54, "learning_rate": 7.911222222222223e-06, "loss": 0.4215, "step": 128850 }, { "epoch": 4.54, "learning_rate": 7.905666666666668e-06, "loss": 0.4219, "step": 128900 }, { "epoch": 4.54, "learning_rate": 7.900111111111111e-06, "loss": 0.4285, "step": 128950 }, { "epoch": 4.54, "learning_rate": 7.894555555555557e-06, "loss": 0.4394, "step": 129000 }, { "epoch": 4.54, "learning_rate": 7.889000000000002e-06, "loss": 0.4344, "step": 129050 }, { "epoch": 4.55, "learning_rate": 7.883444444444445e-06, "loss": 0.435, "step": 129100 }, { "epoch": 4.55, "learning_rate": 7.877888888888889e-06, "loss": 0.4249, "step": 129150 }, { "epoch": 4.55, "learning_rate": 7.872333333333334e-06, "loss": 0.4618, "step": 129200 }, { "epoch": 4.55, "learning_rate": 7.86677777777778e-06, "loss": 0.4796, "step": 129250 }, { "epoch": 4.55, "learning_rate": 7.861222222222223e-06, "loss": 0.4397, "step": 129300 }, { "epoch": 4.55, "learning_rate": 7.855666666666667e-06, "loss": 0.4568, "step": 129350 }, { "epoch": 4.56, "learning_rate": 7.850111111111112e-06, "loss": 0.4128, "step": 129400 }, { "epoch": 4.56, "learning_rate": 7.844555555555557e-06, "loss": 0.4137, "step": 129450 }, { "epoch": 4.56, "learning_rate": 7.839e-06, "loss": 0.4334, "step": 129500 }, { "epoch": 4.56, "learning_rate": 7.833444444444444e-06, "loss": 0.4018, "step": 129550 }, { "epoch": 4.56, "learning_rate": 7.82788888888889e-06, "loss": 0.4283, "step": 129600 }, { "epoch": 4.56, "learning_rate": 7.822333333333335e-06, "loss": 0.4478, "step": 129650 }, { "epoch": 4.57, "learning_rate": 7.816777777777778e-06, "loss": 0.4246, "step": 129700 }, { "epoch": 4.57, "learning_rate": 7.811222222222224e-06, "loss": 0.4902, "step": 129750 }, { "epoch": 4.57, "learning_rate": 7.805666666666667e-06, "loss": 0.4549, "step": 129800 }, { "epoch": 4.57, "learning_rate": 7.800111111111112e-06, "loss": 0.4256, "step": 129850 }, { "epoch": 4.57, "learning_rate": 7.794555555555556e-06, "loss": 0.4648, "step": 129900 }, { "epoch": 4.58, "learning_rate": 7.789000000000001e-06, "loss": 0.4186, "step": 129950 }, { "epoch": 4.58, "learning_rate": 7.783444444444445e-06, "loss": 0.4124, "step": 130000 }, { "epoch": 4.58, "eval_loss": 0.25591251254081726, "eval_runtime": 13.7422, "eval_samples_per_second": 103.331, "eval_steps_per_second": 6.476, "eval_wer": 0.18888989743124263, "step": 130000 }, { "epoch": 4.58, "learning_rate": 7.77788888888889e-06, "loss": 0.4182, "step": 130050 }, { "epoch": 4.58, "learning_rate": 7.772333333333334e-06, "loss": 0.41, "step": 130100 }, { "epoch": 4.58, "learning_rate": 7.766777777777779e-06, "loss": 0.3967, "step": 130150 }, { "epoch": 4.58, "learning_rate": 7.761222222222224e-06, "loss": 0.415, "step": 130200 }, { "epoch": 4.59, "learning_rate": 7.755666666666668e-06, "loss": 0.4861, "step": 130250 }, { "epoch": 4.59, "learning_rate": 7.750111111111111e-06, "loss": 0.4179, "step": 130300 }, { "epoch": 4.59, "learning_rate": 7.744555555555556e-06, "loss": 0.417, "step": 130350 }, { "epoch": 4.59, "learning_rate": 7.739000000000002e-06, "loss": 0.4061, "step": 130400 }, { "epoch": 4.59, "learning_rate": 7.733444444444445e-06, "loss": 0.4098, "step": 130450 }, { "epoch": 4.59, "learning_rate": 7.727888888888889e-06, "loss": 0.5971, "step": 130500 }, { "epoch": 4.6, "learning_rate": 7.722333333333334e-06, "loss": 0.4586, "step": 130550 }, { "epoch": 4.6, "learning_rate": 7.71677777777778e-06, "loss": 0.4342, "step": 130600 }, { "epoch": 4.6, "learning_rate": 7.711222222222223e-06, "loss": 0.5056, "step": 130650 }, { "epoch": 4.6, "learning_rate": 7.705666666666666e-06, "loss": 0.4647, "step": 130700 }, { "epoch": 4.6, "learning_rate": 7.700111111111112e-06, "loss": 0.4302, "step": 130750 }, { "epoch": 4.61, "learning_rate": 7.694555555555557e-06, "loss": 0.427, "step": 130800 }, { "epoch": 4.61, "learning_rate": 7.689e-06, "loss": 0.4205, "step": 130850 }, { "epoch": 4.61, "learning_rate": 7.683444444444446e-06, "loss": 0.4025, "step": 130900 }, { "epoch": 4.61, "learning_rate": 7.67788888888889e-06, "loss": 0.4171, "step": 130950 }, { "epoch": 4.61, "learning_rate": 7.672333333333334e-06, "loss": 0.4523, "step": 131000 }, { "epoch": 4.61, "learning_rate": 7.666777777777778e-06, "loss": 0.446, "step": 131050 }, { "epoch": 4.62, "learning_rate": 7.661222222222223e-06, "loss": 0.4255, "step": 131100 }, { "epoch": 4.62, "learning_rate": 7.655666666666667e-06, "loss": 0.4066, "step": 131150 }, { "epoch": 4.62, "learning_rate": 7.650111111111112e-06, "loss": 0.4485, "step": 131200 }, { "epoch": 4.62, "learning_rate": 7.644555555555556e-06, "loss": 0.4072, "step": 131250 }, { "epoch": 4.62, "learning_rate": 7.639000000000001e-06, "loss": 0.4288, "step": 131300 }, { "epoch": 4.62, "learning_rate": 7.633444444444446e-06, "loss": 0.4363, "step": 131350 }, { "epoch": 4.63, "learning_rate": 7.627888888888889e-06, "loss": 0.4275, "step": 131400 }, { "epoch": 4.63, "learning_rate": 7.622333333333334e-06, "loss": 0.4593, "step": 131450 }, { "epoch": 4.63, "learning_rate": 7.6167777777777785e-06, "loss": 0.4396, "step": 131500 }, { "epoch": 4.63, "learning_rate": 7.611333333333334e-06, "loss": 0.5174, "step": 131550 }, { "epoch": 4.63, "learning_rate": 7.605777777777779e-06, "loss": 0.4277, "step": 131600 }, { "epoch": 4.64, "learning_rate": 7.600222222222223e-06, "loss": 0.4219, "step": 131650 }, { "epoch": 4.64, "learning_rate": 7.594666666666667e-06, "loss": 0.4002, "step": 131700 }, { "epoch": 4.64, "learning_rate": 7.589111111111111e-06, "loss": 0.3981, "step": 131750 }, { "epoch": 4.64, "learning_rate": 7.5835555555555566e-06, "loss": 0.4031, "step": 131800 }, { "epoch": 4.64, "learning_rate": 7.578000000000001e-06, "loss": 0.5326, "step": 131850 }, { "epoch": 4.64, "learning_rate": 7.572444444444445e-06, "loss": 0.4339, "step": 131900 }, { "epoch": 4.65, "learning_rate": 7.566888888888889e-06, "loss": 0.3858, "step": 131950 }, { "epoch": 4.65, "learning_rate": 7.561333333333334e-06, "loss": 0.3974, "step": 132000 }, { "epoch": 4.65, "learning_rate": 7.555777777777779e-06, "loss": 0.5978, "step": 132050 }, { "epoch": 4.65, "learning_rate": 7.550222222222223e-06, "loss": 0.4056, "step": 132100 }, { "epoch": 4.65, "learning_rate": 7.5446666666666665e-06, "loss": 0.4251, "step": 132150 }, { "epoch": 4.65, "learning_rate": 7.539111111111112e-06, "loss": 0.4302, "step": 132200 }, { "epoch": 4.66, "learning_rate": 7.533555555555556e-06, "loss": 0.5335, "step": 132250 }, { "epoch": 4.66, "learning_rate": 7.528000000000001e-06, "loss": 0.4492, "step": 132300 }, { "epoch": 4.66, "learning_rate": 7.522444444444446e-06, "loss": 0.3989, "step": 132350 }, { "epoch": 4.66, "learning_rate": 7.516888888888889e-06, "loss": 0.4463, "step": 132400 }, { "epoch": 4.66, "learning_rate": 7.511333333333334e-06, "loss": 0.4414, "step": 132450 }, { "epoch": 4.67, "learning_rate": 7.505777777777778e-06, "loss": 0.4085, "step": 132500 }, { "epoch": 4.67, "eval_loss": 0.26099899411201477, "eval_runtime": 9.5247, "eval_samples_per_second": 149.086, "eval_steps_per_second": 9.344, "eval_wer": 0.19215757465734773, "step": 132500 }, { "epoch": 4.67, "learning_rate": 7.5002222222222235e-06, "loss": 0.4296, "step": 132550 }, { "epoch": 4.67, "learning_rate": 7.494666666666667e-06, "loss": 0.415, "step": 132600 }, { "epoch": 4.67, "learning_rate": 7.4891111111111114e-06, "loss": 0.4392, "step": 132650 }, { "epoch": 4.67, "learning_rate": 7.483555555555556e-06, "loss": 0.4135, "step": 132700 }, { "epoch": 4.67, "learning_rate": 7.478000000000001e-06, "loss": 0.4049, "step": 132750 }, { "epoch": 4.68, "learning_rate": 7.4724444444444455e-06, "loss": 0.4018, "step": 132800 }, { "epoch": 4.68, "learning_rate": 7.466888888888889e-06, "loss": 0.4366, "step": 132850 }, { "epoch": 4.68, "learning_rate": 7.4613333333333334e-06, "loss": 0.4174, "step": 132900 }, { "epoch": 4.68, "learning_rate": 7.455777777777779e-06, "loss": 0.454, "step": 132950 }, { "epoch": 4.68, "learning_rate": 7.450222222222223e-06, "loss": 0.4026, "step": 133000 }, { "epoch": 4.68, "learning_rate": 7.4446666666666675e-06, "loss": 0.4391, "step": 133050 }, { "epoch": 4.69, "learning_rate": 7.439111111111111e-06, "loss": 0.4258, "step": 133100 }, { "epoch": 4.69, "learning_rate": 7.433555555555556e-06, "loss": 0.5237, "step": 133150 }, { "epoch": 4.69, "learning_rate": 7.428000000000001e-06, "loss": 0.4477, "step": 133200 }, { "epoch": 4.69, "learning_rate": 7.422444444444445e-06, "loss": 0.4183, "step": 133250 }, { "epoch": 4.69, "learning_rate": 7.416888888888889e-06, "loss": 0.4287, "step": 133300 }, { "epoch": 4.7, "learning_rate": 7.411333333333334e-06, "loss": 0.4452, "step": 133350 }, { "epoch": 4.7, "learning_rate": 7.405777777777778e-06, "loss": 0.4206, "step": 133400 }, { "epoch": 4.7, "learning_rate": 7.400222222222223e-06, "loss": 0.4187, "step": 133450 }, { "epoch": 4.7, "learning_rate": 7.394666666666668e-06, "loss": 0.3999, "step": 133500 }, { "epoch": 4.7, "learning_rate": 7.3891111111111115e-06, "loss": 0.4153, "step": 133550 }, { "epoch": 4.7, "learning_rate": 7.383555555555556e-06, "loss": 0.4441, "step": 133600 }, { "epoch": 4.71, "learning_rate": 7.378e-06, "loss": 0.4521, "step": 133650 }, { "epoch": 4.71, "learning_rate": 7.372444444444446e-06, "loss": 0.4325, "step": 133700 }, { "epoch": 4.71, "learning_rate": 7.367000000000001e-06, "loss": 0.4215, "step": 133750 }, { "epoch": 4.71, "learning_rate": 7.361444444444445e-06, "loss": 0.3884, "step": 133800 }, { "epoch": 4.71, "learning_rate": 7.355888888888889e-06, "loss": 0.4179, "step": 133850 }, { "epoch": 4.71, "learning_rate": 7.350333333333334e-06, "loss": 0.4121, "step": 133900 }, { "epoch": 4.72, "learning_rate": 7.344777777777778e-06, "loss": 0.4459, "step": 133950 }, { "epoch": 4.72, "learning_rate": 7.339222222222223e-06, "loss": 0.4326, "step": 134000 }, { "epoch": 4.72, "learning_rate": 7.333666666666666e-06, "loss": 0.5749, "step": 134050 }, { "epoch": 4.72, "learning_rate": 7.328111111111112e-06, "loss": 0.4129, "step": 134100 }, { "epoch": 4.72, "learning_rate": 7.322555555555556e-06, "loss": 0.4514, "step": 134150 }, { "epoch": 4.73, "learning_rate": 7.317111111111111e-06, "loss": 0.427, "step": 134200 }, { "epoch": 4.73, "learning_rate": 7.3115555555555565e-06, "loss": 0.413, "step": 134250 }, { "epoch": 4.73, "learning_rate": 7.306000000000001e-06, "loss": 0.4161, "step": 134300 }, { "epoch": 4.73, "learning_rate": 7.300444444444445e-06, "loss": 0.4417, "step": 134350 }, { "epoch": 4.73, "learning_rate": 7.294888888888889e-06, "loss": 0.4181, "step": 134400 }, { "epoch": 4.73, "learning_rate": 7.289333333333334e-06, "loss": 0.3973, "step": 134450 }, { "epoch": 4.74, "learning_rate": 7.2837777777777785e-06, "loss": 0.4214, "step": 134500 }, { "epoch": 4.74, "learning_rate": 7.278222222222223e-06, "loss": 0.4319, "step": 134550 }, { "epoch": 4.74, "learning_rate": 7.2726666666666664e-06, "loss": 0.413, "step": 134600 }, { "epoch": 4.74, "learning_rate": 7.267111111111112e-06, "loss": 0.4058, "step": 134650 }, { "epoch": 4.74, "learning_rate": 7.261555555555556e-06, "loss": 0.4113, "step": 134700 }, { "epoch": 4.74, "learning_rate": 7.2560000000000005e-06, "loss": 0.4223, "step": 134750 }, { "epoch": 4.75, "learning_rate": 7.250444444444446e-06, "loss": 0.3949, "step": 134800 }, { "epoch": 4.75, "learning_rate": 7.244888888888889e-06, "loss": 0.4225, "step": 134850 }, { "epoch": 4.75, "learning_rate": 7.239333333333334e-06, "loss": 0.4361, "step": 134900 }, { "epoch": 4.75, "learning_rate": 7.233777777777778e-06, "loss": 0.4238, "step": 134950 }, { "epoch": 4.75, "learning_rate": 7.228222222222223e-06, "loss": 0.4474, "step": 135000 }, { "epoch": 4.75, "eval_loss": 0.2588209807872772, "eval_runtime": 15.8071, "eval_samples_per_second": 89.833, "eval_steps_per_second": 5.63, "eval_wer": 0.19606063356630662, "step": 135000 }, { "epoch": 4.75, "learning_rate": 7.222666666666667e-06, "loss": 0.3867, "step": 135050 }, { "epoch": 4.76, "learning_rate": 7.217111111111111e-06, "loss": 0.4111, "step": 135100 }, { "epoch": 4.76, "learning_rate": 7.211555555555556e-06, "loss": 0.4436, "step": 135150 }, { "epoch": 4.76, "learning_rate": 7.206000000000001e-06, "loss": 0.4442, "step": 135200 }, { "epoch": 4.76, "learning_rate": 7.200444444444445e-06, "loss": 0.508, "step": 135250 }, { "epoch": 4.76, "learning_rate": 7.194888888888889e-06, "loss": 0.4338, "step": 135300 }, { "epoch": 4.77, "learning_rate": 7.189333333333333e-06, "loss": 0.4081, "step": 135350 }, { "epoch": 4.77, "learning_rate": 7.183777777777779e-06, "loss": 0.4171, "step": 135400 }, { "epoch": 4.77, "learning_rate": 7.178222222222223e-06, "loss": 0.4395, "step": 135450 }, { "epoch": 4.77, "learning_rate": 7.172666666666667e-06, "loss": 0.4138, "step": 135500 }, { "epoch": 4.77, "learning_rate": 7.167111111111111e-06, "loss": 0.4253, "step": 135550 }, { "epoch": 4.77, "learning_rate": 7.161555555555556e-06, "loss": 0.4189, "step": 135600 }, { "epoch": 4.78, "learning_rate": 7.156000000000001e-06, "loss": 0.4035, "step": 135650 }, { "epoch": 4.78, "learning_rate": 7.150444444444445e-06, "loss": 0.4028, "step": 135700 }, { "epoch": 4.78, "learning_rate": 7.1448888888888886e-06, "loss": 0.4734, "step": 135750 }, { "epoch": 4.78, "learning_rate": 7.139333333333334e-06, "loss": 0.4181, "step": 135800 }, { "epoch": 4.78, "learning_rate": 7.133777777777778e-06, "loss": 0.4099, "step": 135850 }, { "epoch": 4.78, "learning_rate": 7.128222222222223e-06, "loss": 0.4054, "step": 135900 }, { "epoch": 4.79, "learning_rate": 7.122666666666668e-06, "loss": 0.412, "step": 135950 }, { "epoch": 4.79, "learning_rate": 7.1171111111111114e-06, "loss": 0.419, "step": 136000 }, { "epoch": 4.79, "learning_rate": 7.111555555555556e-06, "loss": 0.4033, "step": 136050 }, { "epoch": 4.79, "learning_rate": 7.106000000000001e-06, "loss": 0.3971, "step": 136100 }, { "epoch": 4.79, "learning_rate": 7.1004444444444455e-06, "loss": 0.4563, "step": 136150 }, { "epoch": 4.8, "learning_rate": 7.094888888888889e-06, "loss": 0.4371, "step": 136200 }, { "epoch": 4.8, "learning_rate": 7.0893333333333334e-06, "loss": 0.4147, "step": 136250 }, { "epoch": 4.8, "learning_rate": 7.083777777777779e-06, "loss": 0.4189, "step": 136300 }, { "epoch": 4.8, "learning_rate": 7.078222222222223e-06, "loss": 0.5114, "step": 136350 }, { "epoch": 4.8, "learning_rate": 7.0726666666666675e-06, "loss": 0.4161, "step": 136400 }, { "epoch": 4.8, "learning_rate": 7.067111111111111e-06, "loss": 0.4067, "step": 136450 }, { "epoch": 4.81, "learning_rate": 7.061555555555556e-06, "loss": 0.4415, "step": 136500 }, { "epoch": 4.81, "learning_rate": 7.056000000000001e-06, "loss": 0.3959, "step": 136550 }, { "epoch": 4.81, "learning_rate": 7.050444444444445e-06, "loss": 0.4, "step": 136600 }, { "epoch": 4.81, "learning_rate": 7.04488888888889e-06, "loss": 0.4461, "step": 136650 }, { "epoch": 4.81, "learning_rate": 7.039333333333334e-06, "loss": 0.4081, "step": 136700 }, { "epoch": 4.81, "learning_rate": 7.033777777777778e-06, "loss": 0.4578, "step": 136750 }, { "epoch": 4.82, "learning_rate": 7.028222222222223e-06, "loss": 0.4155, "step": 136800 }, { "epoch": 4.82, "learning_rate": 7.022666666666668e-06, "loss": 0.4155, "step": 136850 }, { "epoch": 4.82, "learning_rate": 7.0171111111111115e-06, "loss": 0.3985, "step": 136900 }, { "epoch": 4.82, "learning_rate": 7.011555555555556e-06, "loss": 0.4071, "step": 136950 }, { "epoch": 4.82, "learning_rate": 7.006e-06, "loss": 0.4599, "step": 137000 }, { "epoch": 4.83, "learning_rate": 7.000444444444446e-06, "loss": 0.4074, "step": 137050 }, { "epoch": 4.83, "learning_rate": 6.99488888888889e-06, "loss": 0.4025, "step": 137100 }, { "epoch": 4.83, "learning_rate": 6.9893333333333336e-06, "loss": 0.3951, "step": 137150 }, { "epoch": 4.83, "learning_rate": 6.983777777777778e-06, "loss": 0.4045, "step": 137200 }, { "epoch": 4.83, "learning_rate": 6.978222222222223e-06, "loss": 0.4166, "step": 137250 }, { "epoch": 4.83, "learning_rate": 6.972666666666668e-06, "loss": 0.4622, "step": 137300 }, { "epoch": 4.84, "learning_rate": 6.967111111111111e-06, "loss": 0.405, "step": 137350 }, { "epoch": 4.84, "learning_rate": 6.9615555555555556e-06, "loss": 0.4224, "step": 137400 }, { "epoch": 4.84, "learning_rate": 6.956000000000001e-06, "loss": 0.3908, "step": 137450 }, { "epoch": 4.84, "learning_rate": 6.950444444444445e-06, "loss": 0.4098, "step": 137500 }, { "epoch": 4.84, "eval_loss": 0.2512412369251251, "eval_runtime": 14.7039, "eval_samples_per_second": 96.573, "eval_steps_per_second": 6.053, "eval_wer": 0.18770990287737133, "step": 137500 }, { "epoch": 4.84, "learning_rate": 6.94488888888889e-06, "loss": 0.3996, "step": 137550 }, { "epoch": 4.84, "learning_rate": 6.939333333333333e-06, "loss": 0.4487, "step": 137600 }, { "epoch": 4.85, "learning_rate": 6.9337777777777784e-06, "loss": 0.4216, "step": 137650 }, { "epoch": 4.85, "learning_rate": 6.928222222222223e-06, "loss": 0.4494, "step": 137700 }, { "epoch": 4.85, "learning_rate": 6.922666666666667e-06, "loss": 0.4241, "step": 137750 }, { "epoch": 4.85, "learning_rate": 6.9171111111111125e-06, "loss": 0.4154, "step": 137800 }, { "epoch": 4.85, "learning_rate": 6.911555555555556e-06, "loss": 0.4356, "step": 137850 }, { "epoch": 4.86, "learning_rate": 6.9060000000000005e-06, "loss": 0.4148, "step": 137900 }, { "epoch": 4.86, "learning_rate": 6.900444444444445e-06, "loss": 0.381, "step": 137950 }, { "epoch": 4.86, "learning_rate": 6.89488888888889e-06, "loss": 0.407, "step": 138000 }, { "epoch": 4.86, "learning_rate": 6.889333333333334e-06, "loss": 0.3977, "step": 138050 }, { "epoch": 4.86, "learning_rate": 6.883777777777778e-06, "loss": 0.4305, "step": 138100 }, { "epoch": 4.86, "learning_rate": 6.8782222222222225e-06, "loss": 0.4445, "step": 138150 }, { "epoch": 4.87, "learning_rate": 6.872666666666668e-06, "loss": 0.4055, "step": 138200 }, { "epoch": 4.87, "learning_rate": 6.867111111111112e-06, "loss": 0.4219, "step": 138250 }, { "epoch": 4.87, "learning_rate": 6.861555555555556e-06, "loss": 0.4242, "step": 138300 }, { "epoch": 4.87, "learning_rate": 6.856e-06, "loss": 0.3949, "step": 138350 }, { "epoch": 4.87, "learning_rate": 6.850444444444445e-06, "loss": 0.3962, "step": 138400 }, { "epoch": 4.87, "learning_rate": 6.84488888888889e-06, "loss": 0.4144, "step": 138450 }, { "epoch": 4.88, "learning_rate": 6.839333333333333e-06, "loss": 0.4106, "step": 138500 }, { "epoch": 4.88, "learning_rate": 6.833777777777778e-06, "loss": 0.4126, "step": 138550 }, { "epoch": 4.88, "learning_rate": 6.828222222222223e-06, "loss": 0.4538, "step": 138600 }, { "epoch": 4.88, "learning_rate": 6.822666666666667e-06, "loss": 0.3963, "step": 138650 }, { "epoch": 4.88, "learning_rate": 6.817111111111112e-06, "loss": 0.4173, "step": 138700 }, { "epoch": 4.89, "learning_rate": 6.811555555555555e-06, "loss": 0.4057, "step": 138750 }, { "epoch": 4.89, "learning_rate": 6.8060000000000006e-06, "loss": 0.4144, "step": 138800 }, { "epoch": 4.89, "learning_rate": 6.800444444444445e-06, "loss": 0.3944, "step": 138850 }, { "epoch": 4.89, "learning_rate": 6.794888888888889e-06, "loss": 0.3867, "step": 138900 }, { "epoch": 4.89, "learning_rate": 6.789333333333335e-06, "loss": 0.4364, "step": 138950 }, { "epoch": 4.89, "learning_rate": 6.783777777777778e-06, "loss": 0.4018, "step": 139000 }, { "epoch": 4.9, "learning_rate": 6.778222222222223e-06, "loss": 0.4336, "step": 139050 }, { "epoch": 4.9, "learning_rate": 6.772666666666667e-06, "loss": 0.4008, "step": 139100 }, { "epoch": 4.9, "learning_rate": 6.767111111111112e-06, "loss": 0.3967, "step": 139150 }, { "epoch": 4.9, "learning_rate": 6.761555555555556e-06, "loss": 0.3967, "step": 139200 }, { "epoch": 4.9, "learning_rate": 6.756e-06, "loss": 0.3952, "step": 139250 }, { "epoch": 4.9, "learning_rate": 6.750444444444445e-06, "loss": 0.4424, "step": 139300 }, { "epoch": 4.91, "learning_rate": 6.74488888888889e-06, "loss": 0.3976, "step": 139350 }, { "epoch": 4.91, "learning_rate": 6.739333333333334e-06, "loss": 0.4425, "step": 139400 }, { "epoch": 4.91, "learning_rate": 6.733777777777778e-06, "loss": 0.427, "step": 139450 }, { "epoch": 4.91, "learning_rate": 6.728222222222223e-06, "loss": 0.4003, "step": 139500 }, { "epoch": 4.91, "learning_rate": 6.7226666666666675e-06, "loss": 0.3756, "step": 139550 }, { "epoch": 4.92, "learning_rate": 6.717111111111112e-06, "loss": 0.4194, "step": 139600 }, { "epoch": 4.92, "learning_rate": 6.7115555555555554e-06, "loss": 0.4467, "step": 139650 }, { "epoch": 4.92, "learning_rate": 6.706000000000001e-06, "loss": 0.4036, "step": 139700 }, { "epoch": 4.92, "learning_rate": 6.700444444444445e-06, "loss": 0.4065, "step": 139750 }, { "epoch": 4.92, "learning_rate": 6.6948888888888895e-06, "loss": 0.4246, "step": 139800 }, { "epoch": 4.92, "learning_rate": 6.689333333333335e-06, "loss": 0.4382, "step": 139850 }, { "epoch": 4.93, "learning_rate": 6.683777777777778e-06, "loss": 0.4135, "step": 139900 }, { "epoch": 4.93, "learning_rate": 6.678222222222223e-06, "loss": 0.4553, "step": 139950 }, { "epoch": 4.93, "learning_rate": 6.672666666666667e-06, "loss": 0.3941, "step": 140000 }, { "epoch": 4.93, "eval_loss": 0.25490421056747437, "eval_runtime": 7.0414, "eval_samples_per_second": 201.664, "eval_steps_per_second": 12.639, "eval_wer": 0.18907143505491514, "step": 140000 }, { "epoch": 4.93, "learning_rate": 6.667111111111112e-06, "loss": 0.4064, "step": 140050 }, { "epoch": 4.93, "learning_rate": 6.661555555555556e-06, "loss": 0.4092, "step": 140100 }, { "epoch": 4.93, "learning_rate": 6.656e-06, "loss": 0.419, "step": 140150 }, { "epoch": 4.94, "learning_rate": 6.650444444444445e-06, "loss": 0.4102, "step": 140200 }, { "epoch": 4.94, "learning_rate": 6.64488888888889e-06, "loss": 0.4891, "step": 140250 }, { "epoch": 4.94, "learning_rate": 6.639333333333334e-06, "loss": 0.4411, "step": 140300 }, { "epoch": 4.94, "learning_rate": 6.633777777777778e-06, "loss": 0.418, "step": 140350 }, { "epoch": 4.94, "learning_rate": 6.628222222222222e-06, "loss": 0.4204, "step": 140400 }, { "epoch": 4.95, "learning_rate": 6.622666666666668e-06, "loss": 0.4311, "step": 140450 }, { "epoch": 4.95, "learning_rate": 6.617111111111112e-06, "loss": 0.4481, "step": 140500 }, { "epoch": 4.95, "learning_rate": 6.611555555555556e-06, "loss": 0.426, "step": 140550 }, { "epoch": 4.95, "learning_rate": 6.606e-06, "loss": 0.4269, "step": 140600 }, { "epoch": 4.95, "learning_rate": 6.600444444444445e-06, "loss": 0.419, "step": 140650 }, { "epoch": 4.95, "learning_rate": 6.59488888888889e-06, "loss": 0.4136, "step": 140700 }, { "epoch": 4.96, "learning_rate": 6.589333333333334e-06, "loss": 0.4456, "step": 140750 }, { "epoch": 4.96, "learning_rate": 6.58388888888889e-06, "loss": 0.4261, "step": 140800 }, { "epoch": 4.96, "learning_rate": 6.5783333333333344e-06, "loss": 0.4731, "step": 140850 }, { "epoch": 4.96, "learning_rate": 6.572777777777778e-06, "loss": 0.4151, "step": 140900 }, { "epoch": 4.96, "learning_rate": 6.567222222222222e-06, "loss": 0.4229, "step": 140950 }, { "epoch": 4.96, "learning_rate": 6.561666666666668e-06, "loss": 0.3799, "step": 141000 }, { "epoch": 4.97, "learning_rate": 6.556111111111112e-06, "loss": 0.4387, "step": 141050 }, { "epoch": 4.97, "learning_rate": 6.550555555555556e-06, "loss": 0.4236, "step": 141100 }, { "epoch": 4.97, "learning_rate": 6.545e-06, "loss": 0.4439, "step": 141150 }, { "epoch": 4.97, "learning_rate": 6.539444444444445e-06, "loss": 0.3836, "step": 141200 }, { "epoch": 4.97, "learning_rate": 6.53388888888889e-06, "loss": 0.4317, "step": 141250 }, { "epoch": 4.98, "learning_rate": 6.528333333333334e-06, "loss": 0.409, "step": 141300 }, { "epoch": 4.98, "learning_rate": 6.522777777777778e-06, "loss": 0.4054, "step": 141350 }, { "epoch": 4.98, "learning_rate": 6.517222222222223e-06, "loss": 0.3979, "step": 141400 }, { "epoch": 4.98, "learning_rate": 6.511666666666667e-06, "loss": 0.4034, "step": 141450 }, { "epoch": 4.98, "learning_rate": 6.506111111111112e-06, "loss": 0.4386, "step": 141500 }, { "epoch": 4.98, "learning_rate": 6.500555555555557e-06, "loss": 0.3856, "step": 141550 }, { "epoch": 4.99, "learning_rate": 6.4950000000000005e-06, "loss": 0.5087, "step": 141600 }, { "epoch": 4.99, "learning_rate": 6.489444444444445e-06, "loss": 0.4024, "step": 141650 }, { "epoch": 4.99, "learning_rate": 6.483888888888889e-06, "loss": 0.4464, "step": 141700 }, { "epoch": 4.99, "learning_rate": 6.4783333333333346e-06, "loss": 0.4691, "step": 141750 }, { "epoch": 4.99, "learning_rate": 6.472777777777778e-06, "loss": 0.421, "step": 141800 }, { "epoch": 4.99, "learning_rate": 6.4672222222222225e-06, "loss": 0.4306, "step": 141850 }, { "epoch": 5.0, "learning_rate": 6.461666666666667e-06, "loss": 0.4017, "step": 141900 }, { "epoch": 5.0, "learning_rate": 6.456111111111112e-06, "loss": 0.4217, "step": 141950 }, { "epoch": 5.0, "learning_rate": 6.4505555555555566e-06, "loss": 0.4342, "step": 142000 }, { "epoch": 5.0, "learning_rate": 6.445e-06, "loss": 0.4361, "step": 142050 }, { "epoch": 5.0, "learning_rate": 6.4394444444444445e-06, "loss": 0.404, "step": 142100 }, { "epoch": 5.0, "learning_rate": 6.43388888888889e-06, "loss": 0.4175, "step": 142150 }, { "epoch": 5.01, "learning_rate": 6.428333333333334e-06, "loss": 0.4326, "step": 142200 }, { "epoch": 5.01, "learning_rate": 6.422777777777778e-06, "loss": 0.3891, "step": 142250 }, { "epoch": 5.01, "learning_rate": 6.417222222222222e-06, "loss": 0.3882, "step": 142300 }, { "epoch": 5.01, "learning_rate": 6.411666666666667e-06, "loss": 0.3944, "step": 142350 }, { "epoch": 5.01, "learning_rate": 6.406111111111112e-06, "loss": 0.4341, "step": 142400 }, { "epoch": 5.02, "learning_rate": 6.400555555555556e-06, "loss": 0.407, "step": 142450 }, { "epoch": 5.02, "learning_rate": 6.395e-06, "loss": 0.3917, "step": 142500 }, { "epoch": 5.02, "eval_loss": 0.2544367015361786, "eval_runtime": 28.0429, "eval_samples_per_second": 50.637, "eval_steps_per_second": 3.174, "eval_wer": 0.18634837069982754, "step": 142500 }, { "epoch": 5.02, "learning_rate": 6.389444444444445e-06, "loss": 0.4045, "step": 142550 }, { "epoch": 5.02, "learning_rate": 6.383888888888889e-06, "loss": 0.3953, "step": 142600 }, { "epoch": 5.02, "learning_rate": 6.378333333333334e-06, "loss": 0.417, "step": 142650 }, { "epoch": 5.02, "learning_rate": 6.372777777777779e-06, "loss": 0.411, "step": 142700 }, { "epoch": 5.03, "learning_rate": 6.367222222222223e-06, "loss": 0.4508, "step": 142750 }, { "epoch": 5.03, "learning_rate": 6.361666666666667e-06, "loss": 0.4111, "step": 142800 }, { "epoch": 5.03, "learning_rate": 6.3561111111111114e-06, "loss": 0.416, "step": 142850 }, { "epoch": 5.03, "learning_rate": 6.350555555555557e-06, "loss": 0.4043, "step": 142900 }, { "epoch": 5.03, "learning_rate": 6.345e-06, "loss": 0.4192, "step": 142950 }, { "epoch": 5.03, "learning_rate": 6.339444444444445e-06, "loss": 0.422, "step": 143000 }, { "epoch": 5.04, "learning_rate": 6.333888888888889e-06, "loss": 0.4196, "step": 143050 }, { "epoch": 5.04, "learning_rate": 6.328444444444445e-06, "loss": 0.4181, "step": 143100 }, { "epoch": 5.04, "learning_rate": 6.3228888888888895e-06, "loss": 0.475, "step": 143150 }, { "epoch": 5.04, "learning_rate": 6.317333333333334e-06, "loss": 0.4456, "step": 143200 }, { "epoch": 5.04, "learning_rate": 6.3117777777777774e-06, "loss": 0.3975, "step": 143250 }, { "epoch": 5.05, "learning_rate": 6.306222222222223e-06, "loss": 0.4444, "step": 143300 }, { "epoch": 5.05, "learning_rate": 6.300666666666667e-06, "loss": 0.4084, "step": 143350 }, { "epoch": 5.05, "learning_rate": 6.2951111111111115e-06, "loss": 0.4025, "step": 143400 }, { "epoch": 5.05, "learning_rate": 6.289555555555557e-06, "loss": 0.4305, "step": 143450 }, { "epoch": 5.05, "learning_rate": 6.284e-06, "loss": 0.3901, "step": 143500 }, { "epoch": 5.05, "learning_rate": 6.278444444444445e-06, "loss": 0.4184, "step": 143550 }, { "epoch": 5.06, "learning_rate": 6.272888888888889e-06, "loss": 0.4582, "step": 143600 }, { "epoch": 5.06, "learning_rate": 6.267333333333334e-06, "loss": 0.4246, "step": 143650 }, { "epoch": 5.06, "learning_rate": 6.261777777777779e-06, "loss": 0.4329, "step": 143700 }, { "epoch": 5.06, "learning_rate": 6.256222222222222e-06, "loss": 0.4435, "step": 143750 }, { "epoch": 5.06, "learning_rate": 6.250666666666667e-06, "loss": 0.4002, "step": 143800 }, { "epoch": 5.06, "learning_rate": 6.245111111111112e-06, "loss": 0.4227, "step": 143850 }, { "epoch": 5.07, "learning_rate": 6.239555555555556e-06, "loss": 0.4287, "step": 143900 }, { "epoch": 5.07, "learning_rate": 6.234e-06, "loss": 0.3843, "step": 143950 }, { "epoch": 5.07, "learning_rate": 6.228444444444444e-06, "loss": 0.4394, "step": 144000 }, { "epoch": 5.07, "learning_rate": 6.22288888888889e-06, "loss": 0.4021, "step": 144050 }, { "epoch": 5.07, "learning_rate": 6.217333333333334e-06, "loss": 0.4024, "step": 144100 }, { "epoch": 5.08, "learning_rate": 6.211777777777778e-06, "loss": 0.4578, "step": 144150 }, { "epoch": 5.08, "learning_rate": 6.206222222222222e-06, "loss": 0.3966, "step": 144200 }, { "epoch": 5.08, "learning_rate": 6.200666666666667e-06, "loss": 0.4765, "step": 144250 }, { "epoch": 5.08, "learning_rate": 6.195111111111112e-06, "loss": 0.4187, "step": 144300 }, { "epoch": 5.08, "learning_rate": 6.189555555555556e-06, "loss": 0.396, "step": 144350 }, { "epoch": 5.08, "learning_rate": 6.184e-06, "loss": 0.4493, "step": 144400 }, { "epoch": 5.09, "learning_rate": 6.178444444444445e-06, "loss": 0.4103, "step": 144450 }, { "epoch": 5.09, "learning_rate": 6.172888888888889e-06, "loss": 0.4141, "step": 144500 }, { "epoch": 5.09, "learning_rate": 6.1673333333333345e-06, "loss": 0.5361, "step": 144550 }, { "epoch": 5.09, "learning_rate": 6.161777777777779e-06, "loss": 0.3998, "step": 144600 }, { "epoch": 5.09, "learning_rate": 6.1562222222222224e-06, "loss": 0.3824, "step": 144650 }, { "epoch": 5.09, "learning_rate": 6.150666666666667e-06, "loss": 0.4205, "step": 144700 }, { "epoch": 5.1, "learning_rate": 6.145111111111112e-06, "loss": 0.401, "step": 144750 }, { "epoch": 5.1, "learning_rate": 6.1395555555555565e-06, "loss": 0.4236, "step": 144800 }, { "epoch": 5.1, "learning_rate": 6.134e-06, "loss": 0.4421, "step": 144850 }, { "epoch": 5.1, "learning_rate": 6.1284444444444445e-06, "loss": 0.4303, "step": 144900 }, { "epoch": 5.1, "learning_rate": 6.12288888888889e-06, "loss": 0.3873, "step": 144950 }, { "epoch": 5.11, "learning_rate": 6.117333333333334e-06, "loss": 0.4324, "step": 145000 }, { "epoch": 5.11, "eval_loss": 0.2564394176006317, "eval_runtime": 10.0112, "eval_samples_per_second": 141.841, "eval_steps_per_second": 8.89, "eval_wer": 0.1881637469365526, "step": 145000 }, { "epoch": 5.11, "learning_rate": 6.1117777777777785e-06, "loss": 0.4306, "step": 145050 }, { "epoch": 5.11, "learning_rate": 6.106222222222222e-06, "loss": 0.3917, "step": 145100 }, { "epoch": 5.11, "learning_rate": 6.100666666666667e-06, "loss": 0.4011, "step": 145150 }, { "epoch": 5.11, "learning_rate": 6.0952222222222225e-06, "loss": 0.3994, "step": 145200 }, { "epoch": 5.11, "learning_rate": 6.089777777777778e-06, "loss": 0.3962, "step": 145250 }, { "epoch": 5.12, "learning_rate": 6.084222222222222e-06, "loss": 0.4295, "step": 145300 }, { "epoch": 5.12, "learning_rate": 6.078666666666667e-06, "loss": 0.4001, "step": 145350 }, { "epoch": 5.12, "learning_rate": 6.073111111111112e-06, "loss": 0.3867, "step": 145400 }, { "epoch": 5.12, "learning_rate": 6.067555555555556e-06, "loss": 0.4182, "step": 145450 }, { "epoch": 5.12, "learning_rate": 6.062e-06, "loss": 0.5453, "step": 145500 }, { "epoch": 5.12, "learning_rate": 6.056444444444445e-06, "loss": 0.4221, "step": 145550 }, { "epoch": 5.13, "learning_rate": 6.050888888888889e-06, "loss": 0.4339, "step": 145600 }, { "epoch": 5.13, "learning_rate": 6.045333333333334e-06, "loss": 0.4329, "step": 145650 }, { "epoch": 5.13, "learning_rate": 6.039777777777777e-06, "loss": 0.4385, "step": 145700 }, { "epoch": 5.13, "learning_rate": 6.034222222222223e-06, "loss": 0.4453, "step": 145750 }, { "epoch": 5.13, "learning_rate": 6.028666666666667e-06, "loss": 0.4161, "step": 145800 }, { "epoch": 5.14, "learning_rate": 6.023111111111111e-06, "loss": 0.418, "step": 145850 }, { "epoch": 5.14, "learning_rate": 6.017555555555557e-06, "loss": 0.4124, "step": 145900 }, { "epoch": 5.14, "learning_rate": 6.012e-06, "loss": 0.3987, "step": 145950 }, { "epoch": 5.14, "learning_rate": 6.006444444444445e-06, "loss": 0.4083, "step": 146000 }, { "epoch": 5.14, "learning_rate": 6.000888888888889e-06, "loss": 0.4173, "step": 146050 }, { "epoch": 5.14, "learning_rate": 5.995333333333334e-06, "loss": 0.4171, "step": 146100 }, { "epoch": 5.15, "learning_rate": 5.989777777777779e-06, "loss": 0.3984, "step": 146150 }, { "epoch": 5.15, "learning_rate": 5.984222222222222e-06, "loss": 0.4111, "step": 146200 }, { "epoch": 5.15, "learning_rate": 5.9786666666666675e-06, "loss": 0.4967, "step": 146250 }, { "epoch": 5.15, "learning_rate": 5.973111111111112e-06, "loss": 0.407, "step": 146300 }, { "epoch": 5.15, "learning_rate": 5.967555555555556e-06, "loss": 0.3956, "step": 146350 }, { "epoch": 5.15, "learning_rate": 5.962e-06, "loss": 0.4248, "step": 146400 }, { "epoch": 5.16, "learning_rate": 5.956444444444445e-06, "loss": 0.3893, "step": 146450 }, { "epoch": 5.16, "learning_rate": 5.9508888888888895e-06, "loss": 0.3855, "step": 146500 }, { "epoch": 5.16, "learning_rate": 5.945333333333334e-06, "loss": 0.3996, "step": 146550 }, { "epoch": 5.16, "learning_rate": 5.939777777777779e-06, "loss": 0.4218, "step": 146600 }, { "epoch": 5.16, "learning_rate": 5.934222222222223e-06, "loss": 0.4133, "step": 146650 }, { "epoch": 5.17, "learning_rate": 5.928666666666667e-06, "loss": 0.3936, "step": 146700 }, { "epoch": 5.17, "learning_rate": 5.9231111111111115e-06, "loss": 0.4614, "step": 146750 }, { "epoch": 5.17, "learning_rate": 5.917666666666667e-06, "loss": 0.3952, "step": 146800 }, { "epoch": 5.17, "learning_rate": 5.912111111111112e-06, "loss": 0.4814, "step": 146850 }, { "epoch": 5.17, "learning_rate": 5.906555555555556e-06, "loss": 0.4245, "step": 146900 }, { "epoch": 5.17, "learning_rate": 5.901e-06, "loss": 0.4131, "step": 146950 }, { "epoch": 5.18, "learning_rate": 5.895444444444445e-06, "loss": 0.4067, "step": 147000 }, { "epoch": 5.18, "learning_rate": 5.8898888888888896e-06, "loss": 0.4119, "step": 147050 }, { "epoch": 5.18, "learning_rate": 5.884333333333334e-06, "loss": 0.4137, "step": 147100 }, { "epoch": 5.18, "learning_rate": 5.878777777777779e-06, "loss": 0.4117, "step": 147150 }, { "epoch": 5.18, "learning_rate": 5.873222222222223e-06, "loss": 0.4177, "step": 147200 }, { "epoch": 5.18, "learning_rate": 5.867666666666667e-06, "loss": 0.4273, "step": 147250 }, { "epoch": 5.19, "learning_rate": 5.862111111111112e-06, "loss": 0.3993, "step": 147300 }, { "epoch": 5.19, "learning_rate": 5.856555555555557e-06, "loss": 0.452, "step": 147350 }, { "epoch": 5.19, "learning_rate": 5.851e-06, "loss": 0.407, "step": 147400 }, { "epoch": 5.19, "learning_rate": 5.845444444444445e-06, "loss": 0.4237, "step": 147450 }, { "epoch": 5.19, "learning_rate": 5.839888888888889e-06, "loss": 0.4255, "step": 147500 }, { "epoch": 5.19, "eval_loss": 0.2535807490348816, "eval_runtime": 8.7579, "eval_samples_per_second": 162.139, "eval_steps_per_second": 10.162, "eval_wer": 0.1885268221838976, "step": 147500 }, { "epoch": 5.2, "learning_rate": 5.8343333333333345e-06, "loss": 0.4077, "step": 147550 }, { "epoch": 5.2, "learning_rate": 5.828777777777779e-06, "loss": 0.3912, "step": 147600 }, { "epoch": 5.2, "learning_rate": 5.823222222222222e-06, "loss": 0.423, "step": 147650 }, { "epoch": 5.2, "learning_rate": 5.817666666666667e-06, "loss": 0.4006, "step": 147700 }, { "epoch": 5.2, "learning_rate": 5.812111111111112e-06, "loss": 0.4821, "step": 147750 }, { "epoch": 5.2, "learning_rate": 5.8065555555555565e-06, "loss": 0.4047, "step": 147800 }, { "epoch": 5.21, "learning_rate": 5.801e-06, "loss": 0.3877, "step": 147850 }, { "epoch": 5.21, "learning_rate": 5.7954444444444444e-06, "loss": 0.4203, "step": 147900 }, { "epoch": 5.21, "learning_rate": 5.78988888888889e-06, "loss": 0.3871, "step": 147950 }, { "epoch": 5.21, "learning_rate": 5.784333333333334e-06, "loss": 0.4298, "step": 148000 }, { "epoch": 5.21, "learning_rate": 5.7787777777777785e-06, "loss": 0.4447, "step": 148050 }, { "epoch": 5.21, "learning_rate": 5.773222222222222e-06, "loss": 0.3885, "step": 148100 }, { "epoch": 5.22, "learning_rate": 5.767666666666667e-06, "loss": 0.4136, "step": 148150 }, { "epoch": 5.22, "learning_rate": 5.762111111111112e-06, "loss": 0.4059, "step": 148200 }, { "epoch": 5.22, "learning_rate": 5.756555555555556e-06, "loss": 0.4172, "step": 148250 }, { "epoch": 5.22, "learning_rate": 5.751e-06, "loss": 0.4011, "step": 148300 }, { "epoch": 5.22, "learning_rate": 5.745444444444445e-06, "loss": 0.3978, "step": 148350 }, { "epoch": 5.22, "learning_rate": 5.739888888888889e-06, "loss": 0.5641, "step": 148400 }, { "epoch": 5.23, "learning_rate": 5.734333333333334e-06, "loss": 0.3937, "step": 148450 }, { "epoch": 5.23, "learning_rate": 5.728777777777779e-06, "loss": 0.4271, "step": 148500 }, { "epoch": 5.23, "learning_rate": 5.7232222222222225e-06, "loss": 0.4173, "step": 148550 }, { "epoch": 5.23, "learning_rate": 5.717666666666667e-06, "loss": 0.4055, "step": 148600 }, { "epoch": 5.23, "learning_rate": 5.712111111111111e-06, "loss": 0.4385, "step": 148650 }, { "epoch": 5.24, "learning_rate": 5.706555555555557e-06, "loss": 0.4852, "step": 148700 }, { "epoch": 5.24, "learning_rate": 5.701000000000001e-06, "loss": 0.4301, "step": 148750 }, { "epoch": 5.24, "learning_rate": 5.6954444444444445e-06, "loss": 0.4216, "step": 148800 }, { "epoch": 5.24, "learning_rate": 5.689888888888889e-06, "loss": 0.4111, "step": 148850 }, { "epoch": 5.24, "learning_rate": 5.684333333333334e-06, "loss": 0.397, "step": 148900 }, { "epoch": 5.24, "learning_rate": 5.678777777777779e-06, "loss": 0.42, "step": 148950 }, { "epoch": 5.25, "learning_rate": 5.673222222222222e-06, "loss": 0.4008, "step": 149000 }, { "epoch": 5.25, "learning_rate": 5.6676666666666666e-06, "loss": 0.426, "step": 149050 }, { "epoch": 5.25, "learning_rate": 5.662111111111112e-06, "loss": 0.4027, "step": 149100 }, { "epoch": 5.25, "learning_rate": 5.656555555555556e-06, "loss": 0.4291, "step": 149150 }, { "epoch": 5.25, "learning_rate": 5.651000000000001e-06, "loss": 0.3783, "step": 149200 }, { "epoch": 5.25, "learning_rate": 5.645444444444444e-06, "loss": 0.421, "step": 149250 }, { "epoch": 5.26, "learning_rate": 5.639888888888889e-06, "loss": 0.4142, "step": 149300 }, { "epoch": 5.26, "learning_rate": 5.634333333333334e-06, "loss": 0.4032, "step": 149350 }, { "epoch": 5.26, "learning_rate": 5.628777777777778e-06, "loss": 0.3971, "step": 149400 }, { "epoch": 5.26, "learning_rate": 5.623222222222222e-06, "loss": 0.4428, "step": 149450 }, { "epoch": 5.26, "learning_rate": 5.617666666666667e-06, "loss": 0.425, "step": 149500 }, { "epoch": 5.27, "learning_rate": 5.6121111111111114e-06, "loss": 0.411, "step": 149550 }, { "epoch": 5.27, "learning_rate": 5.606555555555556e-06, "loss": 0.3981, "step": 149600 }, { "epoch": 5.27, "learning_rate": 5.601000000000001e-06, "loss": 0.4307, "step": 149650 }, { "epoch": 5.27, "learning_rate": 5.595444444444445e-06, "loss": 0.3935, "step": 149700 }, { "epoch": 5.27, "learning_rate": 5.589888888888889e-06, "loss": 0.5055, "step": 149750 }, { "epoch": 5.27, "learning_rate": 5.5843333333333335e-06, "loss": 0.4058, "step": 149800 }, { "epoch": 5.28, "learning_rate": 5.578777777777779e-06, "loss": 0.3875, "step": 149850 }, { "epoch": 5.28, "learning_rate": 5.573222222222223e-06, "loss": 0.4668, "step": 149900 }, { "epoch": 5.28, "learning_rate": 5.567666666666667e-06, "loss": 0.4046, "step": 149950 }, { "epoch": 5.28, "learning_rate": 5.562111111111111e-06, "loss": 0.3894, "step": 150000 }, { "epoch": 5.28, "eval_loss": 0.2538159489631653, "eval_runtime": 16.098, "eval_samples_per_second": 88.21, "eval_steps_per_second": 5.529, "eval_wer": 0.18598529545248252, "step": 150000 }, { "epoch": 5.28, "learning_rate": 5.556555555555556e-06, "loss": 0.4164, "step": 150050 }, { "epoch": 5.28, "learning_rate": 5.551000000000001e-06, "loss": 0.4155, "step": 150100 }, { "epoch": 5.29, "learning_rate": 5.545444444444444e-06, "loss": 0.4015, "step": 150150 }, { "epoch": 5.29, "learning_rate": 5.539888888888889e-06, "loss": 0.3845, "step": 150200 }, { "epoch": 5.29, "learning_rate": 5.534333333333334e-06, "loss": 0.401, "step": 150250 }, { "epoch": 5.29, "learning_rate": 5.528777777777778e-06, "loss": 0.4235, "step": 150300 }, { "epoch": 5.29, "learning_rate": 5.523222222222223e-06, "loss": 0.398, "step": 150350 }, { "epoch": 5.3, "learning_rate": 5.517666666666667e-06, "loss": 0.416, "step": 150400 }, { "epoch": 5.3, "learning_rate": 5.5121111111111115e-06, "loss": 0.4649, "step": 150450 }, { "epoch": 5.3, "learning_rate": 5.506555555555556e-06, "loss": 0.4125, "step": 150500 }, { "epoch": 5.3, "learning_rate": 5.501000000000001e-06, "loss": 0.396, "step": 150550 }, { "epoch": 5.3, "learning_rate": 5.495444444444445e-06, "loss": 0.4404, "step": 150600 }, { "epoch": 5.3, "learning_rate": 5.489888888888889e-06, "loss": 0.4351, "step": 150650 }, { "epoch": 5.31, "learning_rate": 5.4843333333333336e-06, "loss": 0.4209, "step": 150700 }, { "epoch": 5.31, "learning_rate": 5.478777777777779e-06, "loss": 0.3951, "step": 150750 }, { "epoch": 5.31, "learning_rate": 5.473222222222223e-06, "loss": 0.396, "step": 150800 }, { "epoch": 5.31, "learning_rate": 5.467777777777778e-06, "loss": 0.5726, "step": 150850 }, { "epoch": 5.31, "learning_rate": 5.462222222222223e-06, "loss": 0.4307, "step": 150900 }, { "epoch": 5.31, "learning_rate": 5.456666666666666e-06, "loss": 0.5352, "step": 150950 }, { "epoch": 5.32, "learning_rate": 5.451111111111112e-06, "loss": 0.5237, "step": 151000 }, { "epoch": 5.32, "learning_rate": 5.445555555555556e-06, "loss": 0.4101, "step": 151050 }, { "epoch": 5.32, "learning_rate": 5.4400000000000004e-06, "loss": 0.4041, "step": 151100 }, { "epoch": 5.32, "learning_rate": 5.434444444444444e-06, "loss": 0.4226, "step": 151150 }, { "epoch": 5.32, "learning_rate": 5.428888888888889e-06, "loss": 0.3869, "step": 151200 }, { "epoch": 5.33, "learning_rate": 5.423333333333334e-06, "loss": 0.4172, "step": 151250 }, { "epoch": 5.33, "learning_rate": 5.417777777777778e-06, "loss": 0.4358, "step": 151300 }, { "epoch": 5.33, "learning_rate": 5.412222222222223e-06, "loss": 0.3955, "step": 151350 }, { "epoch": 5.33, "learning_rate": 5.406666666666667e-06, "loss": 0.4001, "step": 151400 }, { "epoch": 5.33, "learning_rate": 5.401111111111111e-06, "loss": 0.4556, "step": 151450 }, { "epoch": 5.33, "learning_rate": 5.3955555555555565e-06, "loss": 0.4122, "step": 151500 }, { "epoch": 5.34, "learning_rate": 5.390000000000001e-06, "loss": 0.3985, "step": 151550 }, { "epoch": 5.34, "learning_rate": 5.3844444444444445e-06, "loss": 0.4299, "step": 151600 }, { "epoch": 5.34, "learning_rate": 5.378888888888889e-06, "loss": 0.4024, "step": 151650 }, { "epoch": 5.34, "learning_rate": 5.373333333333334e-06, "loss": 0.4186, "step": 151700 }, { "epoch": 5.34, "learning_rate": 5.3677777777777785e-06, "loss": 0.404, "step": 151750 }, { "epoch": 5.34, "learning_rate": 5.362222222222223e-06, "loss": 0.4016, "step": 151800 }, { "epoch": 5.35, "learning_rate": 5.3566666666666665e-06, "loss": 0.3947, "step": 151850 }, { "epoch": 5.35, "learning_rate": 5.351111111111112e-06, "loss": 0.4115, "step": 151900 }, { "epoch": 5.35, "learning_rate": 5.345555555555556e-06, "loss": 0.4368, "step": 151950 }, { "epoch": 5.35, "learning_rate": 5.3400000000000005e-06, "loss": 0.4055, "step": 152000 }, { "epoch": 5.35, "learning_rate": 5.334444444444446e-06, "loss": 0.4334, "step": 152050 }, { "epoch": 5.36, "learning_rate": 5.328888888888889e-06, "loss": 0.4046, "step": 152100 }, { "epoch": 5.36, "learning_rate": 5.323333333333334e-06, "loss": 0.4122, "step": 152150 }, { "epoch": 5.36, "learning_rate": 5.317777777777778e-06, "loss": 0.4166, "step": 152200 }, { "epoch": 5.36, "learning_rate": 5.312222222222223e-06, "loss": 0.3837, "step": 152250 }, { "epoch": 5.36, "learning_rate": 5.306666666666667e-06, "loss": 0.4242, "step": 152300 }, { "epoch": 5.36, "learning_rate": 5.301111111111111e-06, "loss": 0.4341, "step": 152350 }, { "epoch": 5.37, "learning_rate": 5.295555555555556e-06, "loss": 0.3887, "step": 152400 }, { "epoch": 5.37, "learning_rate": 5.290000000000001e-06, "loss": 0.4658, "step": 152450 }, { "epoch": 5.37, "learning_rate": 5.2844444444444454e-06, "loss": 0.4108, "step": 152500 }, { "epoch": 5.37, "eval_loss": 0.2538858652114868, "eval_runtime": 11.3962, "eval_samples_per_second": 124.602, "eval_steps_per_second": 7.81, "eval_wer": 0.18598529545248252, "step": 152500 }, { "epoch": 5.37, "learning_rate": 5.278888888888889e-06, "loss": 0.421, "step": 152550 }, { "epoch": 5.37, "learning_rate": 5.273333333333333e-06, "loss": 0.3979, "step": 152600 }, { "epoch": 5.37, "learning_rate": 5.267777777777779e-06, "loss": 0.3787, "step": 152650 }, { "epoch": 5.38, "learning_rate": 5.262222222222223e-06, "loss": 0.3909, "step": 152700 }, { "epoch": 5.38, "learning_rate": 5.256666666666667e-06, "loss": 0.404, "step": 152750 }, { "epoch": 5.38, "learning_rate": 5.251111111111111e-06, "loss": 0.4016, "step": 152800 }, { "epoch": 5.38, "learning_rate": 5.245555555555556e-06, "loss": 0.3983, "step": 152850 }, { "epoch": 5.38, "learning_rate": 5.240000000000001e-06, "loss": 0.3887, "step": 152900 }, { "epoch": 5.39, "learning_rate": 5.234444444444445e-06, "loss": 0.3979, "step": 152950 }, { "epoch": 5.39, "learning_rate": 5.228888888888889e-06, "loss": 0.4006, "step": 153000 }, { "epoch": 5.39, "learning_rate": 5.223333333333334e-06, "loss": 0.4022, "step": 153050 }, { "epoch": 5.39, "learning_rate": 5.217777777777778e-06, "loss": 0.3897, "step": 153100 }, { "epoch": 5.39, "learning_rate": 5.212222222222223e-06, "loss": 0.3981, "step": 153150 }, { "epoch": 5.39, "learning_rate": 5.206666666666668e-06, "loss": 0.4292, "step": 153200 }, { "epoch": 5.4, "learning_rate": 5.2011111111111115e-06, "loss": 0.385, "step": 153250 }, { "epoch": 5.4, "learning_rate": 5.195555555555556e-06, "loss": 0.4122, "step": 153300 }, { "epoch": 5.4, "learning_rate": 5.19e-06, "loss": 0.3968, "step": 153350 }, { "epoch": 5.4, "learning_rate": 5.1844444444444455e-06, "loss": 0.4011, "step": 153400 }, { "epoch": 5.4, "learning_rate": 5.178888888888889e-06, "loss": 0.4001, "step": 153450 }, { "epoch": 5.4, "learning_rate": 5.1733333333333335e-06, "loss": 0.4342, "step": 153500 }, { "epoch": 5.41, "learning_rate": 5.167777777777778e-06, "loss": 0.4079, "step": 153550 }, { "epoch": 5.41, "learning_rate": 5.162222222222223e-06, "loss": 0.4052, "step": 153600 }, { "epoch": 5.41, "learning_rate": 5.1566666666666676e-06, "loss": 0.6829, "step": 153650 }, { "epoch": 5.41, "learning_rate": 5.151111111111111e-06, "loss": 0.4202, "step": 153700 }, { "epoch": 5.41, "learning_rate": 5.1455555555555555e-06, "loss": 0.4533, "step": 153750 }, { "epoch": 5.42, "learning_rate": 5.140000000000001e-06, "loss": 0.391, "step": 153800 }, { "epoch": 5.42, "learning_rate": 5.134444444444445e-06, "loss": 0.3939, "step": 153850 }, { "epoch": 5.42, "learning_rate": 5.128888888888889e-06, "loss": 0.4052, "step": 153900 }, { "epoch": 5.42, "learning_rate": 5.123333333333333e-06, "loss": 0.4315, "step": 153950 }, { "epoch": 5.42, "learning_rate": 5.117777777777778e-06, "loss": 0.39, "step": 154000 }, { "epoch": 5.42, "learning_rate": 5.112222222222223e-06, "loss": 0.4629, "step": 154050 }, { "epoch": 5.43, "learning_rate": 5.106666666666667e-06, "loss": 0.3944, "step": 154100 }, { "epoch": 5.43, "learning_rate": 5.101111111111111e-06, "loss": 0.4448, "step": 154150 }, { "epoch": 5.43, "learning_rate": 5.095555555555556e-06, "loss": 0.3966, "step": 154200 }, { "epoch": 5.43, "learning_rate": 5.09e-06, "loss": 0.4008, "step": 154250 }, { "epoch": 5.43, "learning_rate": 5.084555555555556e-06, "loss": 0.4228, "step": 154300 }, { "epoch": 5.43, "learning_rate": 5.079000000000001e-06, "loss": 0.3975, "step": 154350 }, { "epoch": 5.44, "learning_rate": 5.073444444444445e-06, "loss": 0.3887, "step": 154400 }, { "epoch": 5.44, "learning_rate": 5.067888888888889e-06, "loss": 0.4182, "step": 154450 }, { "epoch": 5.44, "learning_rate": 5.062333333333333e-06, "loss": 0.4061, "step": 154500 }, { "epoch": 5.44, "learning_rate": 5.0567777777777785e-06, "loss": 0.4139, "step": 154550 }, { "epoch": 5.44, "learning_rate": 5.051222222222223e-06, "loss": 0.4199, "step": 154600 }, { "epoch": 5.45, "learning_rate": 5.045666666666667e-06, "loss": 0.3986, "step": 154650 }, { "epoch": 5.45, "learning_rate": 5.040111111111111e-06, "loss": 0.3866, "step": 154700 }, { "epoch": 5.45, "learning_rate": 5.034555555555556e-06, "loss": 0.4325, "step": 154750 }, { "epoch": 5.45, "learning_rate": 5.0290000000000005e-06, "loss": 0.3803, "step": 154800 }, { "epoch": 5.45, "learning_rate": 5.023444444444445e-06, "loss": 0.3876, "step": 154850 }, { "epoch": 5.45, "learning_rate": 5.0178888888888884e-06, "loss": 0.5047, "step": 154900 }, { "epoch": 5.46, "learning_rate": 5.012333333333334e-06, "loss": 0.3985, "step": 154950 }, { "epoch": 5.46, "learning_rate": 5.006777777777778e-06, "loss": 0.4312, "step": 155000 }, { "epoch": 5.46, "eval_loss": 0.25258883833885193, "eval_runtime": 10.5523, "eval_samples_per_second": 134.567, "eval_steps_per_second": 8.434, "eval_wer": 0.1848960697104475, "step": 155000 }, { "epoch": 5.46, "learning_rate": 5.0012222222222225e-06, "loss": 0.4051, "step": 155050 }, { "epoch": 5.46, "learning_rate": 4.995666666666667e-06, "loss": 0.3959, "step": 155100 }, { "epoch": 5.46, "learning_rate": 4.990111111111111e-06, "loss": 0.3956, "step": 155150 }, { "epoch": 5.46, "learning_rate": 4.984555555555556e-06, "loss": 0.4118, "step": 155200 }, { "epoch": 5.47, "learning_rate": 4.979e-06, "loss": 0.3928, "step": 155250 }, { "epoch": 5.47, "learning_rate": 4.9734444444444445e-06, "loss": 0.4044, "step": 155300 }, { "epoch": 5.47, "learning_rate": 4.967888888888889e-06, "loss": 0.4189, "step": 155350 }, { "epoch": 5.47, "learning_rate": 4.962333333333334e-06, "loss": 0.401, "step": 155400 }, { "epoch": 5.47, "learning_rate": 4.956777777777778e-06, "loss": 0.4379, "step": 155450 }, { "epoch": 5.47, "learning_rate": 4.951222222222223e-06, "loss": 0.4135, "step": 155500 }, { "epoch": 5.48, "learning_rate": 4.945666666666667e-06, "loss": 0.3908, "step": 155550 }, { "epoch": 5.48, "learning_rate": 4.940111111111112e-06, "loss": 0.4324, "step": 155600 }, { "epoch": 5.48, "learning_rate": 4.934555555555556e-06, "loss": 0.4143, "step": 155650 }, { "epoch": 5.48, "learning_rate": 4.929000000000001e-06, "loss": 0.4124, "step": 155700 }, { "epoch": 5.48, "learning_rate": 4.923444444444445e-06, "loss": 0.3639, "step": 155750 }, { "epoch": 5.49, "learning_rate": 4.917888888888889e-06, "loss": 0.4011, "step": 155800 }, { "epoch": 5.49, "learning_rate": 4.912333333333334e-06, "loss": 0.443, "step": 155850 }, { "epoch": 5.49, "learning_rate": 4.906777777777778e-06, "loss": 0.4026, "step": 155900 }, { "epoch": 5.49, "learning_rate": 4.901222222222223e-06, "loss": 0.4124, "step": 155950 }, { "epoch": 5.49, "learning_rate": 4.895666666666667e-06, "loss": 0.4258, "step": 156000 }, { "epoch": 5.49, "learning_rate": 4.890111111111111e-06, "loss": 0.4011, "step": 156050 }, { "epoch": 5.5, "learning_rate": 4.884555555555556e-06, "loss": 0.4144, "step": 156100 }, { "epoch": 5.5, "learning_rate": 4.879e-06, "loss": 0.4382, "step": 156150 }, { "epoch": 5.5, "learning_rate": 4.8734444444444455e-06, "loss": 0.4175, "step": 156200 }, { "epoch": 5.5, "learning_rate": 4.867888888888889e-06, "loss": 0.4263, "step": 156250 }, { "epoch": 5.5, "learning_rate": 4.862333333333334e-06, "loss": 0.41, "step": 156300 }, { "epoch": 5.5, "learning_rate": 4.856777777777778e-06, "loss": 0.42, "step": 156350 }, { "epoch": 5.51, "learning_rate": 4.851222222222223e-06, "loss": 0.4585, "step": 156400 }, { "epoch": 5.51, "learning_rate": 4.845666666666667e-06, "loss": 0.3824, "step": 156450 }, { "epoch": 5.51, "learning_rate": 4.840111111111112e-06, "loss": 0.4098, "step": 156500 }, { "epoch": 5.51, "learning_rate": 4.834555555555556e-06, "loss": 0.3991, "step": 156550 }, { "epoch": 5.51, "learning_rate": 4.829000000000001e-06, "loss": 0.4668, "step": 156600 }, { "epoch": 5.52, "learning_rate": 4.823444444444445e-06, "loss": 0.3932, "step": 156650 }, { "epoch": 5.52, "learning_rate": 4.8178888888888895e-06, "loss": 0.3921, "step": 156700 }, { "epoch": 5.52, "learning_rate": 4.812333333333334e-06, "loss": 0.3694, "step": 156750 }, { "epoch": 5.52, "learning_rate": 4.806777777777778e-06, "loss": 0.3917, "step": 156800 }, { "epoch": 5.52, "learning_rate": 4.801222222222223e-06, "loss": 0.3887, "step": 156850 }, { "epoch": 5.52, "learning_rate": 4.795666666666667e-06, "loss": 0.4251, "step": 156900 }, { "epoch": 5.53, "learning_rate": 4.7901111111111115e-06, "loss": 0.4132, "step": 156950 }, { "epoch": 5.53, "learning_rate": 4.784555555555556e-06, "loss": 0.3887, "step": 157000 }, { "epoch": 5.53, "learning_rate": 4.779e-06, "loss": 0.415, "step": 157050 }, { "epoch": 5.53, "learning_rate": 4.773444444444445e-06, "loss": 0.4037, "step": 157100 }, { "epoch": 5.53, "learning_rate": 4.767888888888889e-06, "loss": 0.4283, "step": 157150 }, { "epoch": 5.53, "learning_rate": 4.7623333333333335e-06, "loss": 0.4067, "step": 157200 }, { "epoch": 5.54, "learning_rate": 4.756777777777778e-06, "loss": 0.388, "step": 157250 }, { "epoch": 5.54, "learning_rate": 4.751222222222222e-06, "loss": 0.4, "step": 157300 }, { "epoch": 5.54, "learning_rate": 4.745666666666668e-06, "loss": 0.4037, "step": 157350 }, { "epoch": 5.54, "learning_rate": 4.740111111111111e-06, "loss": 0.407, "step": 157400 }, { "epoch": 5.54, "learning_rate": 4.734555555555556e-06, "loss": 0.4192, "step": 157450 }, { "epoch": 5.55, "learning_rate": 4.729e-06, "loss": 0.3786, "step": 157500 }, { "epoch": 5.55, "eval_loss": 0.25038447976112366, "eval_runtime": 8.3439, "eval_samples_per_second": 170.183, "eval_steps_per_second": 10.666, "eval_wer": 0.1837160751565762, "step": 157500 }, { "epoch": 5.55, "learning_rate": 4.723555555555556e-06, "loss": 0.3845, "step": 157550 }, { "epoch": 5.55, "learning_rate": 4.718e-06, "loss": 0.3814, "step": 157600 }, { "epoch": 5.55, "learning_rate": 4.712444444444445e-06, "loss": 0.4311, "step": 157650 }, { "epoch": 5.55, "learning_rate": 4.706888888888889e-06, "loss": 0.4062, "step": 157700 }, { "epoch": 5.55, "learning_rate": 4.701333333333334e-06, "loss": 0.4053, "step": 157750 }, { "epoch": 5.56, "learning_rate": 4.695777777777778e-06, "loss": 0.4334, "step": 157800 }, { "epoch": 5.56, "learning_rate": 4.690222222222222e-06, "loss": 0.4158, "step": 157850 }, { "epoch": 5.56, "learning_rate": 4.684666666666667e-06, "loss": 0.3948, "step": 157900 }, { "epoch": 5.56, "learning_rate": 4.679111111111111e-06, "loss": 0.4021, "step": 157950 }, { "epoch": 5.56, "learning_rate": 4.6735555555555565e-06, "loss": 0.4238, "step": 158000 }, { "epoch": 5.56, "learning_rate": 4.668e-06, "loss": 0.4536, "step": 158050 }, { "epoch": 5.57, "learning_rate": 4.662444444444445e-06, "loss": 0.4308, "step": 158100 }, { "epoch": 5.57, "learning_rate": 4.656888888888889e-06, "loss": 0.3932, "step": 158150 }, { "epoch": 5.57, "learning_rate": 4.651333333333334e-06, "loss": 0.3874, "step": 158200 }, { "epoch": 5.57, "learning_rate": 4.645777777777778e-06, "loss": 0.3973, "step": 158250 }, { "epoch": 5.57, "learning_rate": 4.640222222222223e-06, "loss": 0.392, "step": 158300 }, { "epoch": 5.58, "learning_rate": 4.634666666666667e-06, "loss": 0.4107, "step": 158350 }, { "epoch": 5.58, "learning_rate": 4.629111111111112e-06, "loss": 0.4161, "step": 158400 }, { "epoch": 5.58, "learning_rate": 4.623555555555556e-06, "loss": 0.4386, "step": 158450 }, { "epoch": 5.58, "learning_rate": 4.6180000000000005e-06, "loss": 0.3856, "step": 158500 }, { "epoch": 5.58, "learning_rate": 4.612444444444445e-06, "loss": 0.3778, "step": 158550 }, { "epoch": 5.58, "learning_rate": 4.606888888888889e-06, "loss": 0.4445, "step": 158600 }, { "epoch": 5.59, "learning_rate": 4.601333333333334e-06, "loss": 0.428, "step": 158650 }, { "epoch": 5.59, "learning_rate": 4.595777777777778e-06, "loss": 0.4291, "step": 158700 }, { "epoch": 5.59, "learning_rate": 4.5902222222222225e-06, "loss": 0.4649, "step": 158750 }, { "epoch": 5.59, "learning_rate": 4.584666666666667e-06, "loss": 0.4152, "step": 158800 }, { "epoch": 5.59, "learning_rate": 4.579111111111111e-06, "loss": 0.4089, "step": 158850 }, { "epoch": 5.59, "learning_rate": 4.573555555555556e-06, "loss": 0.426, "step": 158900 }, { "epoch": 5.6, "learning_rate": 4.568e-06, "loss": 0.3924, "step": 158950 }, { "epoch": 5.6, "learning_rate": 4.5624444444444445e-06, "loss": 0.5319, "step": 159000 }, { "epoch": 5.6, "learning_rate": 4.556888888888889e-06, "loss": 0.449, "step": 159050 }, { "epoch": 5.6, "learning_rate": 4.551333333333333e-06, "loss": 0.4105, "step": 159100 }, { "epoch": 5.6, "learning_rate": 4.545777777777779e-06, "loss": 0.4141, "step": 159150 }, { "epoch": 5.61, "learning_rate": 4.540222222222222e-06, "loss": 0.4259, "step": 159200 }, { "epoch": 5.61, "learning_rate": 4.534666666666667e-06, "loss": 0.3698, "step": 159250 }, { "epoch": 5.61, "learning_rate": 4.529111111111111e-06, "loss": 0.4344, "step": 159300 }, { "epoch": 5.61, "learning_rate": 4.523555555555556e-06, "loss": 0.386, "step": 159350 }, { "epoch": 5.61, "learning_rate": 4.518e-06, "loss": 0.4253, "step": 159400 }, { "epoch": 5.61, "learning_rate": 4.512444444444445e-06, "loss": 0.4126, "step": 159450 }, { "epoch": 5.62, "learning_rate": 4.5068888888888894e-06, "loss": 0.4159, "step": 159500 }, { "epoch": 5.62, "learning_rate": 4.501333333333334e-06, "loss": 0.3995, "step": 159550 }, { "epoch": 5.62, "learning_rate": 4.495777777777778e-06, "loss": 0.3948, "step": 159600 }, { "epoch": 5.62, "learning_rate": 4.490222222222223e-06, "loss": 0.3936, "step": 159650 }, { "epoch": 5.62, "learning_rate": 4.484666666666667e-06, "loss": 0.3933, "step": 159700 }, { "epoch": 5.62, "learning_rate": 4.4791111111111114e-06, "loss": 0.3927, "step": 159750 }, { "epoch": 5.63, "learning_rate": 4.473555555555556e-06, "loss": 0.441, "step": 159800 }, { "epoch": 5.63, "learning_rate": 4.468e-06, "loss": 0.396, "step": 159850 }, { "epoch": 5.63, "learning_rate": 4.462444444444445e-06, "loss": 0.4239, "step": 159900 }, { "epoch": 5.63, "learning_rate": 4.45688888888889e-06, "loss": 0.4084, "step": 159950 }, { "epoch": 5.63, "learning_rate": 4.4513333333333335e-06, "loss": 0.4033, "step": 160000 }, { "epoch": 5.63, "eval_loss": 0.2515707015991211, "eval_runtime": 8.4329, "eval_samples_per_second": 168.388, "eval_steps_per_second": 10.554, "eval_wer": 0.18516837614595624, "step": 160000 }, { "epoch": 5.64, "learning_rate": 4.445777777777779e-06, "loss": 0.397, "step": 160050 }, { "epoch": 5.64, "learning_rate": 4.440222222222222e-06, "loss": 0.3982, "step": 160100 }, { "epoch": 5.64, "learning_rate": 4.4346666666666675e-06, "loss": 0.4066, "step": 160150 }, { "epoch": 5.64, "learning_rate": 4.429111111111111e-06, "loss": 0.4165, "step": 160200 }, { "epoch": 5.64, "learning_rate": 4.423555555555556e-06, "loss": 0.4243, "step": 160250 }, { "epoch": 5.64, "learning_rate": 4.418000000000001e-06, "loss": 0.403, "step": 160300 }, { "epoch": 5.65, "learning_rate": 4.412444444444445e-06, "loss": 0.5007, "step": 160350 }, { "epoch": 5.65, "learning_rate": 4.4068888888888895e-06, "loss": 0.391, "step": 160400 }, { "epoch": 5.65, "learning_rate": 4.401333333333334e-06, "loss": 0.3941, "step": 160450 }, { "epoch": 5.65, "learning_rate": 4.395777777777778e-06, "loss": 0.3998, "step": 160500 }, { "epoch": 5.65, "learning_rate": 4.390222222222223e-06, "loss": 0.4516, "step": 160550 }, { "epoch": 5.65, "learning_rate": 4.384666666666667e-06, "loss": 0.4164, "step": 160600 }, { "epoch": 5.66, "learning_rate": 4.3791111111111116e-06, "loss": 0.3815, "step": 160650 }, { "epoch": 5.66, "learning_rate": 4.373555555555556e-06, "loss": 0.3863, "step": 160700 }, { "epoch": 5.66, "learning_rate": 4.368e-06, "loss": 0.3992, "step": 160750 }, { "epoch": 5.66, "learning_rate": 4.362444444444445e-06, "loss": 0.4241, "step": 160800 }, { "epoch": 5.66, "learning_rate": 4.356888888888889e-06, "loss": 0.3973, "step": 160850 }, { "epoch": 5.67, "learning_rate": 4.3513333333333336e-06, "loss": 0.4397, "step": 160900 }, { "epoch": 5.67, "learning_rate": 4.345777777777778e-06, "loss": 0.3916, "step": 160950 }, { "epoch": 5.67, "learning_rate": 4.340222222222222e-06, "loss": 0.424, "step": 161000 }, { "epoch": 5.67, "learning_rate": 4.334777777777778e-06, "loss": 0.4579, "step": 161050 }, { "epoch": 5.67, "learning_rate": 4.329222222222223e-06, "loss": 0.3861, "step": 161100 }, { "epoch": 5.67, "learning_rate": 4.323666666666667e-06, "loss": 0.4166, "step": 161150 }, { "epoch": 5.68, "learning_rate": 4.318111111111112e-06, "loss": 0.4211, "step": 161200 }, { "epoch": 5.68, "learning_rate": 4.312555555555556e-06, "loss": 0.399, "step": 161250 }, { "epoch": 5.68, "learning_rate": 4.3070000000000004e-06, "loss": 0.4193, "step": 161300 }, { "epoch": 5.68, "learning_rate": 4.301444444444445e-06, "loss": 0.4205, "step": 161350 }, { "epoch": 5.68, "learning_rate": 4.295888888888889e-06, "loss": 0.4067, "step": 161400 }, { "epoch": 5.68, "learning_rate": 4.290333333333334e-06, "loss": 0.4071, "step": 161450 }, { "epoch": 5.69, "learning_rate": 4.284777777777778e-06, "loss": 0.4013, "step": 161500 }, { "epoch": 5.69, "learning_rate": 4.2792222222222225e-06, "loss": 0.4606, "step": 161550 }, { "epoch": 5.69, "learning_rate": 4.273666666666667e-06, "loss": 0.3916, "step": 161600 }, { "epoch": 5.69, "learning_rate": 4.268111111111111e-06, "loss": 0.4008, "step": 161650 }, { "epoch": 5.69, "learning_rate": 4.262555555555556e-06, "loss": 0.444, "step": 161700 }, { "epoch": 5.7, "learning_rate": 4.257000000000001e-06, "loss": 0.3839, "step": 161750 }, { "epoch": 5.7, "learning_rate": 4.2514444444444445e-06, "loss": 0.4074, "step": 161800 }, { "epoch": 5.7, "learning_rate": 4.24588888888889e-06, "loss": 0.4197, "step": 161850 }, { "epoch": 5.7, "learning_rate": 4.240333333333333e-06, "loss": 0.3965, "step": 161900 }, { "epoch": 5.7, "learning_rate": 4.2347777777777785e-06, "loss": 0.3855, "step": 161950 }, { "epoch": 5.7, "learning_rate": 4.229222222222222e-06, "loss": 0.3911, "step": 162000 }, { "epoch": 5.71, "learning_rate": 4.223666666666667e-06, "loss": 0.4988, "step": 162050 }, { "epoch": 5.71, "learning_rate": 4.218111111111112e-06, "loss": 0.4059, "step": 162100 }, { "epoch": 5.71, "learning_rate": 4.212555555555556e-06, "loss": 0.42, "step": 162150 }, { "epoch": 5.71, "learning_rate": 4.2070000000000005e-06, "loss": 0.3697, "step": 162200 }, { "epoch": 5.71, "learning_rate": 4.201444444444445e-06, "loss": 0.4188, "step": 162250 }, { "epoch": 5.71, "learning_rate": 4.195888888888889e-06, "loss": 0.4313, "step": 162300 }, { "epoch": 5.72, "learning_rate": 4.190333333333334e-06, "loss": 0.4532, "step": 162350 }, { "epoch": 5.72, "learning_rate": 4.184777777777778e-06, "loss": 0.4021, "step": 162400 }, { "epoch": 5.72, "learning_rate": 4.1792222222222226e-06, "loss": 0.4849, "step": 162450 }, { "epoch": 5.72, "learning_rate": 4.173666666666667e-06, "loss": 0.3973, "step": 162500 }, { "epoch": 5.72, "eval_loss": 0.2569618225097656, "eval_runtime": 8.6385, "eval_samples_per_second": 164.381, "eval_steps_per_second": 10.303, "eval_wer": 0.1869837523826813, "step": 162500 }, { "epoch": 5.72, "learning_rate": 4.168111111111111e-06, "loss": 0.4164, "step": 162550 }, { "epoch": 5.72, "learning_rate": 4.162555555555556e-06, "loss": 0.4414, "step": 162600 }, { "epoch": 5.73, "learning_rate": 4.157e-06, "loss": 0.4385, "step": 162650 }, { "epoch": 5.73, "learning_rate": 4.151444444444445e-06, "loss": 0.3953, "step": 162700 }, { "epoch": 5.73, "learning_rate": 4.145888888888889e-06, "loss": 0.4262, "step": 162750 }, { "epoch": 5.73, "learning_rate": 4.140333333333333e-06, "loss": 0.5113, "step": 162800 }, { "epoch": 5.73, "learning_rate": 4.134777777777778e-06, "loss": 0.5719, "step": 162850 }, { "epoch": 5.74, "learning_rate": 4.129222222222223e-06, "loss": 0.4229, "step": 162900 }, { "epoch": 5.74, "learning_rate": 4.123666666666667e-06, "loss": 0.3871, "step": 162950 }, { "epoch": 5.74, "learning_rate": 4.118111111111112e-06, "loss": 0.4302, "step": 163000 }, { "epoch": 5.74, "learning_rate": 4.112555555555555e-06, "loss": 0.384, "step": 163050 }, { "epoch": 5.74, "learning_rate": 4.107000000000001e-06, "loss": 0.4076, "step": 163100 }, { "epoch": 5.74, "learning_rate": 4.101444444444444e-06, "loss": 0.4059, "step": 163150 }, { "epoch": 5.75, "learning_rate": 4.096e-06, "loss": 0.3943, "step": 163200 }, { "epoch": 5.75, "learning_rate": 4.090444444444445e-06, "loss": 0.392, "step": 163250 }, { "epoch": 5.75, "learning_rate": 4.084888888888889e-06, "loss": 0.3827, "step": 163300 }, { "epoch": 5.75, "learning_rate": 4.0793333333333335e-06, "loss": 0.3786, "step": 163350 }, { "epoch": 5.75, "learning_rate": 4.073777777777778e-06, "loss": 0.4217, "step": 163400 }, { "epoch": 5.75, "learning_rate": 4.068222222222222e-06, "loss": 0.4307, "step": 163450 }, { "epoch": 5.76, "learning_rate": 4.062666666666667e-06, "loss": 0.3679, "step": 163500 }, { "epoch": 5.76, "learning_rate": 4.057111111111112e-06, "loss": 0.4032, "step": 163550 }, { "epoch": 5.76, "learning_rate": 4.0515555555555555e-06, "loss": 0.3964, "step": 163600 }, { "epoch": 5.76, "learning_rate": 4.046000000000001e-06, "loss": 0.4458, "step": 163650 }, { "epoch": 5.76, "learning_rate": 4.040444444444444e-06, "loss": 0.4194, "step": 163700 }, { "epoch": 5.77, "learning_rate": 4.0348888888888895e-06, "loss": 0.3944, "step": 163750 }, { "epoch": 5.77, "learning_rate": 4.029333333333333e-06, "loss": 0.3858, "step": 163800 }, { "epoch": 5.77, "learning_rate": 4.023777777777778e-06, "loss": 0.3908, "step": 163850 }, { "epoch": 5.77, "learning_rate": 4.018222222222223e-06, "loss": 0.377, "step": 163900 }, { "epoch": 5.77, "learning_rate": 4.012666666666667e-06, "loss": 0.42, "step": 163950 }, { "epoch": 5.77, "learning_rate": 4.0071111111111116e-06, "loss": 0.3969, "step": 164000 }, { "epoch": 5.78, "learning_rate": 4.001555555555556e-06, "loss": 0.41, "step": 164050 }, { "epoch": 5.78, "learning_rate": 3.996e-06, "loss": 0.4111, "step": 164100 }, { "epoch": 5.78, "learning_rate": 3.990444444444445e-06, "loss": 0.4041, "step": 164150 }, { "epoch": 5.78, "learning_rate": 3.984888888888889e-06, "loss": 0.3975, "step": 164200 }, { "epoch": 5.78, "learning_rate": 3.9793333333333336e-06, "loss": 0.4018, "step": 164250 }, { "epoch": 5.78, "learning_rate": 3.973777777777778e-06, "loss": 0.3957, "step": 164300 }, { "epoch": 5.79, "learning_rate": 3.968222222222222e-06, "loss": 0.4239, "step": 164350 }, { "epoch": 5.79, "learning_rate": 3.962666666666667e-06, "loss": 0.419, "step": 164400 }, { "epoch": 5.79, "learning_rate": 3.957111111111111e-06, "loss": 0.4122, "step": 164450 }, { "epoch": 5.79, "learning_rate": 3.951555555555556e-06, "loss": 0.3994, "step": 164500 }, { "epoch": 5.79, "learning_rate": 3.946e-06, "loss": 0.4028, "step": 164550 }, { "epoch": 5.8, "learning_rate": 3.940444444444444e-06, "loss": 0.3833, "step": 164600 }, { "epoch": 5.8, "learning_rate": 3.934888888888889e-06, "loss": 0.4133, "step": 164650 }, { "epoch": 5.8, "learning_rate": 3.929333333333334e-06, "loss": 0.4199, "step": 164700 }, { "epoch": 5.8, "learning_rate": 3.923777777777778e-06, "loss": 0.3909, "step": 164750 }, { "epoch": 5.8, "learning_rate": 3.918222222222223e-06, "loss": 0.438, "step": 164800 }, { "epoch": 5.8, "learning_rate": 3.912666666666666e-06, "loss": 0.4173, "step": 164850 }, { "epoch": 5.81, "learning_rate": 3.907111111111112e-06, "loss": 0.3935, "step": 164900 }, { "epoch": 5.81, "learning_rate": 3.901555555555556e-06, "loss": 0.4045, "step": 164950 }, { "epoch": 5.81, "learning_rate": 3.8960000000000005e-06, "loss": 0.3994, "step": 165000 }, { "epoch": 5.81, "eval_loss": 0.24991491436958313, "eval_runtime": 6.8648, "eval_samples_per_second": 206.854, "eval_steps_per_second": 12.965, "eval_wer": 0.18462376327493873, "step": 165000 }, { "epoch": 5.81, "learning_rate": 3.890444444444445e-06, "loss": 0.4364, "step": 165050 }, { "epoch": 5.81, "learning_rate": 3.884888888888889e-06, "loss": 0.3816, "step": 165100 }, { "epoch": 5.81, "learning_rate": 3.879333333333334e-06, "loss": 0.3942, "step": 165150 }, { "epoch": 5.82, "learning_rate": 3.873777777777778e-06, "loss": 0.3784, "step": 165200 }, { "epoch": 5.82, "learning_rate": 3.8682222222222225e-06, "loss": 0.3708, "step": 165250 }, { "epoch": 5.82, "learning_rate": 3.862666666666667e-06, "loss": 0.3918, "step": 165300 }, { "epoch": 5.82, "learning_rate": 3.857111111111111e-06, "loss": 0.4379, "step": 165350 }, { "epoch": 5.82, "learning_rate": 3.851555555555556e-06, "loss": 0.4001, "step": 165400 }, { "epoch": 5.83, "learning_rate": 3.846e-06, "loss": 0.3812, "step": 165450 }, { "epoch": 5.83, "learning_rate": 3.840444444444445e-06, "loss": 0.38, "step": 165500 }, { "epoch": 5.83, "learning_rate": 3.834888888888889e-06, "loss": 0.3945, "step": 165550 }, { "epoch": 5.83, "learning_rate": 3.829333333333334e-06, "loss": 0.3814, "step": 165600 }, { "epoch": 5.83, "learning_rate": 3.823777777777778e-06, "loss": 0.4033, "step": 165650 }, { "epoch": 5.83, "learning_rate": 3.818222222222223e-06, "loss": 0.3954, "step": 165700 }, { "epoch": 5.84, "learning_rate": 3.8126666666666665e-06, "loss": 0.3962, "step": 165750 }, { "epoch": 5.84, "learning_rate": 3.8071111111111114e-06, "loss": 0.404, "step": 165800 }, { "epoch": 5.84, "learning_rate": 3.801555555555556e-06, "loss": 0.3753, "step": 165850 }, { "epoch": 5.84, "learning_rate": 3.796e-06, "loss": 0.4155, "step": 165900 }, { "epoch": 5.84, "learning_rate": 3.790444444444445e-06, "loss": 0.3947, "step": 165950 }, { "epoch": 5.84, "learning_rate": 3.785e-06, "loss": 0.4453, "step": 166000 }, { "epoch": 5.85, "learning_rate": 3.779444444444445e-06, "loss": 0.3914, "step": 166050 }, { "epoch": 5.85, "learning_rate": 3.773888888888889e-06, "loss": 0.4422, "step": 166100 }, { "epoch": 5.85, "learning_rate": 3.768333333333334e-06, "loss": 0.3996, "step": 166150 }, { "epoch": 5.85, "learning_rate": 3.762777777777778e-06, "loss": 0.3944, "step": 166200 }, { "epoch": 5.85, "learning_rate": 3.7572222222222226e-06, "loss": 0.3938, "step": 166250 }, { "epoch": 5.86, "learning_rate": 3.7516666666666666e-06, "loss": 0.4158, "step": 166300 }, { "epoch": 5.86, "learning_rate": 3.7461111111111114e-06, "loss": 0.441, "step": 166350 }, { "epoch": 5.86, "learning_rate": 3.7405555555555554e-06, "loss": 0.4113, "step": 166400 }, { "epoch": 5.86, "learning_rate": 3.7350000000000002e-06, "loss": 0.4162, "step": 166450 }, { "epoch": 5.86, "learning_rate": 3.729444444444445e-06, "loss": 0.4113, "step": 166500 }, { "epoch": 5.86, "learning_rate": 3.723888888888889e-06, "loss": 0.4051, "step": 166550 }, { "epoch": 5.87, "learning_rate": 3.718333333333334e-06, "loss": 0.4638, "step": 166600 }, { "epoch": 5.87, "learning_rate": 3.712777777777778e-06, "loss": 0.4171, "step": 166650 }, { "epoch": 5.87, "learning_rate": 3.7072222222222227e-06, "loss": 0.3854, "step": 166700 }, { "epoch": 5.87, "learning_rate": 3.7016666666666667e-06, "loss": 0.598, "step": 166750 }, { "epoch": 5.87, "learning_rate": 3.6962222222222227e-06, "loss": 0.5155, "step": 166800 }, { "epoch": 5.87, "learning_rate": 3.6906666666666667e-06, "loss": 0.3876, "step": 166850 }, { "epoch": 5.88, "learning_rate": 3.6851111111111115e-06, "loss": 0.4293, "step": 166900 }, { "epoch": 5.88, "learning_rate": 3.6795555555555555e-06, "loss": 0.4007, "step": 166950 }, { "epoch": 5.88, "learning_rate": 3.6740000000000003e-06, "loss": 0.3977, "step": 167000 }, { "epoch": 5.88, "learning_rate": 3.6684444444444443e-06, "loss": 0.3714, "step": 167050 }, { "epoch": 5.88, "learning_rate": 3.662888888888889e-06, "loss": 0.414, "step": 167100 }, { "epoch": 5.89, "learning_rate": 3.657333333333334e-06, "loss": 0.4018, "step": 167150 }, { "epoch": 5.89, "learning_rate": 3.651777777777778e-06, "loss": 0.4062, "step": 167200 }, { "epoch": 5.89, "learning_rate": 3.6462222222222228e-06, "loss": 0.434, "step": 167250 }, { "epoch": 5.89, "learning_rate": 3.6406666666666667e-06, "loss": 0.3857, "step": 167300 }, { "epoch": 5.89, "learning_rate": 3.6351111111111116e-06, "loss": 0.4899, "step": 167350 }, { "epoch": 5.89, "learning_rate": 3.6295555555555555e-06, "loss": 0.4109, "step": 167400 }, { "epoch": 5.9, "learning_rate": 3.6240000000000004e-06, "loss": 0.4527, "step": 167450 }, { "epoch": 5.9, "learning_rate": 3.6184444444444448e-06, "loss": 0.4183, "step": 167500 }, { "epoch": 5.9, "eval_loss": 0.24885150790214539, "eval_runtime": 7.3566, "eval_samples_per_second": 193.025, "eval_steps_per_second": 12.098, "eval_wer": 0.1835345375329037, "step": 167500 }, { "epoch": 5.9, "learning_rate": 3.612888888888889e-06, "loss": 0.4257, "step": 167550 }, { "epoch": 5.9, "learning_rate": 3.607333333333334e-06, "loss": 0.4054, "step": 167600 }, { "epoch": 5.9, "learning_rate": 3.601777777777778e-06, "loss": 0.3837, "step": 167650 }, { "epoch": 5.9, "learning_rate": 3.596222222222223e-06, "loss": 0.4104, "step": 167700 }, { "epoch": 5.91, "learning_rate": 3.590666666666667e-06, "loss": 0.39, "step": 167750 }, { "epoch": 5.91, "learning_rate": 3.5851111111111116e-06, "loss": 0.3846, "step": 167800 }, { "epoch": 5.91, "learning_rate": 3.579555555555556e-06, "loss": 0.3851, "step": 167850 }, { "epoch": 5.91, "learning_rate": 3.5740000000000004e-06, "loss": 0.401, "step": 167900 }, { "epoch": 5.91, "learning_rate": 3.568444444444445e-06, "loss": 0.3758, "step": 167950 }, { "epoch": 5.92, "learning_rate": 3.5628888888888892e-06, "loss": 0.4459, "step": 168000 }, { "epoch": 5.92, "learning_rate": 3.5573333333333336e-06, "loss": 0.4034, "step": 168050 }, { "epoch": 5.92, "learning_rate": 3.551777777777778e-06, "loss": 0.4013, "step": 168100 }, { "epoch": 5.92, "learning_rate": 3.5462222222222224e-06, "loss": 0.4027, "step": 168150 }, { "epoch": 5.92, "learning_rate": 3.540666666666667e-06, "loss": 0.3965, "step": 168200 }, { "epoch": 5.92, "learning_rate": 3.5351111111111112e-06, "loss": 0.3793, "step": 168250 }, { "epoch": 5.93, "learning_rate": 3.529555555555556e-06, "loss": 0.3913, "step": 168300 }, { "epoch": 5.93, "learning_rate": 3.524e-06, "loss": 0.4175, "step": 168350 }, { "epoch": 5.93, "learning_rate": 3.518444444444445e-06, "loss": 0.4085, "step": 168400 }, { "epoch": 5.93, "learning_rate": 3.512888888888889e-06, "loss": 0.4064, "step": 168450 }, { "epoch": 5.93, "learning_rate": 3.5073333333333337e-06, "loss": 0.4085, "step": 168500 }, { "epoch": 5.93, "learning_rate": 3.5017777777777777e-06, "loss": 0.3869, "step": 168550 }, { "epoch": 5.94, "learning_rate": 3.4962222222222225e-06, "loss": 0.4533, "step": 168600 }, { "epoch": 5.94, "learning_rate": 3.4906666666666673e-06, "loss": 0.396, "step": 168650 }, { "epoch": 5.94, "learning_rate": 3.4851111111111113e-06, "loss": 0.3862, "step": 168700 }, { "epoch": 5.94, "learning_rate": 3.479555555555556e-06, "loss": 0.4053, "step": 168750 }, { "epoch": 5.94, "learning_rate": 3.474e-06, "loss": 0.3872, "step": 168800 }, { "epoch": 5.95, "learning_rate": 3.468444444444445e-06, "loss": 0.3753, "step": 168850 }, { "epoch": 5.95, "learning_rate": 3.462888888888889e-06, "loss": 0.4234, "step": 168900 }, { "epoch": 5.95, "learning_rate": 3.4573333333333337e-06, "loss": 0.3991, "step": 168950 }, { "epoch": 5.95, "learning_rate": 3.4517777777777777e-06, "loss": 0.4237, "step": 169000 }, { "epoch": 5.95, "learning_rate": 3.4462222222222226e-06, "loss": 0.4007, "step": 169050 }, { "epoch": 5.95, "learning_rate": 3.440666666666667e-06, "loss": 0.3923, "step": 169100 }, { "epoch": 5.96, "learning_rate": 3.4351111111111114e-06, "loss": 0.4003, "step": 169150 }, { "epoch": 5.96, "learning_rate": 3.4295555555555558e-06, "loss": 0.399, "step": 169200 }, { "epoch": 5.96, "learning_rate": 3.424e-06, "loss": 0.4032, "step": 169250 }, { "epoch": 5.96, "learning_rate": 3.418444444444445e-06, "loss": 0.3715, "step": 169300 }, { "epoch": 5.96, "learning_rate": 3.412888888888889e-06, "loss": 0.3813, "step": 169350 }, { "epoch": 5.96, "learning_rate": 3.407333333333334e-06, "loss": 0.4208, "step": 169400 }, { "epoch": 5.97, "learning_rate": 3.401777777777778e-06, "loss": 0.3924, "step": 169450 }, { "epoch": 5.97, "learning_rate": 3.3962222222222226e-06, "loss": 0.3813, "step": 169500 }, { "epoch": 5.97, "learning_rate": 3.390666666666667e-06, "loss": 0.4045, "step": 169550 }, { "epoch": 5.97, "learning_rate": 3.3851111111111114e-06, "loss": 0.4034, "step": 169600 }, { "epoch": 5.97, "learning_rate": 3.379555555555556e-06, "loss": 0.4194, "step": 169650 }, { "epoch": 5.97, "learning_rate": 3.3740000000000002e-06, "loss": 0.4067, "step": 169700 }, { "epoch": 5.98, "learning_rate": 3.3684444444444446e-06, "loss": 0.3869, "step": 169750 }, { "epoch": 5.98, "learning_rate": 3.3628888888888895e-06, "loss": 0.4381, "step": 169800 }, { "epoch": 5.98, "learning_rate": 3.3573333333333334e-06, "loss": 0.4135, "step": 169850 }, { "epoch": 5.98, "learning_rate": 3.3517777777777783e-06, "loss": 0.3853, "step": 169900 }, { "epoch": 5.98, "learning_rate": 3.3462222222222222e-06, "loss": 0.5047, "step": 169950 }, { "epoch": 5.99, "learning_rate": 3.340666666666667e-06, "loss": 0.3826, "step": 170000 }, { "epoch": 5.99, "eval_loss": 0.2467884123325348, "eval_runtime": 7.6202, "eval_samples_per_second": 186.346, "eval_steps_per_second": 11.679, "eval_wer": 0.184714532086775, "step": 170000 }, { "epoch": 5.99, "learning_rate": 3.335111111111111e-06, "loss": 0.4102, "step": 170050 }, { "epoch": 5.99, "learning_rate": 3.329555555555556e-06, "loss": 0.4393, "step": 170100 }, { "epoch": 5.99, "learning_rate": 3.324e-06, "loss": 0.5222, "step": 170150 }, { "epoch": 5.99, "learning_rate": 3.3184444444444447e-06, "loss": 0.3969, "step": 170200 }, { "epoch": 5.99, "learning_rate": 3.3128888888888895e-06, "loss": 0.427, "step": 170250 }, { "epoch": 6.0, "learning_rate": 3.3073333333333335e-06, "loss": 0.416, "step": 170300 }, { "epoch": 6.0, "learning_rate": 3.3017777777777783e-06, "loss": 0.3845, "step": 170350 }, { "epoch": 6.0, "learning_rate": 3.2962222222222223e-06, "loss": 0.4042, "step": 170400 }, { "epoch": 6.0, "learning_rate": 3.290666666666667e-06, "loss": 0.3815, "step": 170450 }, { "epoch": 6.0, "learning_rate": 3.285111111111111e-06, "loss": 0.4156, "step": 170500 }, { "epoch": 6.0, "learning_rate": 3.279555555555556e-06, "loss": 0.38, "step": 170550 }, { "epoch": 6.01, "learning_rate": 3.2740000000000003e-06, "loss": 0.4082, "step": 170600 }, { "epoch": 6.01, "learning_rate": 3.2684444444444447e-06, "loss": 0.4086, "step": 170650 }, { "epoch": 6.01, "learning_rate": 3.262888888888889e-06, "loss": 0.4064, "step": 170700 }, { "epoch": 6.01, "learning_rate": 3.2573333333333335e-06, "loss": 0.3819, "step": 170750 }, { "epoch": 6.01, "learning_rate": 3.251777777777778e-06, "loss": 0.3734, "step": 170800 }, { "epoch": 6.02, "learning_rate": 3.2462222222222224e-06, "loss": 0.3849, "step": 170850 }, { "epoch": 6.02, "learning_rate": 3.2406666666666668e-06, "loss": 0.3958, "step": 170900 }, { "epoch": 6.02, "learning_rate": 3.2351111111111116e-06, "loss": 0.399, "step": 170950 }, { "epoch": 6.02, "learning_rate": 3.229555555555556e-06, "loss": 0.4089, "step": 171000 }, { "epoch": 6.02, "learning_rate": 3.2240000000000004e-06, "loss": 0.3961, "step": 171050 }, { "epoch": 6.02, "learning_rate": 3.218444444444445e-06, "loss": 0.3875, "step": 171100 }, { "epoch": 6.03, "learning_rate": 3.212888888888889e-06, "loss": 0.4018, "step": 171150 }, { "epoch": 6.03, "learning_rate": 3.2073333333333336e-06, "loss": 0.4169, "step": 171200 }, { "epoch": 6.03, "learning_rate": 3.201777777777778e-06, "loss": 0.4019, "step": 171250 }, { "epoch": 6.03, "learning_rate": 3.1962222222222224e-06, "loss": 0.4134, "step": 171300 }, { "epoch": 6.03, "learning_rate": 3.190666666666667e-06, "loss": 0.392, "step": 171350 }, { "epoch": 6.03, "learning_rate": 3.1851111111111116e-06, "loss": 0.4148, "step": 171400 }, { "epoch": 6.04, "learning_rate": 3.1795555555555556e-06, "loss": 0.4369, "step": 171450 }, { "epoch": 6.04, "learning_rate": 3.1740000000000004e-06, "loss": 0.3844, "step": 171500 }, { "epoch": 6.04, "learning_rate": 3.1684444444444444e-06, "loss": 0.4142, "step": 171550 }, { "epoch": 6.04, "learning_rate": 3.1628888888888892e-06, "loss": 0.4009, "step": 171600 }, { "epoch": 6.04, "learning_rate": 3.1573333333333332e-06, "loss": 0.3849, "step": 171650 }, { "epoch": 6.05, "learning_rate": 3.151777777777778e-06, "loss": 0.4015, "step": 171700 }, { "epoch": 6.05, "learning_rate": 3.146222222222223e-06, "loss": 0.374, "step": 171750 }, { "epoch": 6.05, "learning_rate": 3.140666666666667e-06, "loss": 0.4017, "step": 171800 }, { "epoch": 6.05, "learning_rate": 3.1351111111111117e-06, "loss": 0.3826, "step": 171850 }, { "epoch": 6.05, "learning_rate": 3.1295555555555557e-06, "loss": 0.3818, "step": 171900 }, { "epoch": 6.05, "learning_rate": 3.1240000000000005e-06, "loss": 0.4122, "step": 171950 }, { "epoch": 6.06, "learning_rate": 3.1184444444444445e-06, "loss": 0.4191, "step": 172000 }, { "epoch": 6.06, "learning_rate": 3.1128888888888893e-06, "loss": 0.3958, "step": 172050 }, { "epoch": 6.06, "learning_rate": 3.1073333333333333e-06, "loss": 0.4054, "step": 172100 }, { "epoch": 6.06, "learning_rate": 3.101777777777778e-06, "loss": 0.413, "step": 172150 }, { "epoch": 6.06, "learning_rate": 3.0962222222222225e-06, "loss": 0.3815, "step": 172200 }, { "epoch": 6.06, "learning_rate": 3.090666666666667e-06, "loss": 0.4079, "step": 172250 }, { "epoch": 6.07, "learning_rate": 3.0851111111111113e-06, "loss": 0.4177, "step": 172300 }, { "epoch": 6.07, "learning_rate": 3.0795555555555557e-06, "loss": 0.4217, "step": 172350 }, { "epoch": 6.07, "learning_rate": 3.074e-06, "loss": 0.3685, "step": 172400 }, { "epoch": 6.07, "learning_rate": 3.0684444444444445e-06, "loss": 0.3915, "step": 172450 }, { "epoch": 6.07, "learning_rate": 3.062888888888889e-06, "loss": 0.4103, "step": 172500 }, { "epoch": 6.07, "eval_loss": 0.2476934790611267, "eval_runtime": 26.0832, "eval_samples_per_second": 54.441, "eval_steps_per_second": 3.412, "eval_wer": 0.18062993555414358, "step": 172500 }, { "epoch": 6.08, "learning_rate": 3.0573333333333338e-06, "loss": 0.4267, "step": 172550 }, { "epoch": 6.08, "learning_rate": 3.0517777777777777e-06, "loss": 0.3951, "step": 172600 }, { "epoch": 6.08, "learning_rate": 3.0462222222222226e-06, "loss": 0.4135, "step": 172650 }, { "epoch": 6.08, "learning_rate": 3.040666666666667e-06, "loss": 0.4254, "step": 172700 }, { "epoch": 6.08, "learning_rate": 3.0351111111111114e-06, "loss": 0.39, "step": 172750 }, { "epoch": 6.08, "learning_rate": 3.0295555555555558e-06, "loss": 0.3972, "step": 172800 }, { "epoch": 6.09, "learning_rate": 3.024e-06, "loss": 0.3875, "step": 172850 }, { "epoch": 6.09, "learning_rate": 3.018444444444445e-06, "loss": 0.4124, "step": 172900 }, { "epoch": 6.09, "learning_rate": 3.012888888888889e-06, "loss": 0.4326, "step": 172950 }, { "epoch": 6.09, "learning_rate": 3.007333333333334e-06, "loss": 0.4173, "step": 173000 }, { "epoch": 6.09, "learning_rate": 3.001777777777778e-06, "loss": 0.3872, "step": 173050 }, { "epoch": 6.09, "learning_rate": 2.9962222222222226e-06, "loss": 0.385, "step": 173100 }, { "epoch": 6.1, "learning_rate": 2.9906666666666666e-06, "loss": 0.4175, "step": 173150 }, { "epoch": 6.1, "learning_rate": 2.9852222222222226e-06, "loss": 0.378, "step": 173200 }, { "epoch": 6.1, "learning_rate": 2.9796666666666666e-06, "loss": 0.3806, "step": 173250 }, { "epoch": 6.1, "learning_rate": 2.9741111111111115e-06, "loss": 0.3893, "step": 173300 }, { "epoch": 6.1, "learning_rate": 2.9685555555555554e-06, "loss": 0.4038, "step": 173350 }, { "epoch": 6.11, "learning_rate": 2.9630000000000003e-06, "loss": 0.3798, "step": 173400 }, { "epoch": 6.11, "learning_rate": 2.9574444444444442e-06, "loss": 0.4101, "step": 173450 }, { "epoch": 6.11, "learning_rate": 2.951888888888889e-06, "loss": 0.3959, "step": 173500 }, { "epoch": 6.11, "learning_rate": 2.946333333333334e-06, "loss": 0.4183, "step": 173550 }, { "epoch": 6.11, "learning_rate": 2.940777777777778e-06, "loss": 0.3976, "step": 173600 }, { "epoch": 6.11, "learning_rate": 2.9352222222222227e-06, "loss": 0.402, "step": 173650 }, { "epoch": 6.12, "learning_rate": 2.9296666666666667e-06, "loss": 0.4192, "step": 173700 }, { "epoch": 6.12, "learning_rate": 2.9241111111111115e-06, "loss": 0.3996, "step": 173750 }, { "epoch": 6.12, "learning_rate": 2.9185555555555555e-06, "loss": 0.4116, "step": 173800 }, { "epoch": 6.12, "learning_rate": 2.9130000000000003e-06, "loss": 0.5279, "step": 173850 }, { "epoch": 6.12, "learning_rate": 2.907444444444445e-06, "loss": 0.4845, "step": 173900 }, { "epoch": 6.12, "learning_rate": 2.901888888888889e-06, "loss": 0.3991, "step": 173950 }, { "epoch": 6.13, "learning_rate": 2.896333333333334e-06, "loss": 0.4528, "step": 174000 }, { "epoch": 6.13, "learning_rate": 2.890777777777778e-06, "loss": 0.4028, "step": 174050 }, { "epoch": 6.13, "learning_rate": 2.8852222222222228e-06, "loss": 0.3929, "step": 174100 }, { "epoch": 6.13, "learning_rate": 2.879777777777778e-06, "loss": 0.4202, "step": 174150 }, { "epoch": 6.13, "learning_rate": 2.8742222222222228e-06, "loss": 0.3754, "step": 174200 }, { "epoch": 6.14, "learning_rate": 2.8686666666666668e-06, "loss": 0.3777, "step": 174250 }, { "epoch": 6.14, "learning_rate": 2.8631111111111116e-06, "loss": 0.3902, "step": 174300 }, { "epoch": 6.14, "learning_rate": 2.8575555555555556e-06, "loss": 0.3955, "step": 174350 }, { "epoch": 6.14, "learning_rate": 2.8520000000000004e-06, "loss": 0.4139, "step": 174400 }, { "epoch": 6.14, "learning_rate": 2.8464444444444444e-06, "loss": 0.4044, "step": 174450 }, { "epoch": 6.14, "learning_rate": 2.840888888888889e-06, "loss": 0.4503, "step": 174500 }, { "epoch": 6.15, "learning_rate": 2.835333333333334e-06, "loss": 0.4019, "step": 174550 }, { "epoch": 6.15, "learning_rate": 2.829777777777778e-06, "loss": 0.3967, "step": 174600 }, { "epoch": 6.15, "learning_rate": 2.824222222222223e-06, "loss": 0.4007, "step": 174650 }, { "epoch": 6.15, "learning_rate": 2.818666666666667e-06, "loss": 0.4191, "step": 174700 }, { "epoch": 6.15, "learning_rate": 2.8131111111111116e-06, "loss": 0.4068, "step": 174750 }, { "epoch": 6.15, "learning_rate": 2.8075555555555556e-06, "loss": 0.3781, "step": 174800 }, { "epoch": 6.16, "learning_rate": 2.8020000000000004e-06, "loss": 0.3705, "step": 174850 }, { "epoch": 6.16, "learning_rate": 2.7964444444444444e-06, "loss": 0.4156, "step": 174900 }, { "epoch": 6.16, "learning_rate": 2.7908888888888893e-06, "loss": 0.4291, "step": 174950 }, { "epoch": 6.16, "learning_rate": 2.7853333333333337e-06, "loss": 0.4291, "step": 175000 }, { "epoch": 6.16, "eval_loss": 0.2491951584815979, "eval_runtime": 13.8172, "eval_samples_per_second": 102.771, "eval_steps_per_second": 6.441, "eval_wer": 0.1835345375329037, "step": 175000 }, { "epoch": 6.16, "learning_rate": 2.779777777777778e-06, "loss": 0.4085, "step": 175050 }, { "epoch": 6.17, "learning_rate": 2.7742222222222225e-06, "loss": 0.4202, "step": 175100 }, { "epoch": 6.17, "learning_rate": 2.768666666666667e-06, "loss": 0.3993, "step": 175150 }, { "epoch": 6.17, "learning_rate": 2.7631111111111113e-06, "loss": 0.3984, "step": 175200 }, { "epoch": 6.17, "learning_rate": 2.7575555555555557e-06, "loss": 0.4016, "step": 175250 }, { "epoch": 6.17, "learning_rate": 2.752e-06, "loss": 0.4041, "step": 175300 }, { "epoch": 6.17, "learning_rate": 2.746444444444445e-06, "loss": 0.4327, "step": 175350 }, { "epoch": 6.18, "learning_rate": 2.740888888888889e-06, "loss": 0.3942, "step": 175400 }, { "epoch": 6.18, "learning_rate": 2.7353333333333337e-06, "loss": 0.4046, "step": 175450 }, { "epoch": 6.18, "learning_rate": 2.7297777777777777e-06, "loss": 0.3677, "step": 175500 }, { "epoch": 6.18, "learning_rate": 2.7242222222222225e-06, "loss": 0.3936, "step": 175550 }, { "epoch": 6.18, "learning_rate": 2.7186666666666665e-06, "loss": 0.3757, "step": 175600 }, { "epoch": 6.18, "learning_rate": 2.7131111111111113e-06, "loss": 0.3892, "step": 175650 }, { "epoch": 6.19, "learning_rate": 2.707555555555556e-06, "loss": 0.3897, "step": 175700 }, { "epoch": 6.19, "learning_rate": 2.702e-06, "loss": 0.451, "step": 175750 }, { "epoch": 6.19, "learning_rate": 2.696444444444445e-06, "loss": 0.4063, "step": 175800 }, { "epoch": 6.19, "learning_rate": 2.690888888888889e-06, "loss": 0.4178, "step": 175850 }, { "epoch": 6.19, "learning_rate": 2.6853333333333338e-06, "loss": 0.439, "step": 175900 }, { "epoch": 6.19, "learning_rate": 2.6797777777777777e-06, "loss": 0.4667, "step": 175950 }, { "epoch": 6.2, "learning_rate": 2.6742222222222226e-06, "loss": 0.3755, "step": 176000 }, { "epoch": 6.2, "learning_rate": 2.6686666666666666e-06, "loss": 0.4391, "step": 176050 }, { "epoch": 6.2, "learning_rate": 2.6631111111111114e-06, "loss": 0.3829, "step": 176100 }, { "epoch": 6.2, "learning_rate": 2.657555555555556e-06, "loss": 0.3907, "step": 176150 }, { "epoch": 6.2, "learning_rate": 2.652e-06, "loss": 0.3847, "step": 176200 }, { "epoch": 6.21, "learning_rate": 2.646444444444445e-06, "loss": 0.3908, "step": 176250 }, { "epoch": 6.21, "learning_rate": 2.640888888888889e-06, "loss": 0.4224, "step": 176300 }, { "epoch": 6.21, "learning_rate": 2.635333333333334e-06, "loss": 0.3889, "step": 176350 }, { "epoch": 6.21, "learning_rate": 2.629777777777778e-06, "loss": 0.3877, "step": 176400 }, { "epoch": 6.21, "learning_rate": 2.6242222222222226e-06, "loss": 0.4193, "step": 176450 }, { "epoch": 6.21, "learning_rate": 2.618666666666667e-06, "loss": 0.3972, "step": 176500 }, { "epoch": 6.22, "learning_rate": 2.6131111111111114e-06, "loss": 0.3847, "step": 176550 }, { "epoch": 6.22, "learning_rate": 2.607555555555556e-06, "loss": 0.3933, "step": 176600 }, { "epoch": 6.22, "learning_rate": 2.6020000000000002e-06, "loss": 0.3827, "step": 176650 }, { "epoch": 6.22, "learning_rate": 2.5965555555555554e-06, "loss": 0.4162, "step": 176700 }, { "epoch": 6.22, "learning_rate": 2.5910000000000003e-06, "loss": 0.3909, "step": 176750 }, { "epoch": 6.22, "learning_rate": 2.5854444444444447e-06, "loss": 0.4106, "step": 176800 }, { "epoch": 6.23, "learning_rate": 2.579888888888889e-06, "loss": 0.4152, "step": 176850 }, { "epoch": 6.23, "learning_rate": 2.5743333333333335e-06, "loss": 0.3868, "step": 176900 }, { "epoch": 6.23, "learning_rate": 2.568777777777778e-06, "loss": 0.491, "step": 176950 }, { "epoch": 6.23, "learning_rate": 2.5632222222222227e-06, "loss": 0.3921, "step": 177000 }, { "epoch": 6.23, "learning_rate": 2.5576666666666667e-06, "loss": 0.3673, "step": 177050 }, { "epoch": 6.24, "learning_rate": 2.5521111111111115e-06, "loss": 0.3934, "step": 177100 }, { "epoch": 6.24, "learning_rate": 2.546555555555556e-06, "loss": 0.4097, "step": 177150 }, { "epoch": 6.24, "learning_rate": 2.5410000000000003e-06, "loss": 0.3811, "step": 177200 }, { "epoch": 6.24, "learning_rate": 2.5354444444444447e-06, "loss": 0.4299, "step": 177250 }, { "epoch": 6.24, "learning_rate": 2.529888888888889e-06, "loss": 0.4165, "step": 177300 }, { "epoch": 6.24, "learning_rate": 2.5243333333333335e-06, "loss": 0.4092, "step": 177350 }, { "epoch": 6.25, "learning_rate": 2.518777777777778e-06, "loss": 0.4304, "step": 177400 }, { "epoch": 6.25, "learning_rate": 2.5132222222222223e-06, "loss": 0.3964, "step": 177450 }, { "epoch": 6.25, "learning_rate": 2.507666666666667e-06, "loss": 0.4417, "step": 177500 }, { "epoch": 6.25, "eval_loss": 0.2463950514793396, "eval_runtime": 19.7439, "eval_samples_per_second": 71.921, "eval_steps_per_second": 4.508, "eval_wer": 0.18244531179086865, "step": 177500 }, { "epoch": 6.25, "learning_rate": 2.502111111111111e-06, "loss": 0.3689, "step": 177550 }, { "epoch": 6.25, "learning_rate": 2.4965555555555555e-06, "loss": 0.4154, "step": 177600 }, { "epoch": 6.25, "learning_rate": 2.491e-06, "loss": 0.401, "step": 177650 }, { "epoch": 6.26, "learning_rate": 2.4854444444444448e-06, "loss": 0.3934, "step": 177700 }, { "epoch": 6.26, "learning_rate": 2.479888888888889e-06, "loss": 0.4123, "step": 177750 }, { "epoch": 6.26, "learning_rate": 2.4743333333333336e-06, "loss": 0.406, "step": 177800 }, { "epoch": 6.26, "learning_rate": 2.468777777777778e-06, "loss": 0.4255, "step": 177850 }, { "epoch": 6.26, "learning_rate": 2.4632222222222224e-06, "loss": 0.4056, "step": 177900 }, { "epoch": 6.27, "learning_rate": 2.457666666666667e-06, "loss": 0.4159, "step": 177950 }, { "epoch": 6.27, "learning_rate": 2.452111111111111e-06, "loss": 0.4064, "step": 178000 }, { "epoch": 6.27, "learning_rate": 2.4465555555555556e-06, "loss": 0.3934, "step": 178050 }, { "epoch": 6.27, "learning_rate": 2.4410000000000004e-06, "loss": 0.4094, "step": 178100 }, { "epoch": 6.27, "learning_rate": 2.435444444444445e-06, "loss": 0.3973, "step": 178150 }, { "epoch": 6.27, "learning_rate": 2.4298888888888892e-06, "loss": 0.3744, "step": 178200 }, { "epoch": 6.28, "learning_rate": 2.4243333333333336e-06, "loss": 0.4374, "step": 178250 }, { "epoch": 6.28, "learning_rate": 2.418777777777778e-06, "loss": 0.3979, "step": 178300 }, { "epoch": 6.28, "learning_rate": 2.4132222222222224e-06, "loss": 0.3973, "step": 178350 }, { "epoch": 6.28, "learning_rate": 2.407666666666667e-06, "loss": 0.3686, "step": 178400 }, { "epoch": 6.28, "learning_rate": 2.4021111111111113e-06, "loss": 0.3936, "step": 178450 }, { "epoch": 6.28, "learning_rate": 2.3965555555555557e-06, "loss": 0.3745, "step": 178500 }, { "epoch": 6.29, "learning_rate": 2.391e-06, "loss": 0.48, "step": 178550 }, { "epoch": 6.29, "learning_rate": 2.3854444444444445e-06, "loss": 0.4073, "step": 178600 }, { "epoch": 6.29, "learning_rate": 2.3798888888888893e-06, "loss": 0.4022, "step": 178650 }, { "epoch": 6.29, "learning_rate": 2.3743333333333337e-06, "loss": 0.4035, "step": 178700 }, { "epoch": 6.29, "learning_rate": 2.368777777777778e-06, "loss": 0.3879, "step": 178750 }, { "epoch": 6.3, "learning_rate": 2.3632222222222225e-06, "loss": 0.3859, "step": 178800 }, { "epoch": 6.3, "learning_rate": 2.357666666666667e-06, "loss": 0.3828, "step": 178850 }, { "epoch": 6.3, "learning_rate": 2.3521111111111113e-06, "loss": 0.3993, "step": 178900 }, { "epoch": 6.3, "learning_rate": 2.3465555555555557e-06, "loss": 0.4705, "step": 178950 }, { "epoch": 6.3, "learning_rate": 2.341e-06, "loss": 0.4223, "step": 179000 }, { "epoch": 6.3, "learning_rate": 2.3354444444444445e-06, "loss": 0.3784, "step": 179050 }, { "epoch": 6.31, "learning_rate": 2.329888888888889e-06, "loss": 0.3861, "step": 179100 }, { "epoch": 6.31, "learning_rate": 2.3243333333333333e-06, "loss": 0.4026, "step": 179150 }, { "epoch": 6.31, "learning_rate": 2.3187777777777777e-06, "loss": 0.377, "step": 179200 }, { "epoch": 6.31, "learning_rate": 2.3132222222222226e-06, "loss": 0.3937, "step": 179250 }, { "epoch": 6.31, "learning_rate": 2.307666666666667e-06, "loss": 0.4287, "step": 179300 }, { "epoch": 6.31, "learning_rate": 2.3021111111111114e-06, "loss": 0.3966, "step": 179350 }, { "epoch": 6.32, "learning_rate": 2.2965555555555558e-06, "loss": 0.3795, "step": 179400 }, { "epoch": 6.32, "learning_rate": 2.291e-06, "loss": 0.4198, "step": 179450 }, { "epoch": 6.32, "learning_rate": 2.2854444444444446e-06, "loss": 0.3893, "step": 179500 }, { "epoch": 6.32, "learning_rate": 2.279888888888889e-06, "loss": 0.3966, "step": 179550 }, { "epoch": 6.32, "learning_rate": 2.2743333333333334e-06, "loss": 0.3829, "step": 179600 }, { "epoch": 6.33, "learning_rate": 2.268777777777778e-06, "loss": 0.3919, "step": 179650 }, { "epoch": 6.33, "learning_rate": 2.2632222222222226e-06, "loss": 0.4112, "step": 179700 }, { "epoch": 6.33, "learning_rate": 2.257666666666667e-06, "loss": 0.4183, "step": 179750 }, { "epoch": 6.33, "learning_rate": 2.2521111111111114e-06, "loss": 0.3956, "step": 179800 }, { "epoch": 6.33, "learning_rate": 2.246555555555556e-06, "loss": 0.3726, "step": 179850 }, { "epoch": 6.33, "learning_rate": 2.2410000000000002e-06, "loss": 0.3996, "step": 179900 }, { "epoch": 6.34, "learning_rate": 2.235555555555556e-06, "loss": 0.379, "step": 179950 }, { "epoch": 6.34, "learning_rate": 2.2300000000000002e-06, "loss": 0.3962, "step": 180000 }, { "epoch": 6.34, "eval_loss": 0.24757064878940582, "eval_runtime": 26.6913, "eval_samples_per_second": 53.201, "eval_steps_per_second": 3.334, "eval_wer": 0.18153762367250612, "step": 180000 }, { "epoch": 6.34, "learning_rate": 2.2244444444444447e-06, "loss": 0.4071, "step": 180050 }, { "epoch": 6.34, "learning_rate": 2.218888888888889e-06, "loss": 0.395, "step": 180100 }, { "epoch": 6.34, "learning_rate": 2.2134444444444447e-06, "loss": 0.3827, "step": 180150 }, { "epoch": 6.34, "learning_rate": 2.207888888888889e-06, "loss": 0.4155, "step": 180200 }, { "epoch": 6.35, "learning_rate": 2.2023333333333335e-06, "loss": 0.3822, "step": 180250 }, { "epoch": 6.35, "learning_rate": 2.196777777777778e-06, "loss": 0.4087, "step": 180300 }, { "epoch": 6.35, "learning_rate": 2.1912222222222223e-06, "loss": 0.4137, "step": 180350 }, { "epoch": 6.35, "learning_rate": 2.1856666666666667e-06, "loss": 0.3887, "step": 180400 }, { "epoch": 6.35, "learning_rate": 2.180111111111111e-06, "loss": 0.4206, "step": 180450 }, { "epoch": 6.36, "learning_rate": 2.174555555555556e-06, "loss": 0.3907, "step": 180500 }, { "epoch": 6.36, "learning_rate": 2.1690000000000003e-06, "loss": 0.4251, "step": 180550 }, { "epoch": 6.36, "learning_rate": 2.1634444444444447e-06, "loss": 0.4005, "step": 180600 }, { "epoch": 6.36, "learning_rate": 2.157888888888889e-06, "loss": 0.4297, "step": 180650 }, { "epoch": 6.36, "learning_rate": 2.1523333333333335e-06, "loss": 0.3798, "step": 180700 }, { "epoch": 6.36, "learning_rate": 2.146777777777778e-06, "loss": 0.4114, "step": 180750 }, { "epoch": 6.37, "learning_rate": 2.1412222222222223e-06, "loss": 0.4011, "step": 180800 }, { "epoch": 6.37, "learning_rate": 2.1356666666666667e-06, "loss": 0.3965, "step": 180850 }, { "epoch": 6.37, "learning_rate": 2.1301111111111116e-06, "loss": 0.4141, "step": 180900 }, { "epoch": 6.37, "learning_rate": 2.124555555555556e-06, "loss": 0.3739, "step": 180950 }, { "epoch": 6.37, "learning_rate": 2.1190000000000004e-06, "loss": 0.41, "step": 181000 }, { "epoch": 6.37, "learning_rate": 2.1134444444444448e-06, "loss": 0.3883, "step": 181050 }, { "epoch": 6.38, "learning_rate": 2.107888888888889e-06, "loss": 0.432, "step": 181100 }, { "epoch": 6.38, "learning_rate": 2.1023333333333336e-06, "loss": 0.4074, "step": 181150 }, { "epoch": 6.38, "learning_rate": 2.096777777777778e-06, "loss": 0.4035, "step": 181200 }, { "epoch": 6.38, "learning_rate": 2.0912222222222224e-06, "loss": 0.4177, "step": 181250 }, { "epoch": 6.38, "learning_rate": 2.085666666666667e-06, "loss": 0.4313, "step": 181300 }, { "epoch": 6.39, "learning_rate": 2.080111111111111e-06, "loss": 0.415, "step": 181350 }, { "epoch": 6.39, "learning_rate": 2.0745555555555556e-06, "loss": 0.3939, "step": 181400 }, { "epoch": 6.39, "learning_rate": 2.069e-06, "loss": 0.4813, "step": 181450 }, { "epoch": 6.39, "learning_rate": 2.0634444444444444e-06, "loss": 0.4022, "step": 181500 }, { "epoch": 6.39, "learning_rate": 2.057888888888889e-06, "loss": 0.422, "step": 181550 }, { "epoch": 6.39, "learning_rate": 2.0523333333333332e-06, "loss": 0.4333, "step": 181600 }, { "epoch": 6.4, "learning_rate": 2.0467777777777776e-06, "loss": 0.389, "step": 181650 }, { "epoch": 6.4, "learning_rate": 2.0412222222222225e-06, "loss": 0.4075, "step": 181700 }, { "epoch": 6.4, "learning_rate": 2.035666666666667e-06, "loss": 0.3868, "step": 181750 }, { "epoch": 6.4, "learning_rate": 2.0301111111111113e-06, "loss": 0.3921, "step": 181800 }, { "epoch": 6.4, "learning_rate": 2.0245555555555557e-06, "loss": 0.4083, "step": 181850 }, { "epoch": 6.4, "learning_rate": 2.019e-06, "loss": 0.3916, "step": 181900 }, { "epoch": 6.41, "learning_rate": 2.0134444444444445e-06, "loss": 0.548, "step": 181950 }, { "epoch": 6.41, "learning_rate": 2.007888888888889e-06, "loss": 0.3752, "step": 182000 }, { "epoch": 6.41, "learning_rate": 2.0023333333333337e-06, "loss": 0.4287, "step": 182050 }, { "epoch": 6.41, "learning_rate": 1.996777777777778e-06, "loss": 0.3958, "step": 182100 }, { "epoch": 6.41, "learning_rate": 1.9912222222222225e-06, "loss": 0.3948, "step": 182150 }, { "epoch": 6.42, "learning_rate": 1.985666666666667e-06, "loss": 0.3929, "step": 182200 }, { "epoch": 6.42, "learning_rate": 1.9801111111111113e-06, "loss": 0.3919, "step": 182250 }, { "epoch": 6.42, "learning_rate": 1.9745555555555557e-06, "loss": 0.3882, "step": 182300 }, { "epoch": 6.42, "learning_rate": 1.969e-06, "loss": 0.4077, "step": 182350 }, { "epoch": 6.42, "learning_rate": 1.9634444444444445e-06, "loss": 0.3875, "step": 182400 }, { "epoch": 6.42, "learning_rate": 1.9578888888888894e-06, "loss": 0.3839, "step": 182450 }, { "epoch": 6.43, "learning_rate": 1.9523333333333338e-06, "loss": 0.4633, "step": 182500 }, { "epoch": 6.43, "eval_loss": 0.2447100579738617, "eval_runtime": 25.1277, "eval_samples_per_second": 56.511, "eval_steps_per_second": 3.542, "eval_wer": 0.18180993010801488, "step": 182500 }, { "epoch": 6.43, "learning_rate": 1.946777777777778e-06, "loss": 0.421, "step": 182550 }, { "epoch": 6.43, "learning_rate": 1.9412222222222226e-06, "loss": 0.4032, "step": 182600 }, { "epoch": 6.43, "learning_rate": 1.935666666666667e-06, "loss": 0.4147, "step": 182650 }, { "epoch": 6.43, "learning_rate": 1.9302222222222226e-06, "loss": 0.4593, "step": 182700 }, { "epoch": 6.43, "learning_rate": 1.924666666666667e-06, "loss": 0.436, "step": 182750 }, { "epoch": 6.44, "learning_rate": 1.9191111111111114e-06, "loss": 0.3634, "step": 182800 }, { "epoch": 6.44, "learning_rate": 1.913555555555556e-06, "loss": 0.3997, "step": 182850 }, { "epoch": 6.44, "learning_rate": 1.908e-06, "loss": 0.4076, "step": 182900 }, { "epoch": 6.44, "learning_rate": 1.9024444444444446e-06, "loss": 0.3974, "step": 182950 }, { "epoch": 6.44, "learning_rate": 1.896888888888889e-06, "loss": 0.4027, "step": 183000 }, { "epoch": 6.44, "learning_rate": 1.8913333333333334e-06, "loss": 0.4083, "step": 183050 }, { "epoch": 6.45, "learning_rate": 1.885777777777778e-06, "loss": 0.3808, "step": 183100 }, { "epoch": 6.45, "learning_rate": 1.8802222222222224e-06, "loss": 0.3828, "step": 183150 }, { "epoch": 6.45, "learning_rate": 1.8746666666666668e-06, "loss": 0.4046, "step": 183200 }, { "epoch": 6.45, "learning_rate": 1.8691111111111112e-06, "loss": 0.3881, "step": 183250 }, { "epoch": 6.45, "learning_rate": 1.8635555555555556e-06, "loss": 0.3938, "step": 183300 }, { "epoch": 6.46, "learning_rate": 1.858e-06, "loss": 0.3873, "step": 183350 }, { "epoch": 6.46, "learning_rate": 1.8524444444444444e-06, "loss": 0.3899, "step": 183400 }, { "epoch": 6.46, "learning_rate": 1.8468888888888893e-06, "loss": 0.3999, "step": 183450 }, { "epoch": 6.46, "learning_rate": 1.8413333333333337e-06, "loss": 0.3914, "step": 183500 }, { "epoch": 6.46, "learning_rate": 1.835777777777778e-06, "loss": 0.3769, "step": 183550 }, { "epoch": 6.46, "learning_rate": 1.8302222222222225e-06, "loss": 0.4294, "step": 183600 }, { "epoch": 6.47, "learning_rate": 1.8246666666666669e-06, "loss": 0.4115, "step": 183650 }, { "epoch": 6.47, "learning_rate": 1.8191111111111113e-06, "loss": 0.4086, "step": 183700 }, { "epoch": 6.47, "learning_rate": 1.8135555555555557e-06, "loss": 0.4374, "step": 183750 }, { "epoch": 6.47, "learning_rate": 1.808e-06, "loss": 0.3632, "step": 183800 }, { "epoch": 6.47, "learning_rate": 1.8024444444444447e-06, "loss": 0.4184, "step": 183850 }, { "epoch": 6.47, "learning_rate": 1.7968888888888891e-06, "loss": 0.4161, "step": 183900 }, { "epoch": 6.48, "learning_rate": 1.7913333333333335e-06, "loss": 0.4656, "step": 183950 }, { "epoch": 6.48, "learning_rate": 1.785777777777778e-06, "loss": 0.3969, "step": 184000 }, { "epoch": 6.48, "learning_rate": 1.7802222222222223e-06, "loss": 0.4304, "step": 184050 }, { "epoch": 6.48, "learning_rate": 1.7746666666666667e-06, "loss": 0.4195, "step": 184100 }, { "epoch": 6.48, "learning_rate": 1.7691111111111111e-06, "loss": 0.4056, "step": 184150 }, { "epoch": 6.49, "learning_rate": 1.7635555555555555e-06, "loss": 0.4163, "step": 184200 }, { "epoch": 6.49, "learning_rate": 1.7580000000000004e-06, "loss": 0.3966, "step": 184250 }, { "epoch": 6.49, "learning_rate": 1.7524444444444448e-06, "loss": 0.3882, "step": 184300 }, { "epoch": 6.49, "learning_rate": 1.7468888888888892e-06, "loss": 0.3835, "step": 184350 }, { "epoch": 6.49, "learning_rate": 1.7413333333333336e-06, "loss": 0.4475, "step": 184400 }, { "epoch": 6.49, "learning_rate": 1.735777777777778e-06, "loss": 0.4092, "step": 184450 }, { "epoch": 6.5, "learning_rate": 1.7302222222222224e-06, "loss": 0.3988, "step": 184500 }, { "epoch": 6.5, "learning_rate": 1.7246666666666668e-06, "loss": 0.415, "step": 184550 }, { "epoch": 6.5, "learning_rate": 1.7191111111111112e-06, "loss": 0.3892, "step": 184600 }, { "epoch": 6.5, "learning_rate": 1.7135555555555558e-06, "loss": 0.379, "step": 184650 }, { "epoch": 6.5, "learning_rate": 1.7080000000000002e-06, "loss": 0.4072, "step": 184700 }, { "epoch": 6.5, "learning_rate": 1.7024444444444446e-06, "loss": 0.3989, "step": 184750 }, { "epoch": 6.51, "learning_rate": 1.696888888888889e-06, "loss": 0.3949, "step": 184800 }, { "epoch": 6.51, "learning_rate": 1.6913333333333334e-06, "loss": 0.3743, "step": 184850 }, { "epoch": 6.51, "learning_rate": 1.6857777777777778e-06, "loss": 0.3737, "step": 184900 }, { "epoch": 6.51, "learning_rate": 1.6802222222222222e-06, "loss": 0.4224, "step": 184950 }, { "epoch": 6.51, "learning_rate": 1.6746666666666668e-06, "loss": 0.422, "step": 185000 }, { "epoch": 6.51, "eval_loss": 0.24550682306289673, "eval_runtime": 18.5613, "eval_samples_per_second": 76.503, "eval_steps_per_second": 4.795, "eval_wer": 0.18017609149496233, "step": 185000 }, { "epoch": 6.52, "learning_rate": 1.6691111111111112e-06, "loss": 0.4189, "step": 185050 }, { "epoch": 6.52, "learning_rate": 1.6635555555555559e-06, "loss": 0.402, "step": 185100 }, { "epoch": 6.52, "learning_rate": 1.6580000000000003e-06, "loss": 0.3844, "step": 185150 }, { "epoch": 6.52, "learning_rate": 1.6524444444444447e-06, "loss": 0.3994, "step": 185200 }, { "epoch": 6.52, "learning_rate": 1.646888888888889e-06, "loss": 0.4309, "step": 185250 }, { "epoch": 6.52, "learning_rate": 1.6413333333333335e-06, "loss": 0.5157, "step": 185300 }, { "epoch": 6.53, "learning_rate": 1.6357777777777779e-06, "loss": 0.3887, "step": 185350 }, { "epoch": 6.53, "learning_rate": 1.6302222222222225e-06, "loss": 0.3907, "step": 185400 }, { "epoch": 6.53, "learning_rate": 1.624666666666667e-06, "loss": 0.4021, "step": 185450 }, { "epoch": 6.53, "learning_rate": 1.6191111111111113e-06, "loss": 0.4026, "step": 185500 }, { "epoch": 6.53, "learning_rate": 1.6135555555555557e-06, "loss": 0.392, "step": 185550 }, { "epoch": 6.53, "learning_rate": 1.608e-06, "loss": 0.3996, "step": 185600 }, { "epoch": 6.54, "learning_rate": 1.6024444444444445e-06, "loss": 0.406, "step": 185650 }, { "epoch": 6.54, "learning_rate": 1.596888888888889e-06, "loss": 0.3938, "step": 185700 }, { "epoch": 6.54, "learning_rate": 1.5913333333333333e-06, "loss": 0.4006, "step": 185750 }, { "epoch": 6.54, "learning_rate": 1.585777777777778e-06, "loss": 0.3763, "step": 185800 }, { "epoch": 6.54, "learning_rate": 1.5802222222222223e-06, "loss": 0.4433, "step": 185850 }, { "epoch": 6.55, "learning_rate": 1.5746666666666667e-06, "loss": 0.3731, "step": 185900 }, { "epoch": 6.55, "learning_rate": 1.5691111111111114e-06, "loss": 0.4138, "step": 185950 }, { "epoch": 6.55, "learning_rate": 1.5635555555555558e-06, "loss": 0.4108, "step": 186000 }, { "epoch": 6.55, "learning_rate": 1.5580000000000002e-06, "loss": 0.4604, "step": 186050 }, { "epoch": 6.55, "learning_rate": 1.5524444444444446e-06, "loss": 0.3898, "step": 186100 }, { "epoch": 6.55, "learning_rate": 1.546888888888889e-06, "loss": 0.3886, "step": 186150 }, { "epoch": 6.56, "learning_rate": 1.5413333333333336e-06, "loss": 0.3959, "step": 186200 }, { "epoch": 6.56, "learning_rate": 1.535777777777778e-06, "loss": 0.4105, "step": 186250 }, { "epoch": 6.56, "learning_rate": 1.5302222222222224e-06, "loss": 0.3772, "step": 186300 }, { "epoch": 6.56, "learning_rate": 1.5246666666666668e-06, "loss": 0.4043, "step": 186350 }, { "epoch": 6.56, "learning_rate": 1.5191111111111112e-06, "loss": 0.3741, "step": 186400 }, { "epoch": 6.56, "learning_rate": 1.5135555555555556e-06, "loss": 0.4184, "step": 186450 }, { "epoch": 6.57, "learning_rate": 1.508e-06, "loss": 0.3917, "step": 186500 }, { "epoch": 6.57, "learning_rate": 1.5024444444444446e-06, "loss": 0.4438, "step": 186550 }, { "epoch": 6.57, "learning_rate": 1.497e-06, "loss": 0.4364, "step": 186600 }, { "epoch": 6.57, "learning_rate": 1.4914444444444444e-06, "loss": 0.3964, "step": 186650 }, { "epoch": 6.57, "learning_rate": 1.4858888888888888e-06, "loss": 0.421, "step": 186700 }, { "epoch": 6.58, "learning_rate": 1.4803333333333334e-06, "loss": 0.5303, "step": 186750 }, { "epoch": 6.58, "learning_rate": 1.474777777777778e-06, "loss": 0.4001, "step": 186800 }, { "epoch": 6.58, "learning_rate": 1.4692222222222225e-06, "loss": 0.383, "step": 186850 }, { "epoch": 6.58, "learning_rate": 1.4636666666666669e-06, "loss": 0.3891, "step": 186900 }, { "epoch": 6.58, "learning_rate": 1.4581111111111113e-06, "loss": 0.3716, "step": 186950 }, { "epoch": 6.58, "learning_rate": 1.4525555555555557e-06, "loss": 0.3745, "step": 187000 }, { "epoch": 6.59, "learning_rate": 1.447e-06, "loss": 0.4255, "step": 187050 }, { "epoch": 6.59, "learning_rate": 1.4414444444444445e-06, "loss": 0.4212, "step": 187100 }, { "epoch": 6.59, "learning_rate": 1.4358888888888889e-06, "loss": 0.3849, "step": 187150 }, { "epoch": 6.59, "learning_rate": 1.4303333333333335e-06, "loss": 0.4112, "step": 187200 }, { "epoch": 6.59, "learning_rate": 1.424777777777778e-06, "loss": 0.3994, "step": 187250 }, { "epoch": 6.59, "learning_rate": 1.4192222222222223e-06, "loss": 0.3929, "step": 187300 }, { "epoch": 6.6, "learning_rate": 1.4136666666666667e-06, "loss": 0.4016, "step": 187350 }, { "epoch": 6.6, "learning_rate": 1.4081111111111111e-06, "loss": 0.3851, "step": 187400 }, { "epoch": 6.6, "learning_rate": 1.4025555555555555e-06, "loss": 0.4077, "step": 187450 }, { "epoch": 6.6, "learning_rate": 1.397e-06, "loss": 0.4098, "step": 187500 }, { "epoch": 6.6, "eval_loss": 0.24884368479251862, "eval_runtime": 16.8143, "eval_samples_per_second": 84.452, "eval_steps_per_second": 5.293, "eval_wer": 0.1814468548606699, "step": 187500 }, { "epoch": 6.6, "learning_rate": 1.3914444444444443e-06, "loss": 0.4329, "step": 187550 }, { "epoch": 6.61, "learning_rate": 1.3858888888888892e-06, "loss": 0.3932, "step": 187600 }, { "epoch": 6.61, "learning_rate": 1.3803333333333336e-06, "loss": 0.4309, "step": 187650 }, { "epoch": 6.61, "learning_rate": 1.374777777777778e-06, "loss": 0.3818, "step": 187700 }, { "epoch": 6.61, "learning_rate": 1.3692222222222224e-06, "loss": 0.4185, "step": 187750 }, { "epoch": 6.61, "learning_rate": 1.3636666666666668e-06, "loss": 0.424, "step": 187800 }, { "epoch": 6.61, "learning_rate": 1.3581111111111112e-06, "loss": 0.3797, "step": 187850 }, { "epoch": 6.62, "learning_rate": 1.3525555555555556e-06, "loss": 0.3864, "step": 187900 }, { "epoch": 6.62, "learning_rate": 1.347e-06, "loss": 0.3854, "step": 187950 }, { "epoch": 6.62, "learning_rate": 1.3414444444444446e-06, "loss": 0.3924, "step": 188000 }, { "epoch": 6.62, "learning_rate": 1.335888888888889e-06, "loss": 0.502, "step": 188050 }, { "epoch": 6.62, "learning_rate": 1.3303333333333334e-06, "loss": 0.3883, "step": 188100 }, { "epoch": 6.62, "learning_rate": 1.3247777777777778e-06, "loss": 0.448, "step": 188150 }, { "epoch": 6.63, "learning_rate": 1.3192222222222222e-06, "loss": 0.3971, "step": 188200 }, { "epoch": 6.63, "learning_rate": 1.3136666666666666e-06, "loss": 0.3985, "step": 188250 }, { "epoch": 6.63, "learning_rate": 1.308111111111111e-06, "loss": 0.4218, "step": 188300 }, { "epoch": 6.63, "learning_rate": 1.3025555555555558e-06, "loss": 0.4033, "step": 188350 }, { "epoch": 6.63, "learning_rate": 1.2970000000000002e-06, "loss": 0.4024, "step": 188400 }, { "epoch": 6.64, "learning_rate": 1.2914444444444446e-06, "loss": 0.3726, "step": 188450 }, { "epoch": 6.64, "learning_rate": 1.285888888888889e-06, "loss": 0.4026, "step": 188500 }, { "epoch": 6.64, "learning_rate": 1.2803333333333335e-06, "loss": 0.3941, "step": 188550 }, { "epoch": 6.64, "learning_rate": 1.2747777777777779e-06, "loss": 0.4067, "step": 188600 }, { "epoch": 6.64, "learning_rate": 1.2692222222222223e-06, "loss": 0.4186, "step": 188650 }, { "epoch": 6.64, "learning_rate": 1.2636666666666667e-06, "loss": 0.4607, "step": 188700 }, { "epoch": 6.65, "learning_rate": 1.2581111111111113e-06, "loss": 0.3951, "step": 188750 }, { "epoch": 6.65, "learning_rate": 1.2525555555555557e-06, "loss": 0.4317, "step": 188800 }, { "epoch": 6.65, "learning_rate": 1.247e-06, "loss": 0.4094, "step": 188850 }, { "epoch": 6.65, "learning_rate": 1.2414444444444445e-06, "loss": 0.4026, "step": 188900 }, { "epoch": 6.65, "learning_rate": 1.235888888888889e-06, "loss": 0.4005, "step": 188950 }, { "epoch": 6.65, "learning_rate": 1.2303333333333333e-06, "loss": 0.3743, "step": 189000 }, { "epoch": 6.66, "learning_rate": 1.224777777777778e-06, "loss": 0.3894, "step": 189050 }, { "epoch": 6.66, "learning_rate": 1.2192222222222223e-06, "loss": 0.4254, "step": 189100 }, { "epoch": 6.66, "learning_rate": 1.2136666666666667e-06, "loss": 0.3793, "step": 189150 }, { "epoch": 6.66, "learning_rate": 1.2081111111111111e-06, "loss": 0.3799, "step": 189200 }, { "epoch": 6.66, "learning_rate": 1.2025555555555557e-06, "loss": 0.4591, "step": 189250 }, { "epoch": 6.67, "learning_rate": 1.1970000000000001e-06, "loss": 0.395, "step": 189300 }, { "epoch": 6.67, "learning_rate": 1.1914444444444445e-06, "loss": 0.3721, "step": 189350 }, { "epoch": 6.67, "learning_rate": 1.185888888888889e-06, "loss": 0.4183, "step": 189400 }, { "epoch": 6.67, "learning_rate": 1.1803333333333336e-06, "loss": 0.3714, "step": 189450 }, { "epoch": 6.67, "learning_rate": 1.174777777777778e-06, "loss": 0.3888, "step": 189500 }, { "epoch": 6.67, "learning_rate": 1.1692222222222224e-06, "loss": 0.3619, "step": 189550 }, { "epoch": 6.68, "learning_rate": 1.1636666666666668e-06, "loss": 0.3929, "step": 189600 }, { "epoch": 6.68, "learning_rate": 1.1581111111111112e-06, "loss": 0.3836, "step": 189650 }, { "epoch": 6.68, "learning_rate": 1.1525555555555556e-06, "loss": 0.3932, "step": 189700 }, { "epoch": 6.68, "learning_rate": 1.147e-06, "loss": 0.4022, "step": 189750 }, { "epoch": 6.68, "learning_rate": 1.1414444444444446e-06, "loss": 0.3975, "step": 189800 }, { "epoch": 6.68, "learning_rate": 1.135888888888889e-06, "loss": 0.4073, "step": 189850 }, { "epoch": 6.69, "learning_rate": 1.1303333333333334e-06, "loss": 0.4253, "step": 189900 }, { "epoch": 6.69, "learning_rate": 1.1247777777777778e-06, "loss": 0.4282, "step": 189950 }, { "epoch": 6.69, "learning_rate": 1.1192222222222224e-06, "loss": 0.4018, "step": 190000 }, { "epoch": 6.69, "eval_loss": 0.2453201562166214, "eval_runtime": 6.418, "eval_samples_per_second": 221.253, "eval_steps_per_second": 13.867, "eval_wer": 0.18035762911863484, "step": 190000 }, { "epoch": 6.69, "learning_rate": 1.1136666666666668e-06, "loss": 0.367, "step": 190050 }, { "epoch": 6.69, "learning_rate": 1.1081111111111112e-06, "loss": 0.3667, "step": 190100 }, { "epoch": 6.69, "learning_rate": 1.1025555555555556e-06, "loss": 0.4004, "step": 190150 }, { "epoch": 6.7, "learning_rate": 1.097e-06, "loss": 0.3907, "step": 190200 }, { "epoch": 6.7, "learning_rate": 1.0914444444444447e-06, "loss": 0.3745, "step": 190250 }, { "epoch": 6.7, "learning_rate": 1.085888888888889e-06, "loss": 0.3878, "step": 190300 }, { "epoch": 6.7, "learning_rate": 1.0803333333333335e-06, "loss": 0.3772, "step": 190350 }, { "epoch": 6.7, "learning_rate": 1.0747777777777779e-06, "loss": 0.4021, "step": 190400 }, { "epoch": 6.71, "learning_rate": 1.0692222222222223e-06, "loss": 0.41, "step": 190450 }, { "epoch": 6.71, "learning_rate": 1.0636666666666667e-06, "loss": 0.4071, "step": 190500 }, { "epoch": 6.71, "learning_rate": 1.058111111111111e-06, "loss": 0.4161, "step": 190550 }, { "epoch": 6.71, "learning_rate": 1.0525555555555557e-06, "loss": 0.3775, "step": 190600 }, { "epoch": 6.71, "learning_rate": 1.047e-06, "loss": 0.3784, "step": 190650 }, { "epoch": 6.71, "learning_rate": 1.0414444444444445e-06, "loss": 0.4101, "step": 190700 }, { "epoch": 6.72, "learning_rate": 1.035888888888889e-06, "loss": 0.3745, "step": 190750 }, { "epoch": 6.72, "learning_rate": 1.0303333333333335e-06, "loss": 0.3711, "step": 190800 }, { "epoch": 6.72, "learning_rate": 1.024777777777778e-06, "loss": 0.4073, "step": 190850 }, { "epoch": 6.72, "learning_rate": 1.0192222222222223e-06, "loss": 0.3628, "step": 190900 }, { "epoch": 6.72, "learning_rate": 1.0136666666666667e-06, "loss": 0.4123, "step": 190950 }, { "epoch": 6.72, "learning_rate": 1.0081111111111111e-06, "loss": 0.4008, "step": 191000 }, { "epoch": 6.73, "learning_rate": 1.0026666666666668e-06, "loss": 0.4017, "step": 191050 }, { "epoch": 6.73, "learning_rate": 9.971111111111112e-07, "loss": 0.4095, "step": 191100 }, { "epoch": 6.73, "learning_rate": 9.915555555555556e-07, "loss": 0.3935, "step": 191150 }, { "epoch": 6.73, "learning_rate": 9.86e-07, "loss": 0.3825, "step": 191200 }, { "epoch": 6.73, "learning_rate": 9.804444444444446e-07, "loss": 0.4331, "step": 191250 }, { "epoch": 6.74, "learning_rate": 9.74888888888889e-07, "loss": 0.3751, "step": 191300 }, { "epoch": 6.74, "learning_rate": 9.693333333333334e-07, "loss": 0.4052, "step": 191350 }, { "epoch": 6.74, "learning_rate": 9.63777777777778e-07, "loss": 0.3859, "step": 191400 }, { "epoch": 6.74, "learning_rate": 9.582222222222224e-07, "loss": 0.3751, "step": 191450 }, { "epoch": 6.74, "learning_rate": 9.526666666666667e-07, "loss": 0.4097, "step": 191500 }, { "epoch": 6.74, "learning_rate": 9.471111111111111e-07, "loss": 0.4488, "step": 191550 }, { "epoch": 6.75, "learning_rate": 9.415555555555557e-07, "loss": 0.3997, "step": 191600 }, { "epoch": 6.75, "learning_rate": 9.360000000000001e-07, "loss": 0.4041, "step": 191650 }, { "epoch": 6.75, "learning_rate": 9.304444444444445e-07, "loss": 0.3733, "step": 191700 }, { "epoch": 6.75, "learning_rate": 9.248888888888889e-07, "loss": 0.4053, "step": 191750 }, { "epoch": 6.75, "learning_rate": 9.193333333333334e-07, "loss": 0.4011, "step": 191800 }, { "epoch": 6.75, "learning_rate": 9.137777777777778e-07, "loss": 0.4129, "step": 191850 }, { "epoch": 6.76, "learning_rate": 9.082222222222222e-07, "loss": 0.4045, "step": 191900 }, { "epoch": 6.76, "learning_rate": 9.026666666666666e-07, "loss": 0.417, "step": 191950 }, { "epoch": 6.76, "learning_rate": 8.971111111111113e-07, "loss": 0.3729, "step": 192000 }, { "epoch": 6.76, "learning_rate": 8.915555555555557e-07, "loss": 0.3628, "step": 192050 }, { "epoch": 6.76, "learning_rate": 8.860000000000001e-07, "loss": 0.3744, "step": 192100 }, { "epoch": 6.77, "learning_rate": 8.804444444444445e-07, "loss": 0.4, "step": 192150 }, { "epoch": 6.77, "learning_rate": 8.74888888888889e-07, "loss": 0.4011, "step": 192200 }, { "epoch": 6.77, "learning_rate": 8.693333333333334e-07, "loss": 0.4231, "step": 192250 }, { "epoch": 6.77, "learning_rate": 8.637777777777778e-07, "loss": 0.4008, "step": 192300 }, { "epoch": 6.77, "learning_rate": 8.582222222222222e-07, "loss": 0.3929, "step": 192350 }, { "epoch": 6.77, "learning_rate": 8.526666666666668e-07, "loss": 0.4007, "step": 192400 }, { "epoch": 6.78, "learning_rate": 8.471111111111112e-07, "loss": 0.4244, "step": 192450 }, { "epoch": 6.78, "learning_rate": 8.415555555555556e-07, "loss": 0.4559, "step": 192500 }, { "epoch": 6.78, "eval_loss": 0.24582235515117645, "eval_runtime": 7.3621, "eval_samples_per_second": 192.88, "eval_steps_per_second": 12.089, "eval_wer": 0.18226377416719616, "step": 192500 }, { "epoch": 6.78, "learning_rate": 8.36e-07, "loss": 0.3989, "step": 192550 }, { "epoch": 6.78, "learning_rate": 8.304444444444445e-07, "loss": 0.4205, "step": 192600 }, { "epoch": 6.78, "learning_rate": 8.248888888888889e-07, "loss": 0.3909, "step": 192650 }, { "epoch": 6.78, "learning_rate": 8.193333333333333e-07, "loss": 0.3882, "step": 192700 }, { "epoch": 6.79, "learning_rate": 8.137777777777777e-07, "loss": 0.3675, "step": 192750 }, { "epoch": 6.79, "learning_rate": 8.082222222222224e-07, "loss": 0.3746, "step": 192800 }, { "epoch": 6.79, "learning_rate": 8.026666666666668e-07, "loss": 0.3875, "step": 192850 }, { "epoch": 6.79, "learning_rate": 7.971111111111112e-07, "loss": 0.4281, "step": 192900 }, { "epoch": 6.79, "learning_rate": 7.915555555555557e-07, "loss": 0.3757, "step": 192950 }, { "epoch": 6.8, "learning_rate": 7.860000000000001e-07, "loss": 0.3982, "step": 193000 }, { "epoch": 6.8, "learning_rate": 7.804444444444445e-07, "loss": 0.3887, "step": 193050 }, { "epoch": 6.8, "learning_rate": 7.748888888888889e-07, "loss": 0.375, "step": 193100 }, { "epoch": 6.8, "learning_rate": 7.693333333333335e-07, "loss": 0.4077, "step": 193150 }, { "epoch": 6.8, "learning_rate": 7.637777777777779e-07, "loss": 0.4246, "step": 193200 }, { "epoch": 6.8, "learning_rate": 7.582222222222223e-07, "loss": 0.3804, "step": 193250 }, { "epoch": 6.81, "learning_rate": 7.526666666666667e-07, "loss": 0.4214, "step": 193300 }, { "epoch": 6.81, "learning_rate": 7.471111111111112e-07, "loss": 0.4053, "step": 193350 }, { "epoch": 6.81, "learning_rate": 7.415555555555556e-07, "loss": 0.4616, "step": 193400 }, { "epoch": 6.81, "learning_rate": 7.36e-07, "loss": 0.3863, "step": 193450 }, { "epoch": 6.81, "learning_rate": 7.304444444444444e-07, "loss": 0.3825, "step": 193500 }, { "epoch": 6.81, "learning_rate": 7.24888888888889e-07, "loss": 0.3819, "step": 193550 }, { "epoch": 6.82, "learning_rate": 7.193333333333334e-07, "loss": 0.6631, "step": 193600 }, { "epoch": 6.82, "learning_rate": 7.137777777777779e-07, "loss": 0.377, "step": 193650 }, { "epoch": 6.82, "learning_rate": 7.082222222222223e-07, "loss": 0.3761, "step": 193700 }, { "epoch": 6.82, "learning_rate": 7.026666666666668e-07, "loss": 0.3797, "step": 193750 }, { "epoch": 6.82, "learning_rate": 6.971111111111112e-07, "loss": 0.3869, "step": 193800 }, { "epoch": 6.83, "learning_rate": 6.915555555555556e-07, "loss": 0.3707, "step": 193850 }, { "epoch": 6.83, "learning_rate": 6.86e-07, "loss": 0.3895, "step": 193900 }, { "epoch": 6.83, "learning_rate": 6.804444444444446e-07, "loss": 0.5131, "step": 193950 }, { "epoch": 6.83, "learning_rate": 6.74888888888889e-07, "loss": 0.3799, "step": 194000 }, { "epoch": 6.83, "learning_rate": 6.693333333333334e-07, "loss": 0.3812, "step": 194050 }, { "epoch": 6.83, "learning_rate": 6.637777777777778e-07, "loss": 0.4706, "step": 194100 }, { "epoch": 6.84, "learning_rate": 6.582222222222223e-07, "loss": 0.3896, "step": 194150 }, { "epoch": 6.84, "learning_rate": 6.526666666666667e-07, "loss": 0.3939, "step": 194200 }, { "epoch": 6.84, "learning_rate": 6.471111111111111e-07, "loss": 0.3997, "step": 194250 }, { "epoch": 6.84, "learning_rate": 6.415555555555555e-07, "loss": 0.3788, "step": 194300 }, { "epoch": 6.84, "learning_rate": 6.360000000000001e-07, "loss": 0.4158, "step": 194350 }, { "epoch": 6.84, "learning_rate": 6.304444444444445e-07, "loss": 0.4074, "step": 194400 }, { "epoch": 6.85, "learning_rate": 6.248888888888889e-07, "loss": 0.4058, "step": 194450 }, { "epoch": 6.85, "learning_rate": 6.193333333333333e-07, "loss": 0.4541, "step": 194500 }, { "epoch": 6.85, "learning_rate": 6.137777777777779e-07, "loss": 0.3895, "step": 194550 }, { "epoch": 6.85, "learning_rate": 6.082222222222223e-07, "loss": 0.4014, "step": 194600 }, { "epoch": 6.85, "learning_rate": 6.026666666666668e-07, "loss": 0.4015, "step": 194650 }, { "epoch": 6.86, "learning_rate": 5.971111111111112e-07, "loss": 0.3946, "step": 194700 }, { "epoch": 6.86, "learning_rate": 5.915555555555557e-07, "loss": 0.3938, "step": 194750 }, { "epoch": 6.86, "learning_rate": 5.860000000000001e-07, "loss": 0.3941, "step": 194800 }, { "epoch": 6.86, "learning_rate": 5.804444444444445e-07, "loss": 0.3844, "step": 194850 }, { "epoch": 6.86, "learning_rate": 5.748888888888889e-07, "loss": 0.3843, "step": 194900 }, { "epoch": 6.86, "learning_rate": 5.693333333333334e-07, "loss": 0.3685, "step": 194950 }, { "epoch": 6.87, "learning_rate": 5.637777777777778e-07, "loss": 0.4033, "step": 195000 }, { "epoch": 6.87, "eval_loss": 0.24510587751865387, "eval_runtime": 7.116, "eval_samples_per_second": 199.551, "eval_steps_per_second": 12.507, "eval_wer": 0.1794499410002723, "step": 195000 }, { "epoch": 6.87, "learning_rate": 5.582222222222223e-07, "loss": 0.4123, "step": 195050 }, { "epoch": 6.87, "learning_rate": 5.526666666666667e-07, "loss": 0.3905, "step": 195100 }, { "epoch": 6.87, "learning_rate": 5.472222222222222e-07, "loss": 0.4451, "step": 195150 }, { "epoch": 6.87, "learning_rate": 5.416666666666667e-07, "loss": 0.4155, "step": 195200 }, { "epoch": 6.87, "learning_rate": 5.361111111111111e-07, "loss": 0.415, "step": 195250 }, { "epoch": 6.88, "learning_rate": 5.305555555555557e-07, "loss": 0.3735, "step": 195300 }, { "epoch": 6.88, "learning_rate": 5.250000000000001e-07, "loss": 0.3848, "step": 195350 }, { "epoch": 6.88, "learning_rate": 5.194444444444445e-07, "loss": 0.3688, "step": 195400 }, { "epoch": 6.88, "learning_rate": 5.138888888888889e-07, "loss": 0.45, "step": 195450 }, { "epoch": 6.88, "learning_rate": 5.083333333333334e-07, "loss": 0.3952, "step": 195500 }, { "epoch": 6.89, "learning_rate": 5.02888888888889e-07, "loss": 0.6184, "step": 195550 }, { "epoch": 6.89, "learning_rate": 4.973333333333334e-07, "loss": 0.4077, "step": 195600 }, { "epoch": 6.89, "learning_rate": 4.917777777777778e-07, "loss": 0.413, "step": 195650 }, { "epoch": 6.89, "learning_rate": 4.862222222222222e-07, "loss": 0.3929, "step": 195700 }, { "epoch": 6.89, "learning_rate": 4.806666666666667e-07, "loss": 0.3742, "step": 195750 }, { "epoch": 6.89, "learning_rate": 4.751111111111111e-07, "loss": 0.4119, "step": 195800 }, { "epoch": 6.9, "learning_rate": 4.695555555555556e-07, "loss": 0.4402, "step": 195850 }, { "epoch": 6.9, "learning_rate": 4.64e-07, "loss": 0.3924, "step": 195900 }, { "epoch": 6.9, "learning_rate": 4.584444444444445e-07, "loss": 0.4304, "step": 195950 }, { "epoch": 6.9, "learning_rate": 4.528888888888889e-07, "loss": 0.3923, "step": 196000 }, { "epoch": 6.9, "learning_rate": 4.473333333333334e-07, "loss": 0.4204, "step": 196050 }, { "epoch": 6.9, "learning_rate": 4.4177777777777785e-07, "loss": 0.38, "step": 196100 }, { "epoch": 6.91, "learning_rate": 4.3622222222222225e-07, "loss": 0.4067, "step": 196150 }, { "epoch": 6.91, "learning_rate": 4.306666666666667e-07, "loss": 0.378, "step": 196200 }, { "epoch": 6.91, "learning_rate": 4.251111111111111e-07, "loss": 0.4086, "step": 196250 }, { "epoch": 6.91, "learning_rate": 4.195555555555556e-07, "loss": 0.3856, "step": 196300 }, { "epoch": 6.91, "learning_rate": 4.1400000000000003e-07, "loss": 0.3961, "step": 196350 }, { "epoch": 6.92, "learning_rate": 4.084444444444445e-07, "loss": 0.3867, "step": 196400 }, { "epoch": 6.92, "learning_rate": 4.028888888888889e-07, "loss": 0.4854, "step": 196450 }, { "epoch": 6.92, "learning_rate": 3.973333333333334e-07, "loss": 0.3894, "step": 196500 }, { "epoch": 6.92, "learning_rate": 3.917777777777778e-07, "loss": 0.3824, "step": 196550 }, { "epoch": 6.92, "learning_rate": 3.8622222222222226e-07, "loss": 0.4189, "step": 196600 }, { "epoch": 6.92, "learning_rate": 3.8066666666666666e-07, "loss": 0.405, "step": 196650 }, { "epoch": 6.93, "learning_rate": 3.7511111111111117e-07, "loss": 0.4278, "step": 196700 }, { "epoch": 6.93, "learning_rate": 3.695555555555556e-07, "loss": 0.4307, "step": 196750 }, { "epoch": 6.93, "learning_rate": 3.6400000000000003e-07, "loss": 0.4142, "step": 196800 }, { "epoch": 6.93, "learning_rate": 3.5844444444444443e-07, "loss": 0.4206, "step": 196850 }, { "epoch": 6.93, "learning_rate": 3.5288888888888894e-07, "loss": 0.3743, "step": 196900 }, { "epoch": 6.93, "learning_rate": 3.4733333333333335e-07, "loss": 0.392, "step": 196950 }, { "epoch": 6.94, "learning_rate": 3.417777777777778e-07, "loss": 0.4369, "step": 197000 }, { "epoch": 6.94, "learning_rate": 3.362222222222222e-07, "loss": 0.3947, "step": 197050 }, { "epoch": 6.94, "learning_rate": 3.306666666666667e-07, "loss": 0.3977, "step": 197100 }, { "epoch": 6.94, "learning_rate": 3.251111111111111e-07, "loss": 0.3702, "step": 197150 }, { "epoch": 6.94, "learning_rate": 3.195555555555556e-07, "loss": 0.3989, "step": 197200 }, { "epoch": 6.94, "learning_rate": 3.14e-07, "loss": 0.3571, "step": 197250 }, { "epoch": 6.95, "learning_rate": 3.084444444444445e-07, "loss": 0.4199, "step": 197300 }, { "epoch": 6.95, "learning_rate": 3.0288888888888895e-07, "loss": 0.4124, "step": 197350 }, { "epoch": 6.95, "learning_rate": 2.9733333333333335e-07, "loss": 0.4084, "step": 197400 }, { "epoch": 6.95, "learning_rate": 2.917777777777778e-07, "loss": 0.4062, "step": 197450 }, { "epoch": 6.95, "learning_rate": 2.8622222222222226e-07, "loss": 0.3829, "step": 197500 }, { "epoch": 6.95, "eval_loss": 0.24527962505817413, "eval_runtime": 22.3814, "eval_samples_per_second": 63.446, "eval_steps_per_second": 3.977, "eval_wer": 0.18035762911863484, "step": 197500 }, { "epoch": 6.96, "learning_rate": 2.8066666666666667e-07, "loss": 0.4449, "step": 197550 }, { "epoch": 6.96, "learning_rate": 2.751111111111111e-07, "loss": 0.3997, "step": 197600 }, { "epoch": 6.96, "learning_rate": 2.695555555555556e-07, "loss": 0.383, "step": 197650 }, { "epoch": 6.96, "learning_rate": 2.6400000000000003e-07, "loss": 0.4019, "step": 197700 }, { "epoch": 6.96, "learning_rate": 2.5844444444444444e-07, "loss": 0.3734, "step": 197750 }, { "epoch": 6.96, "learning_rate": 2.528888888888889e-07, "loss": 0.3864, "step": 197800 }, { "epoch": 6.97, "learning_rate": 2.4733333333333335e-07, "loss": 0.3614, "step": 197850 }, { "epoch": 6.97, "learning_rate": 2.417777777777778e-07, "loss": 0.3876, "step": 197900 }, { "epoch": 6.97, "learning_rate": 2.3622222222222224e-07, "loss": 0.413, "step": 197950 }, { "epoch": 6.97, "learning_rate": 2.3066666666666667e-07, "loss": 0.3803, "step": 198000 }, { "epoch": 6.97, "learning_rate": 2.2511111111111112e-07, "loss": 0.3771, "step": 198050 }, { "epoch": 6.97, "learning_rate": 2.1955555555555555e-07, "loss": 0.4067, "step": 198100 }, { "epoch": 6.98, "learning_rate": 2.14e-07, "loss": 0.4004, "step": 198150 }, { "epoch": 6.98, "learning_rate": 2.0844444444444444e-07, "loss": 0.4056, "step": 198200 }, { "epoch": 6.98, "learning_rate": 2.028888888888889e-07, "loss": 0.379, "step": 198250 }, { "epoch": 6.98, "learning_rate": 1.9733333333333333e-07, "loss": 0.4205, "step": 198300 }, { "epoch": 6.98, "learning_rate": 1.9177777777777778e-07, "loss": 0.3956, "step": 198350 }, { "epoch": 6.99, "learning_rate": 1.8622222222222221e-07, "loss": 0.3851, "step": 198400 }, { "epoch": 6.99, "learning_rate": 1.806666666666667e-07, "loss": 0.3963, "step": 198450 }, { "epoch": 6.99, "learning_rate": 1.7511111111111115e-07, "loss": 0.4155, "step": 198500 }, { "epoch": 6.99, "learning_rate": 1.6955555555555558e-07, "loss": 0.466, "step": 198550 }, { "epoch": 6.99, "learning_rate": 1.6400000000000004e-07, "loss": 0.3965, "step": 198600 }, { "epoch": 6.99, "learning_rate": 1.5844444444444447e-07, "loss": 0.3897, "step": 198650 }, { "epoch": 7.0, "learning_rate": 1.528888888888889e-07, "loss": 0.376, "step": 198700 }, { "epoch": 7.0, "learning_rate": 1.4733333333333333e-07, "loss": 0.377, "step": 198750 }, { "epoch": 7.0, "learning_rate": 1.4177777777777779e-07, "loss": 0.3874, "step": 198800 }, { "epoch": 7.0, "learning_rate": 1.3622222222222224e-07, "loss": 0.3863, "step": 198850 }, { "epoch": 7.0, "learning_rate": 1.3066666666666667e-07, "loss": 0.3925, "step": 198900 }, { "epoch": 7.0, "learning_rate": 1.2511111111111113e-07, "loss": 0.4244, "step": 198950 }, { "epoch": 7.01, "learning_rate": 1.1955555555555556e-07, "loss": 0.4064, "step": 199000 }, { "epoch": 7.01, "learning_rate": 1.1400000000000001e-07, "loss": 0.3831, "step": 199050 }, { "epoch": 7.01, "learning_rate": 1.0844444444444446e-07, "loss": 0.3925, "step": 199100 }, { "epoch": 7.01, "learning_rate": 1.028888888888889e-07, "loss": 0.4377, "step": 199150 }, { "epoch": 7.01, "learning_rate": 9.733333333333334e-08, "loss": 0.3752, "step": 199200 }, { "epoch": 7.02, "learning_rate": 9.177777777777779e-08, "loss": 0.3736, "step": 199250 }, { "epoch": 7.02, "learning_rate": 8.622222222222223e-08, "loss": 0.4006, "step": 199300 }, { "epoch": 7.02, "learning_rate": 8.066666666666667e-08, "loss": 0.4034, "step": 199350 }, { "epoch": 7.02, "learning_rate": 7.511111111111112e-08, "loss": 0.3745, "step": 199400 }, { "epoch": 7.02, "learning_rate": 6.955555555555556e-08, "loss": 0.4022, "step": 199450 }, { "epoch": 7.02, "learning_rate": 6.4e-08, "loss": 0.3778, "step": 199500 }, { "epoch": 7.03, "learning_rate": 5.8444444444444454e-08, "loss": 0.4699, "step": 199550 }, { "epoch": 7.03, "learning_rate": 5.28888888888889e-08, "loss": 0.4082, "step": 199600 }, { "epoch": 7.03, "learning_rate": 4.733333333333334e-08, "loss": 0.4372, "step": 199650 }, { "epoch": 7.03, "learning_rate": 4.177777777777778e-08, "loss": 0.3597, "step": 199700 }, { "epoch": 7.03, "learning_rate": 3.622222222222223e-08, "loss": 0.4258, "step": 199750 }, { "epoch": 7.03, "learning_rate": 3.066666666666667e-08, "loss": 0.3774, "step": 199800 }, { "epoch": 7.04, "learning_rate": 2.5111111111111113e-08, "loss": 0.3795, "step": 199850 }, { "epoch": 7.04, "learning_rate": 1.9555555555555556e-08, "loss": 0.3969, "step": 199900 }, { "epoch": 7.04, "learning_rate": 1.411111111111111e-08, "loss": 0.4157, "step": 199950 }, { "epoch": 7.04, "learning_rate": 8.555555555555557e-09, "loss": 0.3676, "step": 200000 }, { "epoch": 7.04, "eval_loss": 0.24543938040733337, "eval_runtime": 117.2116, "eval_samples_per_second": 12.115, "eval_steps_per_second": 0.759, "eval_wer": 0.18035762911863484, "step": 200000 }, { "epoch": 7.04, "step": 200000, "total_flos": 3.8907541870249184e+21, "train_loss": 0.7787630347633362, "train_runtime": 209083.4414, "train_samples_per_second": 45.915, "train_steps_per_second": 0.957 } ], "logging_steps": 50, "max_steps": 200000, "num_train_epochs": 8, "save_steps": 500, "total_flos": 3.8907541870249184e+21, "trial_name": null, "trial_params": null }