{ "best_metric": 24.914285714285715, "best_model_checkpoint": "./checkpoint-51000", "epoch": 1.0000166666666668, "global_step": 60001, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "learning_rate": 4.4e-07, "loss": 4.5376, "step": 25 }, { "epoch": 2.0, "learning_rate": 8.8e-07, "loss": 3.8397, "step": 50 }, { "epoch": 4.0, "learning_rate": 1.3800000000000001e-06, "loss": 2.7952, "step": 75 }, { "epoch": 5.0, "learning_rate": 1.8800000000000002e-06, "loss": 2.1357, "step": 100 }, { "epoch": 7.0, "learning_rate": 2.38e-06, "loss": 1.6674, "step": 125 }, { "epoch": 8.0, "learning_rate": 2.88e-06, "loss": 1.3925, "step": 150 }, { "epoch": 10.0, "learning_rate": 3.3800000000000007e-06, "loss": 1.1533, "step": 175 }, { "epoch": 11.0, "learning_rate": 3.88e-06, "loss": 0.957, "step": 200 }, { "epoch": 13.0, "learning_rate": 4.38e-06, "loss": 0.8493, "step": 225 }, { "epoch": 14.0, "learning_rate": 4.880000000000001e-06, "loss": 0.8259, "step": 250 }, { "epoch": 16.0, "learning_rate": 5.380000000000001e-06, "loss": 0.7435, "step": 275 }, { "epoch": 17.0, "learning_rate": 5.8800000000000005e-06, "loss": 0.7692, "step": 300 }, { "epoch": 19.0, "learning_rate": 6.380000000000001e-06, "loss": 0.7232, "step": 325 }, { "epoch": 20.0, "learning_rate": 6.88e-06, "loss": 0.7097, "step": 350 }, { "epoch": 22.0, "learning_rate": 7.3800000000000005e-06, "loss": 0.6814, "step": 375 }, { "epoch": 23.0, "learning_rate": 7.88e-06, "loss": 0.6832, "step": 400 }, { "epoch": 24.0, "learning_rate": 8.380000000000001e-06, "loss": 0.5935, "step": 425 }, { "epoch": 26.0, "learning_rate": 8.880000000000001e-06, "loss": 0.6328, "step": 450 }, { "epoch": 27.0, "learning_rate": 9.38e-06, "loss": 0.5815, "step": 475 }, { "epoch": 29.0, "learning_rate": 9.88e-06, "loss": 0.5843, "step": 500 }, { "epoch": 30.0, "learning_rate": 9.998090452261307e-06, "loss": 0.5647, "step": 525 }, { "epoch": 32.0, "learning_rate": 9.995577889447236e-06, "loss": 0.5265, "step": 550 }, { "epoch": 33.0, "learning_rate": 9.993065326633167e-06, "loss": 0.5325, "step": 575 }, { "epoch": 35.0, "learning_rate": 9.990552763819096e-06, "loss": 0.538, "step": 600 }, { "epoch": 36.0, "learning_rate": 9.988040201005026e-06, "loss": 0.5602, "step": 625 }, { "epoch": 38.0, "learning_rate": 9.985527638190957e-06, "loss": 0.452, "step": 650 }, { "epoch": 39.0, "learning_rate": 9.983015075376884e-06, "loss": 0.5076, "step": 675 }, { "epoch": 41.0, "learning_rate": 9.980502512562815e-06, "loss": 0.4914, "step": 700 }, { "epoch": 42.0, "learning_rate": 9.977989949748745e-06, "loss": 0.4673, "step": 725 }, { "epoch": 44.0, "learning_rate": 9.975477386934674e-06, "loss": 0.4592, "step": 750 }, { "epoch": 45.0, "learning_rate": 9.972964824120603e-06, "loss": 0.4522, "step": 775 }, { "epoch": 47.0, "learning_rate": 9.970452261306533e-06, "loss": 0.4662, "step": 800 }, { "epoch": 48.0, "learning_rate": 9.967939698492464e-06, "loss": 0.4188, "step": 825 }, { "epoch": 49.0, "learning_rate": 9.965427135678393e-06, "loss": 0.4918, "step": 850 }, { "epoch": 51.0, "learning_rate": 9.962914572864322e-06, "loss": 0.47, "step": 875 }, { "epoch": 52.0, "learning_rate": 9.960402010050252e-06, "loss": 0.4264, "step": 900 }, { "epoch": 54.0, "learning_rate": 9.957889447236183e-06, "loss": 0.4124, "step": 925 }, { "epoch": 55.0, "learning_rate": 9.95537688442211e-06, "loss": 0.4518, "step": 950 }, { "epoch": 57.0, "learning_rate": 9.952864321608041e-06, "loss": 0.3216, "step": 975 }, { "epoch": 58.0, "learning_rate": 9.95035175879397e-06, "loss": 0.4665, "step": 1000 }, { "epoch": 58.0, "eval_loss": 0.8571563959121704, "eval_runtime": 165.1074, "eval_samples_per_second": 0.606, "eval_steps_per_second": 0.103, "eval_wer": 54.51428571428571, "step": 1000 }, { "epoch": 60.0, "learning_rate": 9.9478391959799e-06, "loss": 0.3487, "step": 1025 }, { "epoch": 61.0, "learning_rate": 9.945326633165831e-06, "loss": 0.3766, "step": 1050 }, { "epoch": 63.0, "learning_rate": 9.942814070351759e-06, "loss": 0.37, "step": 1075 }, { "epoch": 64.0, "learning_rate": 9.94030150753769e-06, "loss": 0.4059, "step": 1100 }, { "epoch": 66.0, "learning_rate": 9.937788944723619e-06, "loss": 0.3836, "step": 1125 }, { "epoch": 67.0, "learning_rate": 9.935276381909548e-06, "loss": 0.3833, "step": 1150 }, { "epoch": 69.0, "learning_rate": 9.932763819095478e-06, "loss": 0.3921, "step": 1175 }, { "epoch": 70.0, "learning_rate": 9.930251256281409e-06, "loss": 0.3567, "step": 1200 }, { "epoch": 72.0, "learning_rate": 9.927738693467336e-06, "loss": 0.3847, "step": 1225 }, { "epoch": 73.0, "learning_rate": 9.925226130653267e-06, "loss": 0.3763, "step": 1250 }, { "epoch": 74.0, "learning_rate": 9.922713567839197e-06, "loss": 0.3587, "step": 1275 }, { "epoch": 76.0, "learning_rate": 9.920201005025126e-06, "loss": 0.3617, "step": 1300 }, { "epoch": 77.0, "learning_rate": 9.917688442211057e-06, "loss": 0.4359, "step": 1325 }, { "epoch": 79.0, "learning_rate": 9.915175879396985e-06, "loss": 0.3303, "step": 1350 }, { "epoch": 80.0, "learning_rate": 9.912663316582916e-06, "loss": 0.3663, "step": 1375 }, { "epoch": 82.0, "learning_rate": 9.910150753768845e-06, "loss": 0.3584, "step": 1400 }, { "epoch": 83.0, "learning_rate": 9.907638190954774e-06, "loss": 0.3259, "step": 1425 }, { "epoch": 85.0, "learning_rate": 9.905125628140704e-06, "loss": 0.3477, "step": 1450 }, { "epoch": 86.0, "learning_rate": 9.902613065326635e-06, "loss": 0.3291, "step": 1475 }, { "epoch": 88.0, "learning_rate": 9.900100502512564e-06, "loss": 0.3484, "step": 1500 }, { "epoch": 89.0, "learning_rate": 9.897587939698493e-06, "loss": 0.3507, "step": 1525 }, { "epoch": 91.0, "learning_rate": 9.895075376884423e-06, "loss": 0.3338, "step": 1550 }, { "epoch": 92.0, "learning_rate": 9.892562814070352e-06, "loss": 0.3212, "step": 1575 }, { "epoch": 94.0, "learning_rate": 9.890050251256283e-06, "loss": 0.3328, "step": 1600 }, { "epoch": 95.0, "learning_rate": 9.88753768844221e-06, "loss": 0.3458, "step": 1625 }, { "epoch": 97.0, "learning_rate": 9.885025125628142e-06, "loss": 0.3244, "step": 1650 }, { "epoch": 98.0, "learning_rate": 9.882512562814071e-06, "loss": 0.3031, "step": 1675 }, { "epoch": 99.0, "learning_rate": 9.88e-06, "loss": 0.2855, "step": 1700 }, { "epoch": 101.0, "learning_rate": 9.877487437185931e-06, "loss": 0.3053, "step": 1725 }, { "epoch": 102.0, "learning_rate": 9.87497487437186e-06, "loss": 0.2852, "step": 1750 }, { "epoch": 104.0, "learning_rate": 9.87246231155779e-06, "loss": 0.3005, "step": 1775 }, { "epoch": 105.0, "learning_rate": 9.86994974874372e-06, "loss": 0.2694, "step": 1800 }, { "epoch": 107.0, "learning_rate": 9.867437185929649e-06, "loss": 0.3108, "step": 1825 }, { "epoch": 108.0, "learning_rate": 9.864924623115578e-06, "loss": 0.3181, "step": 1850 }, { "epoch": 110.0, "learning_rate": 9.862412060301509e-06, "loss": 0.3041, "step": 1875 }, { "epoch": 111.0, "learning_rate": 9.859899497487438e-06, "loss": 0.2771, "step": 1900 }, { "epoch": 113.0, "learning_rate": 9.857386934673368e-06, "loss": 0.2606, "step": 1925 }, { "epoch": 114.0, "learning_rate": 9.854874371859297e-06, "loss": 0.2855, "step": 1950 }, { "epoch": 116.0, "learning_rate": 9.852361809045226e-06, "loss": 0.3042, "step": 1975 }, { "epoch": 117.0, "learning_rate": 9.849849246231157e-06, "loss": 0.3041, "step": 2000 }, { "epoch": 117.0, "eval_loss": 0.6711387038230896, "eval_runtime": 164.9213, "eval_samples_per_second": 0.606, "eval_steps_per_second": 0.103, "eval_wer": 44.114285714285714, "step": 2000 }, { "epoch": 119.0, "learning_rate": 9.847336683417087e-06, "loss": 0.2787, "step": 2025 }, { "epoch": 120.0, "learning_rate": 9.844824120603016e-06, "loss": 0.2585, "step": 2050 }, { "epoch": 122.0, "learning_rate": 9.842311557788945e-06, "loss": 0.2888, "step": 2075 }, { "epoch": 123.0, "learning_rate": 9.839798994974875e-06, "loss": 0.3042, "step": 2100 }, { "epoch": 124.0, "learning_rate": 9.837286432160806e-06, "loss": 0.3037, "step": 2125 }, { "epoch": 126.0, "learning_rate": 9.834773869346735e-06, "loss": 0.2795, "step": 2150 }, { "epoch": 127.0, "learning_rate": 9.832361809045226e-06, "loss": 0.2827, "step": 2175 }, { "epoch": 129.0, "learning_rate": 9.829849246231157e-06, "loss": 0.2673, "step": 2200 }, { "epoch": 130.0, "learning_rate": 9.827336683417085e-06, "loss": 0.2674, "step": 2225 }, { "epoch": 132.0, "learning_rate": 9.824824120603016e-06, "loss": 0.3057, "step": 2250 }, { "epoch": 133.0, "learning_rate": 9.822311557788945e-06, "loss": 0.2774, "step": 2275 }, { "epoch": 135.0, "learning_rate": 9.819798994974875e-06, "loss": 0.2836, "step": 2300 }, { "epoch": 136.0, "learning_rate": 9.817286432160806e-06, "loss": 0.2923, "step": 2325 }, { "epoch": 138.0, "learning_rate": 9.814773869346735e-06, "loss": 0.281, "step": 2350 }, { "epoch": 139.0, "learning_rate": 9.812261306532664e-06, "loss": 0.2471, "step": 2375 }, { "epoch": 141.0, "learning_rate": 9.809748743718594e-06, "loss": 0.2123, "step": 2400 }, { "epoch": 142.0, "learning_rate": 9.807236180904523e-06, "loss": 0.2544, "step": 2425 }, { "epoch": 144.0, "learning_rate": 9.804723618090452e-06, "loss": 0.2513, "step": 2450 }, { "epoch": 145.0, "learning_rate": 9.802211055276383e-06, "loss": 0.2633, "step": 2475 }, { "epoch": 147.0, "learning_rate": 9.799698492462313e-06, "loss": 0.2559, "step": 2500 }, { "epoch": 148.0, "learning_rate": 9.797185929648242e-06, "loss": 0.2665, "step": 2525 }, { "epoch": 149.0, "learning_rate": 9.794673366834171e-06, "loss": 0.2696, "step": 2550 }, { "epoch": 151.0, "learning_rate": 9.7921608040201e-06, "loss": 0.2586, "step": 2575 }, { "epoch": 152.0, "learning_rate": 9.789648241206032e-06, "loss": 0.2739, "step": 2600 }, { "epoch": 154.0, "learning_rate": 9.787135678391961e-06, "loss": 0.2554, "step": 2625 }, { "epoch": 155.0, "learning_rate": 9.78462311557789e-06, "loss": 0.2633, "step": 2650 }, { "epoch": 157.0, "learning_rate": 9.78211055276382e-06, "loss": 0.2505, "step": 2675 }, { "epoch": 158.0, "learning_rate": 9.779597989949749e-06, "loss": 0.2233, "step": 2700 }, { "epoch": 160.0, "learning_rate": 9.77708542713568e-06, "loss": 0.2772, "step": 2725 }, { "epoch": 161.0, "learning_rate": 9.77457286432161e-06, "loss": 0.2636, "step": 2750 }, { "epoch": 163.0, "learning_rate": 9.772060301507539e-06, "loss": 0.2542, "step": 2775 }, { "epoch": 164.0, "learning_rate": 9.769547738693468e-06, "loss": 0.2581, "step": 2800 }, { "epoch": 166.0, "learning_rate": 9.767035175879397e-06, "loss": 0.2424, "step": 2825 }, { "epoch": 167.0, "learning_rate": 9.764522613065327e-06, "loss": 0.2132, "step": 2850 }, { "epoch": 169.0, "learning_rate": 9.762010050251258e-06, "loss": 0.2484, "step": 2875 }, { "epoch": 170.0, "learning_rate": 9.759497487437187e-06, "loss": 0.2725, "step": 2900 }, { "epoch": 172.0, "learning_rate": 9.756984924623116e-06, "loss": 0.2332, "step": 2925 }, { "epoch": 173.0, "learning_rate": 9.754472361809047e-06, "loss": 0.2406, "step": 2950 }, { "epoch": 174.0, "learning_rate": 9.751959798994975e-06, "loss": 0.2219, "step": 2975 }, { "epoch": 176.0, "learning_rate": 9.749447236180906e-06, "loss": 0.2671, "step": 3000 }, { "epoch": 176.0, "eval_loss": 0.5794399380683899, "eval_runtime": 162.3092, "eval_samples_per_second": 0.616, "eval_steps_per_second": 0.105, "eval_wer": 39.77142857142857, "step": 3000 }, { "epoch": 177.0, "learning_rate": 9.746934673366835e-06, "loss": 0.226, "step": 3025 }, { "epoch": 179.0, "learning_rate": 9.744422110552765e-06, "loss": 0.2177, "step": 3050 }, { "epoch": 180.0, "learning_rate": 9.741909547738694e-06, "loss": 0.2655, "step": 3075 }, { "epoch": 182.0, "learning_rate": 9.739396984924623e-06, "loss": 0.2247, "step": 3100 }, { "epoch": 183.0, "learning_rate": 9.736884422110554e-06, "loss": 0.2196, "step": 3125 }, { "epoch": 185.0, "learning_rate": 9.734371859296484e-06, "loss": 0.2217, "step": 3150 }, { "epoch": 186.0, "learning_rate": 9.731859296482413e-06, "loss": 0.2382, "step": 3175 }, { "epoch": 188.0, "learning_rate": 9.729346733668342e-06, "loss": 0.2313, "step": 3200 }, { "epoch": 189.0, "learning_rate": 9.726834170854273e-06, "loss": 0.2327, "step": 3225 }, { "epoch": 191.0, "learning_rate": 9.724321608040201e-06, "loss": 0.2413, "step": 3250 }, { "epoch": 192.0, "learning_rate": 9.721809045226132e-06, "loss": 0.2128, "step": 3275 }, { "epoch": 194.0, "learning_rate": 9.719296482412061e-06, "loss": 0.2211, "step": 3300 }, { "epoch": 195.0, "learning_rate": 9.71678391959799e-06, "loss": 0.249, "step": 3325 }, { "epoch": 197.0, "learning_rate": 9.714271356783922e-06, "loss": 0.2273, "step": 3350 }, { "epoch": 198.0, "learning_rate": 9.71175879396985e-06, "loss": 0.2484, "step": 3375 }, { "epoch": 199.0, "learning_rate": 9.70924623115578e-06, "loss": 0.2278, "step": 3400 }, { "epoch": 201.0, "learning_rate": 9.70673366834171e-06, "loss": 0.2113, "step": 3425 }, { "epoch": 202.0, "learning_rate": 9.704221105527639e-06, "loss": 0.2757, "step": 3450 }, { "epoch": 204.0, "learning_rate": 9.701708542713568e-06, "loss": 0.2353, "step": 3475 }, { "epoch": 205.0, "learning_rate": 9.6991959798995e-06, "loss": 0.2114, "step": 3500 }, { "epoch": 207.0, "learning_rate": 9.696683417085427e-06, "loss": 0.2331, "step": 3525 }, { "epoch": 208.0, "learning_rate": 9.694170854271358e-06, "loss": 0.2456, "step": 3550 }, { "epoch": 210.0, "learning_rate": 9.691658291457287e-06, "loss": 0.1981, "step": 3575 }, { "epoch": 211.0, "learning_rate": 9.689145728643216e-06, "loss": 0.21, "step": 3600 }, { "epoch": 213.0, "learning_rate": 9.686633165829147e-06, "loss": 0.1837, "step": 3625 }, { "epoch": 214.0, "learning_rate": 9.684120603015075e-06, "loss": 0.2097, "step": 3650 }, { "epoch": 216.0, "learning_rate": 9.681608040201006e-06, "loss": 0.2427, "step": 3675 }, { "epoch": 217.0, "learning_rate": 9.679095477386935e-06, "loss": 0.232, "step": 3700 }, { "epoch": 219.0, "learning_rate": 9.676582914572865e-06, "loss": 0.197, "step": 3725 }, { "epoch": 220.0, "learning_rate": 9.674070351758796e-06, "loss": 0.2129, "step": 3750 }, { "epoch": 222.0, "learning_rate": 9.671557788944725e-06, "loss": 0.2091, "step": 3775 }, { "epoch": 223.0, "learning_rate": 9.669045226130654e-06, "loss": 0.2113, "step": 3800 }, { "epoch": 224.0, "learning_rate": 9.666532663316584e-06, "loss": 0.2063, "step": 3825 }, { "epoch": 226.0, "learning_rate": 9.664020100502513e-06, "loss": 0.1989, "step": 3850 }, { "epoch": 227.0, "learning_rate": 9.661507537688442e-06, "loss": 0.2254, "step": 3875 }, { "epoch": 229.0, "learning_rate": 9.658994974874373e-06, "loss": 0.2313, "step": 3900 }, { "epoch": 230.0, "learning_rate": 9.656482412060301e-06, "loss": 0.2248, "step": 3925 }, { "epoch": 232.0, "learning_rate": 9.653969849246232e-06, "loss": 0.2086, "step": 3950 }, { "epoch": 233.0, "learning_rate": 9.651457286432161e-06, "loss": 0.203, "step": 3975 }, { "epoch": 235.0, "learning_rate": 9.64894472361809e-06, "loss": 0.1761, "step": 4000 }, { "epoch": 235.0, "eval_loss": 0.535667359828949, "eval_runtime": 210.1723, "eval_samples_per_second": 0.476, "eval_steps_per_second": 0.081, "eval_wer": 35.08571428571429, "step": 4000 }, { "epoch": 236.0, "learning_rate": 9.646432160804022e-06, "loss": 0.232, "step": 4025 }, { "epoch": 238.0, "learning_rate": 9.643919597989951e-06, "loss": 0.1995, "step": 4050 }, { "epoch": 239.0, "learning_rate": 9.64140703517588e-06, "loss": 0.2043, "step": 4075 }, { "epoch": 241.0, "learning_rate": 9.63889447236181e-06, "loss": 0.2277, "step": 4100 }, { "epoch": 242.0, "learning_rate": 9.636381909547739e-06, "loss": 0.1835, "step": 4125 }, { "epoch": 244.0, "learning_rate": 9.633869346733668e-06, "loss": 0.2138, "step": 4150 }, { "epoch": 245.0, "learning_rate": 9.6313567839196e-06, "loss": 0.1873, "step": 4175 }, { "epoch": 247.0, "learning_rate": 9.628844221105529e-06, "loss": 0.1617, "step": 4200 }, { "epoch": 248.0, "learning_rate": 9.626331658291458e-06, "loss": 0.2099, "step": 4225 }, { "epoch": 249.0, "learning_rate": 9.623819095477387e-06, "loss": 0.1922, "step": 4250 }, { "epoch": 251.0, "learning_rate": 9.621306532663317e-06, "loss": 0.1679, "step": 4275 }, { "epoch": 252.0, "learning_rate": 9.618793969849248e-06, "loss": 0.2071, "step": 4300 }, { "epoch": 254.0, "learning_rate": 9.616281407035177e-06, "loss": 0.1833, "step": 4325 }, { "epoch": 255.0, "learning_rate": 9.613768844221106e-06, "loss": 0.174, "step": 4350 }, { "epoch": 257.0, "learning_rate": 9.611256281407036e-06, "loss": 0.2016, "step": 4375 }, { "epoch": 258.0, "learning_rate": 9.608743718592965e-06, "loss": 0.1913, "step": 4400 }, { "epoch": 260.0, "learning_rate": 9.606231155778896e-06, "loss": 0.1856, "step": 4425 }, { "epoch": 261.0, "learning_rate": 9.603718592964825e-06, "loss": 0.163, "step": 4450 }, { "epoch": 263.0, "learning_rate": 9.601206030150755e-06, "loss": 0.1832, "step": 4475 }, { "epoch": 264.0, "learning_rate": 9.598693467336684e-06, "loss": 0.1713, "step": 4500 }, { "epoch": 266.0, "learning_rate": 9.596180904522613e-06, "loss": 0.1764, "step": 4525 }, { "epoch": 267.0, "learning_rate": 9.593668341708543e-06, "loss": 0.2293, "step": 4550 }, { "epoch": 269.0, "learning_rate": 9.591155778894474e-06, "loss": 0.1771, "step": 4575 }, { "epoch": 270.0, "learning_rate": 9.588643216080403e-06, "loss": 0.1905, "step": 4600 }, { "epoch": 272.0, "learning_rate": 9.586130653266332e-06, "loss": 0.2026, "step": 4625 }, { "epoch": 273.0, "learning_rate": 9.583618090452262e-06, "loss": 0.2088, "step": 4650 }, { "epoch": 274.0, "learning_rate": 9.581105527638191e-06, "loss": 0.1932, "step": 4675 }, { "epoch": 276.0, "learning_rate": 9.578592964824122e-06, "loss": 0.1722, "step": 4700 }, { "epoch": 277.0, "learning_rate": 9.576080402010051e-06, "loss": 0.1677, "step": 4725 }, { "epoch": 279.0, "learning_rate": 9.57356783919598e-06, "loss": 0.1804, "step": 4750 }, { "epoch": 280.0, "learning_rate": 9.57105527638191e-06, "loss": 0.1818, "step": 4775 }, { "epoch": 282.0, "learning_rate": 9.56854271356784e-06, "loss": 0.1565, "step": 4800 }, { "epoch": 283.0, "learning_rate": 9.56603015075377e-06, "loss": 0.1874, "step": 4825 }, { "epoch": 285.0, "learning_rate": 9.5635175879397e-06, "loss": 0.1459, "step": 4850 }, { "epoch": 286.0, "learning_rate": 9.561005025125629e-06, "loss": 0.1823, "step": 4875 }, { "epoch": 288.0, "learning_rate": 9.558492462311558e-06, "loss": 0.1869, "step": 4900 }, { "epoch": 289.0, "learning_rate": 9.555979899497488e-06, "loss": 0.2153, "step": 4925 }, { "epoch": 291.0, "learning_rate": 9.553467336683417e-06, "loss": 0.1732, "step": 4950 }, { "epoch": 292.0, "learning_rate": 9.550954773869348e-06, "loss": 0.198, "step": 4975 }, { "epoch": 294.0, "learning_rate": 9.548442211055277e-06, "loss": 0.2089, "step": 5000 }, { "epoch": 294.0, "eval_loss": 0.5094332695007324, "eval_runtime": 162.9376, "eval_samples_per_second": 0.614, "eval_steps_per_second": 0.104, "eval_wer": 33.6, "step": 5000 }, { "epoch": 295.0, "learning_rate": 9.545929648241207e-06, "loss": 0.1648, "step": 5025 }, { "epoch": 297.0, "learning_rate": 9.543417085427138e-06, "loss": 0.1626, "step": 5050 }, { "epoch": 298.0, "learning_rate": 9.540904522613065e-06, "loss": 0.1386, "step": 5075 }, { "epoch": 299.0, "learning_rate": 9.538391959798996e-06, "loss": 0.1748, "step": 5100 }, { "epoch": 301.0, "learning_rate": 9.535879396984926e-06, "loss": 0.1662, "step": 5125 }, { "epoch": 302.0, "learning_rate": 9.533366834170855e-06, "loss": 0.1414, "step": 5150 }, { "epoch": 304.0, "learning_rate": 9.530854271356784e-06, "loss": 0.1734, "step": 5175 }, { "epoch": 305.0, "learning_rate": 9.528341708542715e-06, "loss": 0.1716, "step": 5200 }, { "epoch": 307.0, "learning_rate": 9.525829145728645e-06, "loss": 0.1866, "step": 5225 }, { "epoch": 308.0, "learning_rate": 9.523316582914574e-06, "loss": 0.2092, "step": 5250 }, { "epoch": 310.0, "learning_rate": 9.520804020100503e-06, "loss": 0.1768, "step": 5275 }, { "epoch": 311.0, "learning_rate": 9.518291457286432e-06, "loss": 0.1907, "step": 5300 }, { "epoch": 313.0, "learning_rate": 9.515778894472363e-06, "loss": 0.1788, "step": 5325 }, { "epoch": 314.0, "learning_rate": 9.513266331658291e-06, "loss": 0.1621, "step": 5350 }, { "epoch": 316.0, "learning_rate": 9.510753768844222e-06, "loss": 0.1605, "step": 5375 }, { "epoch": 317.0, "learning_rate": 9.508241206030151e-06, "loss": 0.1547, "step": 5400 }, { "epoch": 319.0, "learning_rate": 9.50572864321608e-06, "loss": 0.1641, "step": 5425 }, { "epoch": 320.0, "learning_rate": 9.503216080402012e-06, "loss": 0.1775, "step": 5450 }, { "epoch": 322.0, "learning_rate": 9.500703517587941e-06, "loss": 0.1588, "step": 5475 }, { "epoch": 323.0, "learning_rate": 9.49819095477387e-06, "loss": 0.1776, "step": 5500 }, { "epoch": 324.0, "learning_rate": 9.4956783919598e-06, "loss": 0.1506, "step": 5525 }, { "epoch": 326.0, "learning_rate": 9.493165829145729e-06, "loss": 0.178, "step": 5550 }, { "epoch": 327.0, "learning_rate": 9.490653266331658e-06, "loss": 0.189, "step": 5575 }, { "epoch": 329.0, "learning_rate": 9.48814070351759e-06, "loss": 0.1408, "step": 5600 }, { "epoch": 330.0, "learning_rate": 9.485628140703519e-06, "loss": 0.1475, "step": 5625 }, { "epoch": 332.0, "learning_rate": 9.483115577889448e-06, "loss": 0.1762, "step": 5650 }, { "epoch": 333.0, "learning_rate": 9.480603015075377e-06, "loss": 0.1409, "step": 5675 }, { "epoch": 335.0, "learning_rate": 9.478090452261307e-06, "loss": 0.1727, "step": 5700 }, { "epoch": 336.0, "learning_rate": 9.475577889447238e-06, "loss": 0.1595, "step": 5725 }, { "epoch": 338.0, "learning_rate": 9.473065326633167e-06, "loss": 0.1666, "step": 5750 }, { "epoch": 339.0, "learning_rate": 9.470552763819096e-06, "loss": 0.1483, "step": 5775 }, { "epoch": 341.0, "learning_rate": 9.468040201005026e-06, "loss": 0.1597, "step": 5800 }, { "epoch": 342.0, "learning_rate": 9.465527638190955e-06, "loss": 0.1763, "step": 5825 }, { "epoch": 344.0, "learning_rate": 9.463015075376886e-06, "loss": 0.1624, "step": 5850 }, { "epoch": 345.0, "learning_rate": 9.460502512562815e-06, "loss": 0.1477, "step": 5875 }, { "epoch": 347.0, "learning_rate": 9.457989949748745e-06, "loss": 0.1095, "step": 5900 }, { "epoch": 348.0, "learning_rate": 9.455477386934674e-06, "loss": 0.1632, "step": 5925 }, { "epoch": 349.0, "learning_rate": 9.452964824120603e-06, "loss": 0.1747, "step": 5950 }, { "epoch": 351.0, "learning_rate": 9.450452261306533e-06, "loss": 0.1417, "step": 5975 }, { "epoch": 352.0, "learning_rate": 9.447939698492464e-06, "loss": 0.1456, "step": 6000 }, { "epoch": 352.0, "eval_loss": 0.4958537220954895, "eval_runtime": 163.3441, "eval_samples_per_second": 0.612, "eval_steps_per_second": 0.104, "eval_wer": 33.02857142857143, "step": 6000 }, { "epoch": 354.0, "learning_rate": 9.445427135678393e-06, "loss": 0.1644, "step": 6025 }, { "epoch": 355.0, "learning_rate": 9.442914572864322e-06, "loss": 0.1792, "step": 6050 }, { "epoch": 357.0, "learning_rate": 9.440402010050252e-06, "loss": 0.1406, "step": 6075 }, { "epoch": 358.0, "learning_rate": 9.437889447236181e-06, "loss": 0.1586, "step": 6100 }, { "epoch": 360.0, "learning_rate": 9.435376884422112e-06, "loss": 0.142, "step": 6125 }, { "epoch": 361.0, "learning_rate": 9.432864321608041e-06, "loss": 0.1502, "step": 6150 }, { "epoch": 363.0, "learning_rate": 9.43035175879397e-06, "loss": 0.1421, "step": 6175 }, { "epoch": 364.0, "learning_rate": 9.4278391959799e-06, "loss": 0.1626, "step": 6200 }, { "epoch": 366.0, "learning_rate": 9.42532663316583e-06, "loss": 0.1291, "step": 6225 }, { "epoch": 367.0, "learning_rate": 9.42281407035176e-06, "loss": 0.1466, "step": 6250 }, { "epoch": 369.0, "learning_rate": 9.42030150753769e-06, "loss": 0.1397, "step": 6275 }, { "epoch": 370.0, "learning_rate": 9.417788944723619e-06, "loss": 0.1323, "step": 6300 }, { "epoch": 372.0, "learning_rate": 9.415276381909548e-06, "loss": 0.1334, "step": 6325 }, { "epoch": 373.0, "learning_rate": 9.412763819095478e-06, "loss": 0.122, "step": 6350 }, { "epoch": 374.0, "learning_rate": 9.410251256281407e-06, "loss": 0.1424, "step": 6375 }, { "epoch": 376.0, "learning_rate": 9.407738693467338e-06, "loss": 0.1362, "step": 6400 }, { "epoch": 377.0, "learning_rate": 9.405226130653267e-06, "loss": 0.1511, "step": 6425 }, { "epoch": 379.0, "learning_rate": 9.402713567839197e-06, "loss": 0.1558, "step": 6450 }, { "epoch": 380.0, "learning_rate": 9.400201005025128e-06, "loss": 0.1388, "step": 6475 }, { "epoch": 382.0, "learning_rate": 9.397688442211055e-06, "loss": 0.1663, "step": 6500 }, { "epoch": 383.0, "learning_rate": 9.395175879396986e-06, "loss": 0.1546, "step": 6525 }, { "epoch": 385.0, "learning_rate": 9.392663316582916e-06, "loss": 0.133, "step": 6550 }, { "epoch": 386.0, "learning_rate": 9.390150753768845e-06, "loss": 0.1339, "step": 6575 }, { "epoch": 388.0, "learning_rate": 9.387638190954774e-06, "loss": 0.1449, "step": 6600 }, { "epoch": 389.0, "learning_rate": 9.385125628140704e-06, "loss": 0.1602, "step": 6625 }, { "epoch": 391.0, "learning_rate": 9.382613065326633e-06, "loss": 0.1502, "step": 6650 }, { "epoch": 392.0, "learning_rate": 9.380100502512564e-06, "loss": 0.1215, "step": 6675 }, { "epoch": 394.0, "learning_rate": 9.377587939698493e-06, "loss": 0.1449, "step": 6700 }, { "epoch": 395.0, "learning_rate": 9.375075376884423e-06, "loss": 0.1323, "step": 6725 }, { "epoch": 397.0, "learning_rate": 9.372562814070354e-06, "loss": 0.1268, "step": 6750 }, { "epoch": 398.0, "learning_rate": 9.370050251256281e-06, "loss": 0.1407, "step": 6775 }, { "epoch": 399.0, "learning_rate": 9.367537688442212e-06, "loss": 0.1526, "step": 6800 }, { "epoch": 401.0, "learning_rate": 9.365025125628142e-06, "loss": 0.1348, "step": 6825 }, { "epoch": 402.0, "learning_rate": 9.36251256281407e-06, "loss": 0.1204, "step": 6850 }, { "epoch": 404.0, "learning_rate": 9.360000000000002e-06, "loss": 0.178, "step": 6875 }, { "epoch": 405.0, "learning_rate": 9.35748743718593e-06, "loss": 0.1453, "step": 6900 }, { "epoch": 407.0, "learning_rate": 9.35497487437186e-06, "loss": 0.1491, "step": 6925 }, { "epoch": 408.0, "learning_rate": 9.35246231155779e-06, "loss": 0.1152, "step": 6950 }, { "epoch": 410.0, "learning_rate": 9.34994974874372e-06, "loss": 0.1186, "step": 6975 }, { "epoch": 411.0, "learning_rate": 9.347437185929648e-06, "loss": 0.1514, "step": 7000 }, { "epoch": 411.0, "eval_loss": 0.48641833662986755, "eval_runtime": 160.6543, "eval_samples_per_second": 0.622, "eval_steps_per_second": 0.106, "eval_wer": 32.57142857142858, "step": 7000 }, { "epoch": 413.0, "learning_rate": 9.34492462311558e-06, "loss": 0.1398, "step": 7025 }, { "epoch": 414.0, "learning_rate": 9.342412060301507e-06, "loss": 0.1329, "step": 7050 }, { "epoch": 416.0, "learning_rate": 9.339899497487438e-06, "loss": 0.143, "step": 7075 }, { "epoch": 417.0, "learning_rate": 9.337386934673367e-06, "loss": 0.1271, "step": 7100 }, { "epoch": 419.0, "learning_rate": 9.334874371859297e-06, "loss": 0.1312, "step": 7125 }, { "epoch": 420.0, "learning_rate": 9.332361809045228e-06, "loss": 0.1321, "step": 7150 }, { "epoch": 422.0, "learning_rate": 9.329849246231157e-06, "loss": 0.1194, "step": 7175 }, { "epoch": 423.0, "learning_rate": 9.327336683417086e-06, "loss": 0.1436, "step": 7200 }, { "epoch": 424.0, "learning_rate": 9.324824120603016e-06, "loss": 0.133, "step": 7225 }, { "epoch": 426.0, "learning_rate": 9.322311557788945e-06, "loss": 0.1231, "step": 7250 }, { "epoch": 427.0, "learning_rate": 9.319798994974874e-06, "loss": 0.1253, "step": 7275 }, { "epoch": 429.0, "learning_rate": 9.317286432160805e-06, "loss": 0.118, "step": 7300 }, { "epoch": 430.0, "learning_rate": 9.314773869346735e-06, "loss": 0.1344, "step": 7325 }, { "epoch": 432.0, "learning_rate": 9.312261306532664e-06, "loss": 0.1462, "step": 7350 }, { "epoch": 433.0, "learning_rate": 9.309748743718593e-06, "loss": 0.1295, "step": 7375 }, { "epoch": 435.0, "learning_rate": 9.307236180904523e-06, "loss": 0.1222, "step": 7400 }, { "epoch": 436.0, "learning_rate": 9.304723618090454e-06, "loss": 0.1082, "step": 7425 }, { "epoch": 438.0, "learning_rate": 9.302211055276383e-06, "loss": 0.1268, "step": 7450 }, { "epoch": 439.0, "learning_rate": 9.299698492462312e-06, "loss": 0.1284, "step": 7475 }, { "epoch": 441.0, "learning_rate": 9.297185929648242e-06, "loss": 0.1198, "step": 7500 }, { "epoch": 442.0, "learning_rate": 9.294673366834171e-06, "loss": 0.1407, "step": 7525 }, { "epoch": 444.0, "learning_rate": 9.292160804020102e-06, "loss": 0.1041, "step": 7550 }, { "epoch": 445.0, "learning_rate": 9.289648241206031e-06, "loss": 0.1377, "step": 7575 }, { "epoch": 447.0, "learning_rate": 9.28713567839196e-06, "loss": 0.1112, "step": 7600 }, { "epoch": 448.0, "learning_rate": 9.28462311557789e-06, "loss": 0.1255, "step": 7625 }, { "epoch": 449.0, "learning_rate": 9.28211055276382e-06, "loss": 0.1217, "step": 7650 }, { "epoch": 451.0, "learning_rate": 9.279597989949749e-06, "loss": 0.123, "step": 7675 }, { "epoch": 452.0, "learning_rate": 9.27708542713568e-06, "loss": 0.1138, "step": 7700 }, { "epoch": 454.0, "learning_rate": 9.274572864321609e-06, "loss": 0.1299, "step": 7725 }, { "epoch": 455.0, "learning_rate": 9.272060301507538e-06, "loss": 0.1116, "step": 7750 }, { "epoch": 457.0, "learning_rate": 9.269547738693468e-06, "loss": 0.1091, "step": 7775 }, { "epoch": 458.0, "learning_rate": 9.267035175879397e-06, "loss": 0.1213, "step": 7800 }, { "epoch": 460.0, "learning_rate": 9.264522613065328e-06, "loss": 0.1116, "step": 7825 }, { "epoch": 461.0, "learning_rate": 9.262010050251257e-06, "loss": 0.1131, "step": 7850 }, { "epoch": 463.0, "learning_rate": 9.259497487437187e-06, "loss": 0.1023, "step": 7875 }, { "epoch": 464.0, "learning_rate": 9.256984924623116e-06, "loss": 0.1104, "step": 7900 }, { "epoch": 466.0, "learning_rate": 9.254472361809045e-06, "loss": 0.1332, "step": 7925 }, { "epoch": 467.0, "learning_rate": 9.252060301507539e-06, "loss": 0.1208, "step": 7950 }, { "epoch": 469.0, "learning_rate": 9.249547738693468e-06, "loss": 0.1137, "step": 7975 }, { "epoch": 470.0, "learning_rate": 9.247035175879397e-06, "loss": 0.1203, "step": 8000 }, { "epoch": 470.0, "eval_loss": 0.46249741315841675, "eval_runtime": 163.8093, "eval_samples_per_second": 0.61, "eval_steps_per_second": 0.104, "eval_wer": 31.428571428571427, "step": 8000 }, { "epoch": 472.0, "learning_rate": 9.244522613065328e-06, "loss": 0.124, "step": 8025 }, { "epoch": 473.0, "learning_rate": 9.242010050251256e-06, "loss": 0.1052, "step": 8050 }, { "epoch": 474.0, "learning_rate": 9.239497487437187e-06, "loss": 0.1253, "step": 8075 }, { "epoch": 476.0, "learning_rate": 9.236984924623116e-06, "loss": 0.1049, "step": 8100 }, { "epoch": 477.0, "learning_rate": 9.234472361809045e-06, "loss": 0.137, "step": 8125 }, { "epoch": 479.0, "learning_rate": 9.231959798994977e-06, "loss": 0.0997, "step": 8150 }, { "epoch": 480.0, "learning_rate": 9.229447236180906e-06, "loss": 0.0951, "step": 8175 }, { "epoch": 482.0, "learning_rate": 9.226934673366835e-06, "loss": 0.1213, "step": 8200 }, { "epoch": 483.0, "learning_rate": 9.224422110552764e-06, "loss": 0.1067, "step": 8225 }, { "epoch": 485.0, "learning_rate": 9.221909547738694e-06, "loss": 0.1041, "step": 8250 }, { "epoch": 486.0, "learning_rate": 9.219396984924623e-06, "loss": 0.1202, "step": 8275 }, { "epoch": 488.0, "learning_rate": 9.216884422110554e-06, "loss": 0.1067, "step": 8300 }, { "epoch": 489.0, "learning_rate": 9.214371859296483e-06, "loss": 0.1175, "step": 8325 }, { "epoch": 491.0, "learning_rate": 9.211859296482413e-06, "loss": 0.1185, "step": 8350 }, { "epoch": 492.0, "learning_rate": 9.209346733668342e-06, "loss": 0.1138, "step": 8375 }, { "epoch": 494.0, "learning_rate": 9.206834170854271e-06, "loss": 0.1237, "step": 8400 }, { "epoch": 495.0, "learning_rate": 9.204321608040202e-06, "loss": 0.1074, "step": 8425 }, { "epoch": 497.0, "learning_rate": 9.201809045226132e-06, "loss": 0.1187, "step": 8450 }, { "epoch": 498.0, "learning_rate": 9.199296482412061e-06, "loss": 0.1018, "step": 8475 }, { "epoch": 499.0, "learning_rate": 9.19678391959799e-06, "loss": 0.0919, "step": 8500 }, { "epoch": 501.0, "learning_rate": 9.19427135678392e-06, "loss": 0.1053, "step": 8525 }, { "epoch": 502.0, "learning_rate": 9.19175879396985e-06, "loss": 0.1108, "step": 8550 }, { "epoch": 504.0, "learning_rate": 9.18924623115578e-06, "loss": 0.1041, "step": 8575 }, { "epoch": 505.0, "learning_rate": 9.18673366834171e-06, "loss": 0.1093, "step": 8600 }, { "epoch": 507.0, "learning_rate": 9.184221105527639e-06, "loss": 0.1138, "step": 8625 }, { "epoch": 508.0, "learning_rate": 9.181708542713568e-06, "loss": 0.1106, "step": 8650 }, { "epoch": 510.0, "learning_rate": 9.179195979899497e-06, "loss": 0.1017, "step": 8675 }, { "epoch": 511.0, "learning_rate": 9.176683417085428e-06, "loss": 0.0919, "step": 8700 }, { "epoch": 513.0, "learning_rate": 9.174170854271358e-06, "loss": 0.0934, "step": 8725 }, { "epoch": 514.0, "learning_rate": 9.171658291457287e-06, "loss": 0.116, "step": 8750 }, { "epoch": 516.0, "learning_rate": 9.169145728643218e-06, "loss": 0.1109, "step": 8775 }, { "epoch": 517.0, "learning_rate": 9.166633165829146e-06, "loss": 0.1258, "step": 8800 }, { "epoch": 519.0, "learning_rate": 9.164120603015077e-06, "loss": 0.1127, "step": 8825 }, { "epoch": 520.0, "learning_rate": 9.161608040201006e-06, "loss": 0.1071, "step": 8850 }, { "epoch": 522.0, "learning_rate": 9.159095477386935e-06, "loss": 0.1217, "step": 8875 }, { "epoch": 523.0, "learning_rate": 9.156582914572865e-06, "loss": 0.1103, "step": 8900 }, { "epoch": 524.0, "learning_rate": 9.154070351758794e-06, "loss": 0.093, "step": 8925 }, { "epoch": 526.0, "learning_rate": 9.151557788944725e-06, "loss": 0.1135, "step": 8950 }, { "epoch": 527.0, "learning_rate": 9.149045226130654e-06, "loss": 0.1053, "step": 8975 }, { "epoch": 529.0, "learning_rate": 9.146532663316584e-06, "loss": 0.0879, "step": 9000 }, { "epoch": 529.0, "eval_loss": 0.4916209876537323, "eval_runtime": 196.2119, "eval_samples_per_second": 0.51, "eval_steps_per_second": 0.087, "eval_wer": 45.48571428571429, "step": 9000 }, { "epoch": 530.0, "learning_rate": 9.144020100502513e-06, "loss": 0.1171, "step": 9025 }, { "epoch": 532.0, "learning_rate": 9.141507537688444e-06, "loss": 0.1064, "step": 9050 }, { "epoch": 533.0, "learning_rate": 9.138994974874372e-06, "loss": 0.1004, "step": 9075 }, { "epoch": 535.0, "learning_rate": 9.136482412060303e-06, "loss": 0.1169, "step": 9100 }, { "epoch": 536.0, "learning_rate": 9.133969849246232e-06, "loss": 0.1209, "step": 9125 }, { "epoch": 538.0, "learning_rate": 9.131457286432161e-06, "loss": 0.1066, "step": 9150 }, { "epoch": 539.0, "learning_rate": 9.128944723618092e-06, "loss": 0.087, "step": 9175 }, { "epoch": 541.0, "learning_rate": 9.12643216080402e-06, "loss": 0.1087, "step": 9200 }, { "epoch": 542.0, "learning_rate": 9.123919597989951e-06, "loss": 0.0838, "step": 9225 }, { "epoch": 544.0, "learning_rate": 9.12140703517588e-06, "loss": 0.0927, "step": 9250 }, { "epoch": 545.0, "learning_rate": 9.11889447236181e-06, "loss": 0.0961, "step": 9275 }, { "epoch": 547.0, "learning_rate": 9.116381909547739e-06, "loss": 0.0901, "step": 9300 }, { "epoch": 548.0, "learning_rate": 9.11386934673367e-06, "loss": 0.096, "step": 9325 }, { "epoch": 549.0, "learning_rate": 9.111356783919598e-06, "loss": 0.0943, "step": 9350 }, { "epoch": 551.0, "learning_rate": 9.108844221105529e-06, "loss": 0.0974, "step": 9375 }, { "epoch": 552.0, "learning_rate": 9.106331658291458e-06, "loss": 0.1019, "step": 9400 }, { "epoch": 554.0, "learning_rate": 9.103819095477387e-06, "loss": 0.0902, "step": 9425 }, { "epoch": 555.0, "learning_rate": 9.101306532663318e-06, "loss": 0.1132, "step": 9450 }, { "epoch": 557.0, "learning_rate": 9.098793969849246e-06, "loss": 0.1115, "step": 9475 }, { "epoch": 558.0, "learning_rate": 9.096281407035177e-06, "loss": 0.0853, "step": 9500 }, { "epoch": 560.0, "learning_rate": 9.093768844221106e-06, "loss": 0.0806, "step": 9525 }, { "epoch": 561.0, "learning_rate": 9.091256281407036e-06, "loss": 0.0792, "step": 9550 }, { "epoch": 563.0, "learning_rate": 9.088743718592967e-06, "loss": 0.0902, "step": 9575 }, { "epoch": 564.0, "learning_rate": 9.086231155778896e-06, "loss": 0.1024, "step": 9600 }, { "epoch": 566.0, "learning_rate": 9.083718592964825e-06, "loss": 0.0905, "step": 9625 }, { "epoch": 567.0, "learning_rate": 9.081206030150755e-06, "loss": 0.0881, "step": 9650 }, { "epoch": 569.0, "learning_rate": 9.078693467336684e-06, "loss": 0.0934, "step": 9675 }, { "epoch": 570.0, "learning_rate": 9.076180904522613e-06, "loss": 0.0998, "step": 9700 }, { "epoch": 572.0, "learning_rate": 9.073668341708544e-06, "loss": 0.1069, "step": 9725 }, { "epoch": 573.0, "learning_rate": 9.071155778894472e-06, "loss": 0.0889, "step": 9750 }, { "epoch": 574.0, "learning_rate": 9.068643216080403e-06, "loss": 0.0942, "step": 9775 }, { "epoch": 576.0, "learning_rate": 9.066130653266332e-06, "loss": 0.1125, "step": 9800 }, { "epoch": 577.0, "learning_rate": 9.063618090452261e-06, "loss": 0.0795, "step": 9825 }, { "epoch": 579.0, "learning_rate": 9.061105527638193e-06, "loss": 0.0718, "step": 9850 }, { "epoch": 580.0, "learning_rate": 9.058592964824122e-06, "loss": 0.0879, "step": 9875 }, { "epoch": 582.0, "learning_rate": 9.056080402010051e-06, "loss": 0.0899, "step": 9900 }, { "epoch": 583.0, "learning_rate": 9.05356783919598e-06, "loss": 0.0859, "step": 9925 }, { "epoch": 585.0, "learning_rate": 9.05105527638191e-06, "loss": 0.1034, "step": 9950 }, { "epoch": 586.0, "learning_rate": 9.048542713567839e-06, "loss": 0.0763, "step": 9975 }, { "epoch": 588.0, "learning_rate": 9.04603015075377e-06, "loss": 0.0825, "step": 10000 }, { "epoch": 588.0, "eval_loss": 0.4961860775947571, "eval_runtime": 165.4953, "eval_samples_per_second": 0.604, "eval_steps_per_second": 0.103, "eval_wer": 30.628571428571426, "step": 10000 }, { "epoch": 589.0, "learning_rate": 9.0435175879397e-06, "loss": 0.0783, "step": 10025 }, { "epoch": 591.0, "learning_rate": 9.041005025125629e-06, "loss": 0.1025, "step": 10050 }, { "epoch": 592.0, "learning_rate": 9.038492462311558e-06, "loss": 0.092, "step": 10075 }, { "epoch": 594.0, "learning_rate": 9.035979899497487e-06, "loss": 0.1059, "step": 10100 }, { "epoch": 595.0, "learning_rate": 9.033467336683418e-06, "loss": 0.0905, "step": 10125 }, { "epoch": 597.0, "learning_rate": 9.030954773869348e-06, "loss": 0.0957, "step": 10150 }, { "epoch": 598.0, "learning_rate": 9.028442211055277e-06, "loss": 0.0729, "step": 10175 }, { "epoch": 599.0, "learning_rate": 9.025929648241208e-06, "loss": 0.0889, "step": 10200 }, { "epoch": 601.0, "learning_rate": 9.023417085427136e-06, "loss": 0.0919, "step": 10225 }, { "epoch": 602.0, "learning_rate": 9.020904522613067e-06, "loss": 0.0993, "step": 10250 }, { "epoch": 604.0, "learning_rate": 9.018391959798996e-06, "loss": 0.068, "step": 10275 }, { "epoch": 605.0, "learning_rate": 9.015879396984925e-06, "loss": 0.1183, "step": 10300 }, { "epoch": 607.0, "learning_rate": 9.013366834170855e-06, "loss": 0.0959, "step": 10325 }, { "epoch": 608.0, "learning_rate": 9.010854271356784e-06, "loss": 0.105, "step": 10350 }, { "epoch": 610.0, "learning_rate": 9.008341708542713e-06, "loss": 0.0845, "step": 10375 }, { "epoch": 611.0, "learning_rate": 9.005829145728644e-06, "loss": 0.0909, "step": 10400 }, { "epoch": 613.0, "learning_rate": 9.003316582914574e-06, "loss": 0.0828, "step": 10425 }, { "epoch": 614.0, "learning_rate": 9.000804020100503e-06, "loss": 0.0868, "step": 10450 }, { "epoch": 616.0, "learning_rate": 8.998291457286434e-06, "loss": 0.0864, "step": 10475 }, { "epoch": 617.0, "learning_rate": 8.995778894472362e-06, "loss": 0.0952, "step": 10500 }, { "epoch": 619.0, "learning_rate": 8.993266331658293e-06, "loss": 0.089, "step": 10525 }, { "epoch": 620.0, "learning_rate": 8.990753768844222e-06, "loss": 0.0814, "step": 10550 }, { "epoch": 622.0, "learning_rate": 8.988241206030151e-06, "loss": 0.0902, "step": 10575 }, { "epoch": 623.0, "learning_rate": 8.98572864321608e-06, "loss": 0.0805, "step": 10600 }, { "epoch": 624.0, "learning_rate": 8.98321608040201e-06, "loss": 0.0865, "step": 10625 }, { "epoch": 626.0, "learning_rate": 8.980703517587941e-06, "loss": 0.0794, "step": 10650 }, { "epoch": 627.0, "learning_rate": 8.97819095477387e-06, "loss": 0.0988, "step": 10675 }, { "epoch": 629.0, "learning_rate": 8.9756783919598e-06, "loss": 0.066, "step": 10700 }, { "epoch": 630.0, "learning_rate": 8.973165829145729e-06, "loss": 0.0907, "step": 10725 }, { "epoch": 632.0, "learning_rate": 8.97065326633166e-06, "loss": 0.0868, "step": 10750 }, { "epoch": 633.0, "learning_rate": 8.968140703517588e-06, "loss": 0.0899, "step": 10775 }, { "epoch": 635.0, "learning_rate": 8.965628140703519e-06, "loss": 0.0776, "step": 10800 }, { "epoch": 636.0, "learning_rate": 8.963115577889448e-06, "loss": 0.0813, "step": 10825 }, { "epoch": 638.0, "learning_rate": 8.960603015075377e-06, "loss": 0.0679, "step": 10850 }, { "epoch": 639.0, "learning_rate": 8.958090452261308e-06, "loss": 0.0851, "step": 10875 }, { "epoch": 641.0, "learning_rate": 8.955577889447236e-06, "loss": 0.0706, "step": 10900 }, { "epoch": 642.0, "learning_rate": 8.953065326633167e-06, "loss": 0.1014, "step": 10925 }, { "epoch": 644.0, "learning_rate": 8.950552763819096e-06, "loss": 0.0835, "step": 10950 }, { "epoch": 645.0, "learning_rate": 8.948040201005026e-06, "loss": 0.0786, "step": 10975 }, { "epoch": 647.0, "learning_rate": 8.945527638190955e-06, "loss": 0.0753, "step": 11000 }, { "epoch": 647.0, "eval_loss": 0.47232896089553833, "eval_runtime": 163.8528, "eval_samples_per_second": 0.61, "eval_steps_per_second": 0.104, "eval_wer": 31.2, "step": 11000 }, { "epoch": 648.0, "learning_rate": 8.943015075376886e-06, "loss": 0.0759, "step": 11025 }, { "epoch": 649.0, "learning_rate": 8.940502512562815e-06, "loss": 0.0592, "step": 11050 }, { "epoch": 651.0, "learning_rate": 8.937989949748745e-06, "loss": 0.0927, "step": 11075 }, { "epoch": 652.0, "learning_rate": 8.935477386934674e-06, "loss": 0.0757, "step": 11100 }, { "epoch": 654.0, "learning_rate": 8.932964824120603e-06, "loss": 0.0775, "step": 11125 }, { "epoch": 655.0, "learning_rate": 8.930452261306534e-06, "loss": 0.0816, "step": 11150 }, { "epoch": 657.0, "learning_rate": 8.927939698492462e-06, "loss": 0.0822, "step": 11175 }, { "epoch": 658.0, "learning_rate": 8.925427135678393e-06, "loss": 0.0862, "step": 11200 }, { "epoch": 660.0, "learning_rate": 8.922914572864322e-06, "loss": 0.1058, "step": 11225 }, { "epoch": 661.0, "learning_rate": 8.920402010050252e-06, "loss": 0.0775, "step": 11250 }, { "epoch": 663.0, "learning_rate": 8.917889447236183e-06, "loss": 0.0804, "step": 11275 }, { "epoch": 664.0, "learning_rate": 8.915376884422112e-06, "loss": 0.0948, "step": 11300 }, { "epoch": 666.0, "learning_rate": 8.912864321608041e-06, "loss": 0.0834, "step": 11325 }, { "epoch": 667.0, "learning_rate": 8.91035175879397e-06, "loss": 0.0703, "step": 11350 }, { "epoch": 669.0, "learning_rate": 8.9078391959799e-06, "loss": 0.0819, "step": 11375 }, { "epoch": 670.0, "learning_rate": 8.90532663316583e-06, "loss": 0.0623, "step": 11400 }, { "epoch": 672.0, "learning_rate": 8.90281407035176e-06, "loss": 0.0836, "step": 11425 }, { "epoch": 673.0, "learning_rate": 8.900301507537688e-06, "loss": 0.0851, "step": 11450 }, { "epoch": 674.0, "learning_rate": 8.897788944723619e-06, "loss": 0.0823, "step": 11475 }, { "epoch": 676.0, "learning_rate": 8.895276381909548e-06, "loss": 0.0703, "step": 11500 }, { "epoch": 677.0, "learning_rate": 8.892763819095478e-06, "loss": 0.0912, "step": 11525 }, { "epoch": 679.0, "learning_rate": 8.890251256281409e-06, "loss": 0.087, "step": 11550 }, { "epoch": 680.0, "learning_rate": 8.887738693467338e-06, "loss": 0.0689, "step": 11575 }, { "epoch": 682.0, "learning_rate": 8.885226130653267e-06, "loss": 0.0793, "step": 11600 }, { "epoch": 683.0, "learning_rate": 8.882713567839196e-06, "loss": 0.0764, "step": 11625 }, { "epoch": 685.0, "learning_rate": 8.880201005025126e-06, "loss": 0.08, "step": 11650 }, { "epoch": 686.0, "learning_rate": 8.877688442211057e-06, "loss": 0.0523, "step": 11675 }, { "epoch": 688.0, "learning_rate": 8.875175879396986e-06, "loss": 0.0728, "step": 11700 }, { "epoch": 689.0, "learning_rate": 8.872663316582915e-06, "loss": 0.0639, "step": 11725 }, { "epoch": 691.0, "learning_rate": 8.870150753768845e-06, "loss": 0.0494, "step": 11750 }, { "epoch": 692.0, "learning_rate": 8.867638190954774e-06, "loss": 0.0784, "step": 11775 }, { "epoch": 694.0, "learning_rate": 8.865125628140703e-06, "loss": 0.0737, "step": 11800 }, { "epoch": 695.0, "learning_rate": 8.862613065326634e-06, "loss": 0.0812, "step": 11825 }, { "epoch": 697.0, "learning_rate": 8.860100502512564e-06, "loss": 0.0798, "step": 11850 }, { "epoch": 698.0, "learning_rate": 8.857587939698493e-06, "loss": 0.0697, "step": 11875 }, { "epoch": 699.0, "learning_rate": 8.855075376884424e-06, "loss": 0.0826, "step": 11900 }, { "epoch": 701.0, "learning_rate": 8.852562814070352e-06, "loss": 0.0638, "step": 11925 }, { "epoch": 702.0, "learning_rate": 8.850050251256283e-06, "loss": 0.0809, "step": 11950 }, { "epoch": 704.0, "learning_rate": 8.847537688442212e-06, "loss": 0.0619, "step": 11975 }, { "epoch": 705.0, "learning_rate": 8.845025125628141e-06, "loss": 0.0812, "step": 12000 }, { "epoch": 705.0, "eval_loss": 0.45736855268478394, "eval_runtime": 162.5424, "eval_samples_per_second": 0.615, "eval_steps_per_second": 0.105, "eval_wer": 28.685714285714287, "step": 12000 }, { "epoch": 707.0, "learning_rate": 8.84251256281407e-06, "loss": 0.0547, "step": 12025 }, { "epoch": 708.0, "learning_rate": 8.84e-06, "loss": 0.0719, "step": 12050 }, { "epoch": 710.0, "learning_rate": 8.83748743718593e-06, "loss": 0.0681, "step": 12075 }, { "epoch": 711.0, "learning_rate": 8.83497487437186e-06, "loss": 0.085, "step": 12100 }, { "epoch": 713.0, "learning_rate": 8.83246231155779e-06, "loss": 0.0799, "step": 12125 }, { "epoch": 714.0, "learning_rate": 8.829949748743719e-06, "loss": 0.0787, "step": 12150 }, { "epoch": 716.0, "learning_rate": 8.82743718592965e-06, "loss": 0.0667, "step": 12175 }, { "epoch": 717.0, "learning_rate": 8.824924623115578e-06, "loss": 0.0656, "step": 12200 }, { "epoch": 719.0, "learning_rate": 8.822412060301509e-06, "loss": 0.0691, "step": 12225 }, { "epoch": 720.0, "learning_rate": 8.819899497487438e-06, "loss": 0.0826, "step": 12250 }, { "epoch": 722.0, "learning_rate": 8.817386934673367e-06, "loss": 0.0762, "step": 12275 }, { "epoch": 723.0, "learning_rate": 8.814874371859298e-06, "loss": 0.0941, "step": 12300 }, { "epoch": 724.0, "learning_rate": 8.812361809045226e-06, "loss": 0.0739, "step": 12325 }, { "epoch": 726.0, "learning_rate": 8.809849246231157e-06, "loss": 0.073, "step": 12350 }, { "epoch": 727.0, "learning_rate": 8.807336683417086e-06, "loss": 0.0791, "step": 12375 }, { "epoch": 729.0, "learning_rate": 8.804824120603016e-06, "loss": 0.0621, "step": 12400 }, { "epoch": 730.0, "learning_rate": 8.802311557788945e-06, "loss": 0.064, "step": 12425 }, { "epoch": 732.0, "learning_rate": 8.799798994974876e-06, "loss": 0.0665, "step": 12450 }, { "epoch": 733.0, "learning_rate": 8.797286432160804e-06, "loss": 0.0739, "step": 12475 }, { "epoch": 735.0, "learning_rate": 8.794773869346735e-06, "loss": 0.0702, "step": 12500 }, { "epoch": 736.0, "learning_rate": 8.792261306532664e-06, "loss": 0.0612, "step": 12525 }, { "epoch": 738.0, "learning_rate": 8.789748743718593e-06, "loss": 0.0645, "step": 12550 }, { "epoch": 739.0, "learning_rate": 8.787236180904524e-06, "loss": 0.0567, "step": 12575 }, { "epoch": 741.0, "learning_rate": 8.784723618090452e-06, "loss": 0.0667, "step": 12600 }, { "epoch": 742.0, "learning_rate": 8.782211055276383e-06, "loss": 0.0572, "step": 12625 }, { "epoch": 744.0, "learning_rate": 8.779698492462312e-06, "loss": 0.058, "step": 12650 }, { "epoch": 745.0, "learning_rate": 8.777185929648242e-06, "loss": 0.0649, "step": 12675 }, { "epoch": 747.0, "learning_rate": 8.774673366834171e-06, "loss": 0.0906, "step": 12700 }, { "epoch": 748.0, "learning_rate": 8.772160804020102e-06, "loss": 0.0642, "step": 12725 }, { "epoch": 749.0, "learning_rate": 8.769648241206031e-06, "loss": 0.0705, "step": 12750 }, { "epoch": 751.0, "learning_rate": 8.76713567839196e-06, "loss": 0.0779, "step": 12775 }, { "epoch": 752.0, "learning_rate": 8.76462311557789e-06, "loss": 0.0453, "step": 12800 }, { "epoch": 754.0, "learning_rate": 8.76211055276382e-06, "loss": 0.0708, "step": 12825 }, { "epoch": 755.0, "learning_rate": 8.75959798994975e-06, "loss": 0.071, "step": 12850 }, { "epoch": 757.0, "learning_rate": 8.757085427135678e-06, "loss": 0.0615, "step": 12875 }, { "epoch": 758.0, "learning_rate": 8.754572864321609e-06, "loss": 0.0796, "step": 12900 }, { "epoch": 760.0, "learning_rate": 8.752060301507538e-06, "loss": 0.0709, "step": 12925 }, { "epoch": 761.0, "learning_rate": 8.749547738693468e-06, "loss": 0.0636, "step": 12950 }, { "epoch": 763.0, "learning_rate": 8.747035175879399e-06, "loss": 0.0672, "step": 12975 }, { "epoch": 764.0, "learning_rate": 8.74462311557789e-06, "loss": 0.062, "step": 13000 }, { "epoch": 764.0, "eval_loss": 0.4627605676651001, "eval_runtime": 165.0988, "eval_samples_per_second": 0.606, "eval_steps_per_second": 0.103, "eval_wer": 28.799999999999997, "step": 13000 }, { "epoch": 766.0, "learning_rate": 8.74211055276382e-06, "loss": 0.0577, "step": 13025 }, { "epoch": 767.0, "learning_rate": 8.73959798994975e-06, "loss": 0.0565, "step": 13050 }, { "epoch": 769.0, "learning_rate": 8.737085427135678e-06, "loss": 0.0533, "step": 13075 }, { "epoch": 770.0, "learning_rate": 8.734572864321609e-06, "loss": 0.0557, "step": 13100 }, { "epoch": 772.0, "learning_rate": 8.732060301507538e-06, "loss": 0.0765, "step": 13125 }, { "epoch": 773.0, "learning_rate": 8.729547738693468e-06, "loss": 0.0612, "step": 13150 }, { "epoch": 774.0, "learning_rate": 8.727035175879399e-06, "loss": 0.064, "step": 13175 }, { "epoch": 776.0, "learning_rate": 8.724522613065326e-06, "loss": 0.0614, "step": 13200 }, { "epoch": 777.0, "learning_rate": 8.722010050251257e-06, "loss": 0.0617, "step": 13225 }, { "epoch": 779.0, "learning_rate": 8.719497487437187e-06, "loss": 0.0586, "step": 13250 }, { "epoch": 780.0, "learning_rate": 8.716984924623116e-06, "loss": 0.0557, "step": 13275 }, { "epoch": 782.0, "learning_rate": 8.714472361809045e-06, "loss": 0.064, "step": 13300 }, { "epoch": 783.0, "learning_rate": 8.711959798994976e-06, "loss": 0.0672, "step": 13325 }, { "epoch": 785.0, "learning_rate": 8.709447236180906e-06, "loss": 0.0523, "step": 13350 }, { "epoch": 786.0, "learning_rate": 8.706934673366835e-06, "loss": 0.0661, "step": 13375 }, { "epoch": 788.0, "learning_rate": 8.704422110552764e-06, "loss": 0.0624, "step": 13400 }, { "epoch": 789.0, "learning_rate": 8.701909547738694e-06, "loss": 0.054, "step": 13425 }, { "epoch": 791.0, "learning_rate": 8.699396984924625e-06, "loss": 0.0671, "step": 13450 }, { "epoch": 792.0, "learning_rate": 8.696884422110552e-06, "loss": 0.0644, "step": 13475 }, { "epoch": 794.0, "learning_rate": 8.694371859296483e-06, "loss": 0.0644, "step": 13500 }, { "epoch": 795.0, "learning_rate": 8.691859296482413e-06, "loss": 0.0607, "step": 13525 }, { "epoch": 797.0, "learning_rate": 8.689346733668342e-06, "loss": 0.0609, "step": 13550 }, { "epoch": 798.0, "learning_rate": 8.686834170854273e-06, "loss": 0.0562, "step": 13575 }, { "epoch": 799.0, "learning_rate": 8.684321608040202e-06, "loss": 0.0524, "step": 13600 }, { "epoch": 801.0, "learning_rate": 8.681809045226132e-06, "loss": 0.0538, "step": 13625 }, { "epoch": 802.0, "learning_rate": 8.679296482412061e-06, "loss": 0.0661, "step": 13650 }, { "epoch": 804.0, "learning_rate": 8.67678391959799e-06, "loss": 0.0635, "step": 13675 }, { "epoch": 805.0, "learning_rate": 8.67427135678392e-06, "loss": 0.0594, "step": 13700 }, { "epoch": 807.0, "learning_rate": 8.67175879396985e-06, "loss": 0.059, "step": 13725 }, { "epoch": 808.0, "learning_rate": 8.66924623115578e-06, "loss": 0.0673, "step": 13750 }, { "epoch": 810.0, "learning_rate": 8.66673366834171e-06, "loss": 0.0507, "step": 13775 }, { "epoch": 811.0, "learning_rate": 8.664221105527639e-06, "loss": 0.059, "step": 13800 }, { "epoch": 813.0, "learning_rate": 8.661708542713568e-06, "loss": 0.0572, "step": 13825 }, { "epoch": 814.0, "learning_rate": 8.659195979899499e-06, "loss": 0.0595, "step": 13850 }, { "epoch": 816.0, "learning_rate": 8.656683417085428e-06, "loss": 0.0446, "step": 13875 }, { "epoch": 817.0, "learning_rate": 8.654170854271358e-06, "loss": 0.0433, "step": 13900 }, { "epoch": 819.0, "learning_rate": 8.651658291457287e-06, "loss": 0.0483, "step": 13925 }, { "epoch": 820.0, "learning_rate": 8.649145728643216e-06, "loss": 0.0516, "step": 13950 }, { "epoch": 822.0, "learning_rate": 8.646633165829147e-06, "loss": 0.0541, "step": 13975 }, { "epoch": 823.0, "learning_rate": 8.644120603015077e-06, "loss": 0.0604, "step": 14000 }, { "epoch": 823.0, "eval_loss": 0.4667850434780121, "eval_runtime": 163.2225, "eval_samples_per_second": 0.613, "eval_steps_per_second": 0.104, "eval_wer": 28.000000000000004, "step": 14000 }, { "epoch": 824.0, "learning_rate": 8.641608040201006e-06, "loss": 0.0581, "step": 14025 }, { "epoch": 826.0, "learning_rate": 8.639095477386935e-06, "loss": 0.0593, "step": 14050 }, { "epoch": 827.0, "learning_rate": 8.636582914572865e-06, "loss": 0.0719, "step": 14075 }, { "epoch": 829.0, "learning_rate": 8.634070351758794e-06, "loss": 0.0558, "step": 14100 }, { "epoch": 830.0, "learning_rate": 8.631557788944725e-06, "loss": 0.0407, "step": 14125 }, { "epoch": 832.0, "learning_rate": 8.629045226130654e-06, "loss": 0.0487, "step": 14150 }, { "epoch": 833.0, "learning_rate": 8.626532663316584e-06, "loss": 0.0767, "step": 14175 }, { "epoch": 835.0, "learning_rate": 8.624020100502513e-06, "loss": 0.047, "step": 14200 }, { "epoch": 836.0, "learning_rate": 8.621507537688442e-06, "loss": 0.0621, "step": 14225 }, { "epoch": 838.0, "learning_rate": 8.618994974874373e-06, "loss": 0.0494, "step": 14250 }, { "epoch": 839.0, "learning_rate": 8.616482412060303e-06, "loss": 0.0468, "step": 14275 }, { "epoch": 841.0, "learning_rate": 8.613969849246232e-06, "loss": 0.0783, "step": 14300 }, { "epoch": 842.0, "learning_rate": 8.611457286432161e-06, "loss": 0.0554, "step": 14325 }, { "epoch": 844.0, "learning_rate": 8.60894472361809e-06, "loss": 0.0606, "step": 14350 }, { "epoch": 845.0, "learning_rate": 8.606432160804022e-06, "loss": 0.0622, "step": 14375 }, { "epoch": 847.0, "learning_rate": 8.603919597989951e-06, "loss": 0.0557, "step": 14400 }, { "epoch": 848.0, "learning_rate": 8.60140703517588e-06, "loss": 0.0474, "step": 14425 }, { "epoch": 849.0, "learning_rate": 8.59889447236181e-06, "loss": 0.0413, "step": 14450 }, { "epoch": 851.0, "learning_rate": 8.596381909547739e-06, "loss": 0.0686, "step": 14475 }, { "epoch": 852.0, "learning_rate": 8.593869346733668e-06, "loss": 0.0451, "step": 14500 }, { "epoch": 854.0, "learning_rate": 8.5913567839196e-06, "loss": 0.056, "step": 14525 }, { "epoch": 855.0, "learning_rate": 8.588844221105528e-06, "loss": 0.0584, "step": 14550 }, { "epoch": 857.0, "learning_rate": 8.586331658291458e-06, "loss": 0.0503, "step": 14575 }, { "epoch": 858.0, "learning_rate": 8.583819095477389e-06, "loss": 0.0587, "step": 14600 }, { "epoch": 860.0, "learning_rate": 8.581306532663316e-06, "loss": 0.0463, "step": 14625 }, { "epoch": 861.0, "learning_rate": 8.578793969849247e-06, "loss": 0.0408, "step": 14650 }, { "epoch": 863.0, "learning_rate": 8.576281407035177e-06, "loss": 0.0536, "step": 14675 }, { "epoch": 864.0, "learning_rate": 8.573768844221106e-06, "loss": 0.0529, "step": 14700 }, { "epoch": 866.0, "learning_rate": 8.571256281407035e-06, "loss": 0.0527, "step": 14725 }, { "epoch": 867.0, "learning_rate": 8.568743718592965e-06, "loss": 0.0626, "step": 14750 }, { "epoch": 869.0, "learning_rate": 8.566231155778894e-06, "loss": 0.0561, "step": 14775 }, { "epoch": 870.0, "learning_rate": 8.563718592964825e-06, "loss": 0.0552, "step": 14800 }, { "epoch": 872.0, "learning_rate": 8.561206030150754e-06, "loss": 0.0455, "step": 14825 }, { "epoch": 873.0, "learning_rate": 8.558693467336684e-06, "loss": 0.0684, "step": 14850 }, { "epoch": 874.0, "learning_rate": 8.556180904522615e-06, "loss": 0.0514, "step": 14875 }, { "epoch": 876.0, "learning_rate": 8.553668341708542e-06, "loss": 0.0605, "step": 14900 }, { "epoch": 877.0, "learning_rate": 8.551155778894473e-06, "loss": 0.0484, "step": 14925 }, { "epoch": 879.0, "learning_rate": 8.548643216080403e-06, "loss": 0.0541, "step": 14950 }, { "epoch": 880.0, "learning_rate": 8.546130653266332e-06, "loss": 0.0486, "step": 14975 }, { "epoch": 882.0, "learning_rate": 8.543618090452263e-06, "loss": 0.0666, "step": 15000 }, { "epoch": 882.0, "eval_loss": 0.4697132110595703, "eval_runtime": 165.8528, "eval_samples_per_second": 0.603, "eval_steps_per_second": 0.103, "eval_wer": 28.685714285714287, "step": 15000 }, { "epoch": 883.0, "learning_rate": 8.541105527638192e-06, "loss": 0.0519, "step": 15025 }, { "epoch": 885.0, "learning_rate": 8.538592964824122e-06, "loss": 0.0402, "step": 15050 }, { "epoch": 886.0, "learning_rate": 8.536080402010051e-06, "loss": 0.0601, "step": 15075 }, { "epoch": 888.0, "learning_rate": 8.53356783919598e-06, "loss": 0.0541, "step": 15100 }, { "epoch": 889.0, "learning_rate": 8.53105527638191e-06, "loss": 0.0369, "step": 15125 }, { "epoch": 891.0, "learning_rate": 8.52854271356784e-06, "loss": 0.0479, "step": 15150 }, { "epoch": 892.0, "learning_rate": 8.526030150753768e-06, "loss": 0.0528, "step": 15175 }, { "epoch": 894.0, "learning_rate": 8.5235175879397e-06, "loss": 0.0575, "step": 15200 }, { "epoch": 895.0, "learning_rate": 8.521005025125629e-06, "loss": 0.059, "step": 15225 }, { "epoch": 897.0, "learning_rate": 8.518492462311558e-06, "loss": 0.0456, "step": 15250 }, { "epoch": 898.0, "learning_rate": 8.515979899497489e-06, "loss": 0.0608, "step": 15275 }, { "epoch": 899.0, "learning_rate": 8.513467336683418e-06, "loss": 0.0555, "step": 15300 }, { "epoch": 901.0, "learning_rate": 8.510954773869348e-06, "loss": 0.0574, "step": 15325 }, { "epoch": 902.0, "learning_rate": 8.508442211055277e-06, "loss": 0.0539, "step": 15350 }, { "epoch": 904.0, "learning_rate": 8.505929648241206e-06, "loss": 0.049, "step": 15375 }, { "epoch": 905.0, "learning_rate": 8.503417085427136e-06, "loss": 0.0483, "step": 15400 }, { "epoch": 907.0, "learning_rate": 8.500904522613067e-06, "loss": 0.0371, "step": 15425 }, { "epoch": 908.0, "learning_rate": 8.498391959798996e-06, "loss": 0.0444, "step": 15450 }, { "epoch": 910.0, "learning_rate": 8.495879396984925e-06, "loss": 0.0611, "step": 15475 }, { "epoch": 911.0, "learning_rate": 8.493366834170855e-06, "loss": 0.0381, "step": 15500 }, { "epoch": 913.0, "learning_rate": 8.490854271356784e-06, "loss": 0.0445, "step": 15525 }, { "epoch": 914.0, "learning_rate": 8.488341708542715e-06, "loss": 0.0528, "step": 15550 }, { "epoch": 916.0, "learning_rate": 8.485929648241207e-06, "loss": 0.039, "step": 15575 }, { "epoch": 917.0, "learning_rate": 8.483417085427136e-06, "loss": 0.0525, "step": 15600 }, { "epoch": 919.0, "learning_rate": 8.480904522613065e-06, "loss": 0.0478, "step": 15625 }, { "epoch": 920.0, "learning_rate": 8.478391959798996e-06, "loss": 0.0517, "step": 15650 }, { "epoch": 922.0, "learning_rate": 8.475879396984926e-06, "loss": 0.0378, "step": 15675 }, { "epoch": 923.0, "learning_rate": 8.473366834170855e-06, "loss": 0.0541, "step": 15700 }, { "epoch": 924.0, "learning_rate": 8.470854271356784e-06, "loss": 0.0483, "step": 15725 }, { "epoch": 926.0, "learning_rate": 8.468341708542715e-06, "loss": 0.0572, "step": 15750 }, { "epoch": 927.0, "learning_rate": 8.465829145728643e-06, "loss": 0.0654, "step": 15775 }, { "epoch": 929.0, "learning_rate": 8.463316582914574e-06, "loss": 0.042, "step": 15800 }, { "epoch": 930.0, "learning_rate": 8.460804020100503e-06, "loss": 0.0497, "step": 15825 }, { "epoch": 932.0, "learning_rate": 8.458291457286432e-06, "loss": 0.0304, "step": 15850 }, { "epoch": 933.0, "learning_rate": 8.455778894472363e-06, "loss": 0.0391, "step": 15875 }, { "epoch": 935.0, "learning_rate": 8.453266331658291e-06, "loss": 0.0499, "step": 15900 }, { "epoch": 936.0, "learning_rate": 8.450753768844222e-06, "loss": 0.05, "step": 15925 }, { "epoch": 938.0, "learning_rate": 8.448241206030151e-06, "loss": 0.0508, "step": 15950 }, { "epoch": 939.0, "learning_rate": 8.44572864321608e-06, "loss": 0.0343, "step": 15975 }, { "epoch": 941.0, "learning_rate": 8.44321608040201e-06, "loss": 0.0405, "step": 16000 }, { "epoch": 941.0, "eval_loss": 0.49084585905075073, "eval_runtime": 211.5151, "eval_samples_per_second": 0.473, "eval_steps_per_second": 0.08, "eval_wer": 54.628571428571426, "step": 16000 }, { "epoch": 942.0, "learning_rate": 8.440703517587941e-06, "loss": 0.056, "step": 16025 }, { "epoch": 944.0, "learning_rate": 8.43819095477387e-06, "loss": 0.0445, "step": 16050 }, { "epoch": 945.0, "learning_rate": 8.4356783919598e-06, "loss": 0.0505, "step": 16075 }, { "epoch": 947.0, "learning_rate": 8.433165829145729e-06, "loss": 0.0451, "step": 16100 }, { "epoch": 948.0, "learning_rate": 8.430653266331658e-06, "loss": 0.0576, "step": 16125 }, { "epoch": 949.0, "learning_rate": 8.42814070351759e-06, "loss": 0.0436, "step": 16150 }, { "epoch": 951.0, "learning_rate": 8.425628140703517e-06, "loss": 0.0384, "step": 16175 }, { "epoch": 952.0, "learning_rate": 8.423115577889448e-06, "loss": 0.0424, "step": 16200 }, { "epoch": 954.0, "learning_rate": 8.420603015075377e-06, "loss": 0.0527, "step": 16225 }, { "epoch": 955.0, "learning_rate": 8.418090452261307e-06, "loss": 0.0455, "step": 16250 }, { "epoch": 957.0, "learning_rate": 8.415577889447238e-06, "loss": 0.0502, "step": 16275 }, { "epoch": 958.0, "learning_rate": 8.413065326633167e-06, "loss": 0.0513, "step": 16300 }, { "epoch": 960.0, "learning_rate": 8.410552763819096e-06, "loss": 0.0554, "step": 16325 }, { "epoch": 961.0, "learning_rate": 8.408040201005026e-06, "loss": 0.0373, "step": 16350 }, { "epoch": 963.0, "learning_rate": 8.405527638190955e-06, "loss": 0.0635, "step": 16375 }, { "epoch": 964.0, "learning_rate": 8.403015075376884e-06, "loss": 0.0309, "step": 16400 }, { "epoch": 966.0, "learning_rate": 8.400502512562815e-06, "loss": 0.0315, "step": 16425 }, { "epoch": 967.0, "learning_rate": 8.397989949748745e-06, "loss": 0.051, "step": 16450 }, { "epoch": 969.0, "learning_rate": 8.395477386934674e-06, "loss": 0.0331, "step": 16475 }, { "epoch": 970.0, "learning_rate": 8.392964824120603e-06, "loss": 0.0325, "step": 16500 }, { "epoch": 972.0, "learning_rate": 8.390452261306533e-06, "loss": 0.0439, "step": 16525 }, { "epoch": 973.0, "learning_rate": 8.387939698492464e-06, "loss": 0.0454, "step": 16550 }, { "epoch": 974.0, "learning_rate": 8.385427135678393e-06, "loss": 0.0315, "step": 16575 }, { "epoch": 976.0, "learning_rate": 8.382914572864322e-06, "loss": 0.0446, "step": 16600 }, { "epoch": 977.0, "learning_rate": 8.380402010050252e-06, "loss": 0.0515, "step": 16625 }, { "epoch": 979.0, "learning_rate": 8.377889447236181e-06, "loss": 0.0429, "step": 16650 }, { "epoch": 980.0, "learning_rate": 8.375376884422112e-06, "loss": 0.0438, "step": 16675 }, { "epoch": 982.0, "learning_rate": 8.372864321608041e-06, "loss": 0.0284, "step": 16700 }, { "epoch": 983.0, "learning_rate": 8.37035175879397e-06, "loss": 0.0347, "step": 16725 }, { "epoch": 985.0, "learning_rate": 8.3678391959799e-06, "loss": 0.0472, "step": 16750 }, { "epoch": 986.0, "learning_rate": 8.36532663316583e-06, "loss": 0.038, "step": 16775 }, { "epoch": 988.0, "learning_rate": 8.362814070351759e-06, "loss": 0.0374, "step": 16800 }, { "epoch": 989.0, "learning_rate": 8.36030150753769e-06, "loss": 0.0465, "step": 16825 }, { "epoch": 991.0, "learning_rate": 8.357788944723619e-06, "loss": 0.0333, "step": 16850 }, { "epoch": 992.0, "learning_rate": 8.355276381909548e-06, "loss": 0.0482, "step": 16875 }, { "epoch": 994.0, "learning_rate": 8.35276381909548e-06, "loss": 0.0396, "step": 16900 }, { "epoch": 995.0, "learning_rate": 8.350251256281407e-06, "loss": 0.0556, "step": 16925 }, { "epoch": 997.0, "learning_rate": 8.347738693467338e-06, "loss": 0.0372, "step": 16950 }, { "epoch": 998.0, "learning_rate": 8.345226130653267e-06, "loss": 0.0438, "step": 16975 }, { "epoch": 999.0, "learning_rate": 8.342713567839197e-06, "loss": 0.0349, "step": 17000 }, { "epoch": 999.0, "eval_loss": 0.472809761762619, "eval_runtime": 167.3915, "eval_samples_per_second": 0.597, "eval_steps_per_second": 0.102, "eval_wer": 28.45714285714286, "step": 17000 }, { "epoch": 1001.0, "learning_rate": 8.340201005025126e-06, "loss": 0.032, "step": 17025 }, { "epoch": 1002.0, "learning_rate": 8.337688442211055e-06, "loss": 0.0321, "step": 17050 }, { "epoch": 1004.0, "learning_rate": 8.335175879396986e-06, "loss": 0.0314, "step": 17075 }, { "epoch": 1005.0, "learning_rate": 8.332663316582916e-06, "loss": 0.0418, "step": 17100 }, { "epoch": 1007.0, "learning_rate": 8.330150753768845e-06, "loss": 0.0483, "step": 17125 }, { "epoch": 1008.0, "learning_rate": 8.327638190954774e-06, "loss": 0.0421, "step": 17150 }, { "epoch": 1010.0, "learning_rate": 8.325125628140705e-06, "loss": 0.0355, "step": 17175 }, { "epoch": 1011.0, "learning_rate": 8.322613065326633e-06, "loss": 0.0463, "step": 17200 }, { "epoch": 1013.0, "learning_rate": 8.320100502512564e-06, "loss": 0.0435, "step": 17225 }, { "epoch": 1014.0, "learning_rate": 8.317587939698493e-06, "loss": 0.0311, "step": 17250 }, { "epoch": 1016.0, "learning_rate": 8.315075376884423e-06, "loss": 0.0481, "step": 17275 }, { "epoch": 1017.0, "learning_rate": 8.312562814070354e-06, "loss": 0.0519, "step": 17300 }, { "epoch": 1019.0, "learning_rate": 8.310050251256281e-06, "loss": 0.0275, "step": 17325 }, { "epoch": 1020.0, "learning_rate": 8.307537688442212e-06, "loss": 0.0377, "step": 17350 }, { "epoch": 1022.0, "learning_rate": 8.305025125628142e-06, "loss": 0.0477, "step": 17375 }, { "epoch": 1023.0, "learning_rate": 8.30251256281407e-06, "loss": 0.0369, "step": 17400 }, { "epoch": 1024.0, "learning_rate": 8.3e-06, "loss": 0.0324, "step": 17425 }, { "epoch": 1026.0, "learning_rate": 8.297487437185931e-06, "loss": 0.0416, "step": 17450 }, { "epoch": 1027.0, "learning_rate": 8.294974874371859e-06, "loss": 0.0367, "step": 17475 }, { "epoch": 1029.0, "learning_rate": 8.29246231155779e-06, "loss": 0.0454, "step": 17500 }, { "epoch": 1030.0, "learning_rate": 8.289949748743719e-06, "loss": 0.0279, "step": 17525 }, { "epoch": 1032.0, "learning_rate": 8.287437185929648e-06, "loss": 0.0426, "step": 17550 }, { "epoch": 1033.0, "learning_rate": 8.28492462311558e-06, "loss": 0.0321, "step": 17575 }, { "epoch": 1035.0, "learning_rate": 8.282412060301507e-06, "loss": 0.0363, "step": 17600 }, { "epoch": 1036.0, "learning_rate": 8.279899497487438e-06, "loss": 0.0391, "step": 17625 }, { "epoch": 1038.0, "learning_rate": 8.277386934673367e-06, "loss": 0.0485, "step": 17650 }, { "epoch": 1039.0, "learning_rate": 8.274874371859297e-06, "loss": 0.0377, "step": 17675 }, { "epoch": 1041.0, "learning_rate": 8.272361809045228e-06, "loss": 0.0318, "step": 17700 }, { "epoch": 1042.0, "learning_rate": 8.269849246231157e-06, "loss": 0.0482, "step": 17725 }, { "epoch": 1044.0, "learning_rate": 8.267336683417086e-06, "loss": 0.0373, "step": 17750 }, { "epoch": 1045.0, "learning_rate": 8.264824120603016e-06, "loss": 0.0331, "step": 17775 }, { "epoch": 1047.0, "learning_rate": 8.262311557788945e-06, "loss": 0.0311, "step": 17800 }, { "epoch": 1048.0, "learning_rate": 8.259798994974874e-06, "loss": 0.042, "step": 17825 }, { "epoch": 1049.0, "learning_rate": 8.257286432160805e-06, "loss": 0.033, "step": 17850 }, { "epoch": 1051.0, "learning_rate": 8.254773869346733e-06, "loss": 0.0334, "step": 17875 }, { "epoch": 1052.0, "learning_rate": 8.252261306532664e-06, "loss": 0.0312, "step": 17900 }, { "epoch": 1054.0, "learning_rate": 8.249748743718593e-06, "loss": 0.0296, "step": 17925 }, { "epoch": 1055.0, "learning_rate": 8.247236180904523e-06, "loss": 0.0337, "step": 17950 }, { "epoch": 1057.0, "learning_rate": 8.244723618090454e-06, "loss": 0.0402, "step": 17975 }, { "epoch": 1058.0, "learning_rate": 8.242211055276383e-06, "loss": 0.0409, "step": 18000 }, { "epoch": 1058.0, "eval_loss": 0.4883716106414795, "eval_runtime": 168.0249, "eval_samples_per_second": 0.595, "eval_steps_per_second": 0.101, "eval_wer": 28.45714285714286, "step": 18000 }, { "epoch": 1060.0, "learning_rate": 8.239698492462312e-06, "loss": 0.0325, "step": 18025 }, { "epoch": 1061.0, "learning_rate": 8.237185929648242e-06, "loss": 0.0424, "step": 18050 }, { "epoch": 1063.0, "learning_rate": 8.234673366834171e-06, "loss": 0.0409, "step": 18075 }, { "epoch": 1064.0, "learning_rate": 8.2321608040201e-06, "loss": 0.0348, "step": 18100 }, { "epoch": 1066.0, "learning_rate": 8.229648241206031e-06, "loss": 0.0285, "step": 18125 }, { "epoch": 1067.0, "learning_rate": 8.22713567839196e-06, "loss": 0.039, "step": 18150 }, { "epoch": 1069.0, "learning_rate": 8.22462311557789e-06, "loss": 0.034, "step": 18175 }, { "epoch": 1070.0, "learning_rate": 8.22211055276382e-06, "loss": 0.0452, "step": 18200 }, { "epoch": 1072.0, "learning_rate": 8.219597989949749e-06, "loss": 0.0457, "step": 18225 }, { "epoch": 1073.0, "learning_rate": 8.21708542713568e-06, "loss": 0.0371, "step": 18250 }, { "epoch": 1074.0, "learning_rate": 8.214572864321609e-06, "loss": 0.0276, "step": 18275 }, { "epoch": 1076.0, "learning_rate": 8.212060301507538e-06, "loss": 0.031, "step": 18300 }, { "epoch": 1077.0, "learning_rate": 8.20954773869347e-06, "loss": 0.0489, "step": 18325 }, { "epoch": 1079.0, "learning_rate": 8.207035175879397e-06, "loss": 0.0437, "step": 18350 }, { "epoch": 1080.0, "learning_rate": 8.204522613065328e-06, "loss": 0.0352, "step": 18375 }, { "epoch": 1082.0, "learning_rate": 8.202010050251257e-06, "loss": 0.0394, "step": 18400 }, { "epoch": 1083.0, "learning_rate": 8.199497487437187e-06, "loss": 0.0399, "step": 18425 }, { "epoch": 1085.0, "learning_rate": 8.196984924623116e-06, "loss": 0.0296, "step": 18450 }, { "epoch": 1086.0, "learning_rate": 8.194472361809045e-06, "loss": 0.0395, "step": 18475 }, { "epoch": 1088.0, "learning_rate": 8.191959798994975e-06, "loss": 0.0464, "step": 18500 }, { "epoch": 1089.0, "learning_rate": 8.189447236180906e-06, "loss": 0.0423, "step": 18525 }, { "epoch": 1091.0, "learning_rate": 8.186934673366835e-06, "loss": 0.0259, "step": 18550 }, { "epoch": 1092.0, "learning_rate": 8.184422110552764e-06, "loss": 0.0378, "step": 18575 }, { "epoch": 1094.0, "learning_rate": 8.181909547738695e-06, "loss": 0.0306, "step": 18600 }, { "epoch": 1095.0, "learning_rate": 8.179396984924623e-06, "loss": 0.0435, "step": 18625 }, { "epoch": 1097.0, "learning_rate": 8.176884422110554e-06, "loss": 0.0243, "step": 18650 }, { "epoch": 1098.0, "learning_rate": 8.174371859296483e-06, "loss": 0.0362, "step": 18675 }, { "epoch": 1099.0, "learning_rate": 8.171859296482413e-06, "loss": 0.035, "step": 18700 }, { "epoch": 1101.0, "learning_rate": 8.169346733668342e-06, "loss": 0.0376, "step": 18725 }, { "epoch": 1102.0, "learning_rate": 8.166834170854271e-06, "loss": 0.0333, "step": 18750 }, { "epoch": 1104.0, "learning_rate": 8.164321608040202e-06, "loss": 0.0196, "step": 18775 }, { "epoch": 1105.0, "learning_rate": 8.161809045226132e-06, "loss": 0.0464, "step": 18800 }, { "epoch": 1107.0, "learning_rate": 8.159296482412061e-06, "loss": 0.0389, "step": 18825 }, { "epoch": 1108.0, "learning_rate": 8.15678391959799e-06, "loss": 0.0423, "step": 18850 }, { "epoch": 1110.0, "learning_rate": 8.154271356783921e-06, "loss": 0.0383, "step": 18875 }, { "epoch": 1111.0, "learning_rate": 8.151758793969849e-06, "loss": 0.0372, "step": 18900 }, { "epoch": 1113.0, "learning_rate": 8.14924623115578e-06, "loss": 0.0295, "step": 18925 }, { "epoch": 1114.0, "learning_rate": 8.14673366834171e-06, "loss": 0.0306, "step": 18950 }, { "epoch": 1116.0, "learning_rate": 8.144221105527639e-06, "loss": 0.0314, "step": 18975 }, { "epoch": 1117.0, "learning_rate": 8.14170854271357e-06, "loss": 0.0292, "step": 19000 }, { "epoch": 1117.0, "eval_loss": 0.45764777064323425, "eval_runtime": 163.9131, "eval_samples_per_second": 0.61, "eval_steps_per_second": 0.104, "eval_wer": 27.314285714285713, "step": 19000 }, { "epoch": 1119.0, "learning_rate": 8.139195979899497e-06, "loss": 0.0314, "step": 19025 }, { "epoch": 1120.0, "learning_rate": 8.136683417085428e-06, "loss": 0.0349, "step": 19050 }, { "epoch": 1122.0, "learning_rate": 8.134170854271358e-06, "loss": 0.0321, "step": 19075 }, { "epoch": 1123.0, "learning_rate": 8.131658291457287e-06, "loss": 0.032, "step": 19100 }, { "epoch": 1124.0, "learning_rate": 8.129145728643216e-06, "loss": 0.0383, "step": 19125 }, { "epoch": 1126.0, "learning_rate": 8.126633165829147e-06, "loss": 0.0388, "step": 19150 }, { "epoch": 1127.0, "learning_rate": 8.124120603015076e-06, "loss": 0.0368, "step": 19175 }, { "epoch": 1129.0, "learning_rate": 8.121608040201006e-06, "loss": 0.0312, "step": 19200 }, { "epoch": 1130.0, "learning_rate": 8.119095477386935e-06, "loss": 0.0387, "step": 19225 }, { "epoch": 1132.0, "learning_rate": 8.116582914572864e-06, "loss": 0.0255, "step": 19250 }, { "epoch": 1133.0, "learning_rate": 8.114070351758795e-06, "loss": 0.0284, "step": 19275 }, { "epoch": 1135.0, "learning_rate": 8.111557788944723e-06, "loss": 0.0364, "step": 19300 }, { "epoch": 1136.0, "learning_rate": 8.109045226130654e-06, "loss": 0.024, "step": 19325 }, { "epoch": 1138.0, "learning_rate": 8.106532663316583e-06, "loss": 0.0272, "step": 19350 }, { "epoch": 1139.0, "learning_rate": 8.104020100502513e-06, "loss": 0.0318, "step": 19375 }, { "epoch": 1141.0, "learning_rate": 8.101507537688444e-06, "loss": 0.0425, "step": 19400 }, { "epoch": 1142.0, "learning_rate": 8.098994974874373e-06, "loss": 0.019, "step": 19425 }, { "epoch": 1144.0, "learning_rate": 8.096482412060302e-06, "loss": 0.0383, "step": 19450 }, { "epoch": 1145.0, "learning_rate": 8.093969849246232e-06, "loss": 0.0424, "step": 19475 }, { "epoch": 1147.0, "learning_rate": 8.091457286432161e-06, "loss": 0.0297, "step": 19500 }, { "epoch": 1148.0, "learning_rate": 8.08894472361809e-06, "loss": 0.0245, "step": 19525 }, { "epoch": 1149.0, "learning_rate": 8.086432160804021e-06, "loss": 0.0414, "step": 19550 }, { "epoch": 1151.0, "learning_rate": 8.08391959798995e-06, "loss": 0.0345, "step": 19575 }, { "epoch": 1152.0, "learning_rate": 8.08140703517588e-06, "loss": 0.0401, "step": 19600 }, { "epoch": 1154.0, "learning_rate": 8.07889447236181e-06, "loss": 0.0275, "step": 19625 }, { "epoch": 1155.0, "learning_rate": 8.076381909547739e-06, "loss": 0.0248, "step": 19650 }, { "epoch": 1157.0, "learning_rate": 8.07386934673367e-06, "loss": 0.0347, "step": 19675 }, { "epoch": 1158.0, "learning_rate": 8.071356783919599e-06, "loss": 0.0301, "step": 19700 }, { "epoch": 1160.0, "learning_rate": 8.068844221105528e-06, "loss": 0.0317, "step": 19725 }, { "epoch": 1161.0, "learning_rate": 8.066331658291458e-06, "loss": 0.0326, "step": 19750 }, { "epoch": 1163.0, "learning_rate": 8.063819095477387e-06, "loss": 0.0372, "step": 19775 }, { "epoch": 1164.0, "learning_rate": 8.061306532663318e-06, "loss": 0.0281, "step": 19800 }, { "epoch": 1166.0, "learning_rate": 8.058793969849247e-06, "loss": 0.0357, "step": 19825 }, { "epoch": 1167.0, "learning_rate": 8.056381909547739e-06, "loss": 0.033, "step": 19850 }, { "epoch": 1169.0, "learning_rate": 8.05386934673367e-06, "loss": 0.0212, "step": 19875 }, { "epoch": 1170.0, "learning_rate": 8.051356783919598e-06, "loss": 0.026, "step": 19900 }, { "epoch": 1172.0, "learning_rate": 8.048844221105529e-06, "loss": 0.0337, "step": 19925 }, { "epoch": 1173.0, "learning_rate": 8.046331658291458e-06, "loss": 0.0373, "step": 19950 }, { "epoch": 1174.0, "learning_rate": 8.043819095477387e-06, "loss": 0.0409, "step": 19975 }, { "epoch": 1176.0, "learning_rate": 8.041306532663318e-06, "loss": 0.0247, "step": 20000 }, { "epoch": 1176.0, "eval_loss": 0.4733918309211731, "eval_runtime": 165.2895, "eval_samples_per_second": 0.605, "eval_steps_per_second": 0.103, "eval_wer": 28.914285714285715, "step": 20000 }, { "epoch": 1177.0, "learning_rate": 8.038793969849248e-06, "loss": 0.0274, "step": 20025 }, { "epoch": 1179.0, "learning_rate": 8.036281407035177e-06, "loss": 0.0247, "step": 20050 }, { "epoch": 1180.0, "learning_rate": 8.033768844221106e-06, "loss": 0.027, "step": 20075 }, { "epoch": 1182.0, "learning_rate": 8.031256281407036e-06, "loss": 0.0294, "step": 20100 }, { "epoch": 1183.0, "learning_rate": 8.028743718592965e-06, "loss": 0.025, "step": 20125 }, { "epoch": 1185.0, "learning_rate": 8.026231155778896e-06, "loss": 0.0352, "step": 20150 }, { "epoch": 1186.0, "learning_rate": 8.023718592964824e-06, "loss": 0.0391, "step": 20175 }, { "epoch": 1188.0, "learning_rate": 8.021206030150755e-06, "loss": 0.0347, "step": 20200 }, { "epoch": 1189.0, "learning_rate": 8.018693467336684e-06, "loss": 0.0273, "step": 20225 }, { "epoch": 1191.0, "learning_rate": 8.016180904522613e-06, "loss": 0.0274, "step": 20250 }, { "epoch": 1192.0, "learning_rate": 8.013668341708544e-06, "loss": 0.0206, "step": 20275 }, { "epoch": 1194.0, "learning_rate": 8.011155778894474e-06, "loss": 0.0263, "step": 20300 }, { "epoch": 1195.0, "learning_rate": 8.008643216080403e-06, "loss": 0.0234, "step": 20325 }, { "epoch": 1197.0, "learning_rate": 8.006130653266332e-06, "loss": 0.0383, "step": 20350 }, { "epoch": 1198.0, "learning_rate": 8.003618090452261e-06, "loss": 0.0404, "step": 20375 }, { "epoch": 1199.0, "learning_rate": 8.001105527638192e-06, "loss": 0.0239, "step": 20400 }, { "epoch": 1201.0, "learning_rate": 7.998592964824122e-06, "loss": 0.0361, "step": 20425 }, { "epoch": 1202.0, "learning_rate": 7.996080402010051e-06, "loss": 0.0335, "step": 20450 }, { "epoch": 1204.0, "learning_rate": 7.99356783919598e-06, "loss": 0.0242, "step": 20475 }, { "epoch": 1205.0, "learning_rate": 7.99105527638191e-06, "loss": 0.0418, "step": 20500 }, { "epoch": 1207.0, "learning_rate": 7.988542713567839e-06, "loss": 0.0251, "step": 20525 }, { "epoch": 1208.0, "learning_rate": 7.98603015075377e-06, "loss": 0.0226, "step": 20550 }, { "epoch": 1210.0, "learning_rate": 7.9835175879397e-06, "loss": 0.0327, "step": 20575 }, { "epoch": 1211.0, "learning_rate": 7.981005025125629e-06, "loss": 0.0259, "step": 20600 }, { "epoch": 1213.0, "learning_rate": 7.978492462311558e-06, "loss": 0.0277, "step": 20625 }, { "epoch": 1214.0, "learning_rate": 7.975979899497487e-06, "loss": 0.0252, "step": 20650 }, { "epoch": 1216.0, "learning_rate": 7.973467336683418e-06, "loss": 0.0258, "step": 20675 }, { "epoch": 1217.0, "learning_rate": 7.970954773869348e-06, "loss": 0.0255, "step": 20700 }, { "epoch": 1219.0, "learning_rate": 7.968442211055277e-06, "loss": 0.0351, "step": 20725 }, { "epoch": 1220.0, "learning_rate": 7.965929648241206e-06, "loss": 0.0191, "step": 20750 }, { "epoch": 1222.0, "learning_rate": 7.963417085427136e-06, "loss": 0.0247, "step": 20775 }, { "epoch": 1223.0, "learning_rate": 7.960904522613065e-06, "loss": 0.0356, "step": 20800 }, { "epoch": 1224.0, "learning_rate": 7.958391959798996e-06, "loss": 0.0213, "step": 20825 }, { "epoch": 1226.0, "learning_rate": 7.955879396984925e-06, "loss": 0.0281, "step": 20850 }, { "epoch": 1227.0, "learning_rate": 7.953366834170855e-06, "loss": 0.0227, "step": 20875 }, { "epoch": 1229.0, "learning_rate": 7.950854271356786e-06, "loss": 0.025, "step": 20900 }, { "epoch": 1230.0, "learning_rate": 7.948341708542713e-06, "loss": 0.0249, "step": 20925 }, { "epoch": 1232.0, "learning_rate": 7.945829145728644e-06, "loss": 0.024, "step": 20950 }, { "epoch": 1233.0, "learning_rate": 7.943316582914574e-06, "loss": 0.0299, "step": 20975 }, { "epoch": 1235.0, "learning_rate": 7.940804020100503e-06, "loss": 0.0229, "step": 21000 }, { "epoch": 1235.0, "eval_loss": 0.4899497330188751, "eval_runtime": 176.1002, "eval_samples_per_second": 0.568, "eval_steps_per_second": 0.097, "eval_wer": 29.942857142857143, "step": 21000 }, { "epoch": 1236.0, "learning_rate": 7.938291457286434e-06, "loss": 0.0287, "step": 21025 }, { "epoch": 1238.0, "learning_rate": 7.935778894472362e-06, "loss": 0.0255, "step": 21050 }, { "epoch": 1239.0, "learning_rate": 7.933266331658293e-06, "loss": 0.0335, "step": 21075 }, { "epoch": 1241.0, "learning_rate": 7.930753768844222e-06, "loss": 0.0283, "step": 21100 }, { "epoch": 1242.0, "learning_rate": 7.928241206030151e-06, "loss": 0.0237, "step": 21125 }, { "epoch": 1244.0, "learning_rate": 7.92572864321608e-06, "loss": 0.0237, "step": 21150 }, { "epoch": 1245.0, "learning_rate": 7.923216080402012e-06, "loss": 0.024, "step": 21175 }, { "epoch": 1247.0, "learning_rate": 7.92070351758794e-06, "loss": 0.0247, "step": 21200 }, { "epoch": 1248.0, "learning_rate": 7.91819095477387e-06, "loss": 0.0237, "step": 21225 }, { "epoch": 1249.0, "learning_rate": 7.9156783919598e-06, "loss": 0.0336, "step": 21250 }, { "epoch": 1251.0, "learning_rate": 7.913165829145729e-06, "loss": 0.0376, "step": 21275 }, { "epoch": 1252.0, "learning_rate": 7.91065326633166e-06, "loss": 0.0256, "step": 21300 }, { "epoch": 1254.0, "learning_rate": 7.908140703517588e-06, "loss": 0.0224, "step": 21325 }, { "epoch": 1255.0, "learning_rate": 7.905628140703519e-06, "loss": 0.0251, "step": 21350 }, { "epoch": 1257.0, "learning_rate": 7.903115577889448e-06, "loss": 0.0322, "step": 21375 }, { "epoch": 1258.0, "learning_rate": 7.900603015075377e-06, "loss": 0.0289, "step": 21400 }, { "epoch": 1260.0, "learning_rate": 7.898090452261307e-06, "loss": 0.0232, "step": 21425 }, { "epoch": 1261.0, "learning_rate": 7.895577889447238e-06, "loss": 0.0272, "step": 21450 }, { "epoch": 1263.0, "learning_rate": 7.893065326633167e-06, "loss": 0.0313, "step": 21475 }, { "epoch": 1264.0, "learning_rate": 7.890552763819096e-06, "loss": 0.0238, "step": 21500 }, { "epoch": 1266.0, "learning_rate": 7.888040201005026e-06, "loss": 0.0177, "step": 21525 }, { "epoch": 1267.0, "learning_rate": 7.885527638190955e-06, "loss": 0.0222, "step": 21550 }, { "epoch": 1269.0, "learning_rate": 7.883015075376886e-06, "loss": 0.0243, "step": 21575 }, { "epoch": 1270.0, "learning_rate": 7.880502512562814e-06, "loss": 0.0333, "step": 21600 }, { "epoch": 1272.0, "learning_rate": 7.877989949748745e-06, "loss": 0.021, "step": 21625 }, { "epoch": 1273.0, "learning_rate": 7.875477386934674e-06, "loss": 0.0246, "step": 21650 }, { "epoch": 1274.0, "learning_rate": 7.872964824120603e-06, "loss": 0.0254, "step": 21675 }, { "epoch": 1276.0, "learning_rate": 7.870452261306534e-06, "loss": 0.0307, "step": 21700 }, { "epoch": 1277.0, "learning_rate": 7.867939698492464e-06, "loss": 0.0252, "step": 21725 }, { "epoch": 1279.0, "learning_rate": 7.865427135678393e-06, "loss": 0.0172, "step": 21750 }, { "epoch": 1280.0, "learning_rate": 7.862914572864322e-06, "loss": 0.0166, "step": 21775 }, { "epoch": 1282.0, "learning_rate": 7.860402010050252e-06, "loss": 0.0182, "step": 21800 }, { "epoch": 1283.0, "learning_rate": 7.857889447236181e-06, "loss": 0.0327, "step": 21825 }, { "epoch": 1285.0, "learning_rate": 7.855477386934674e-06, "loss": 0.0186, "step": 21850 }, { "epoch": 1286.0, "learning_rate": 7.852964824120603e-06, "loss": 0.0322, "step": 21875 }, { "epoch": 1288.0, "learning_rate": 7.850452261306534e-06, "loss": 0.0286, "step": 21900 }, { "epoch": 1289.0, "learning_rate": 7.847939698492462e-06, "loss": 0.0242, "step": 21925 }, { "epoch": 1291.0, "learning_rate": 7.845427135678393e-06, "loss": 0.021, "step": 21950 }, { "epoch": 1292.0, "learning_rate": 7.842914572864322e-06, "loss": 0.0259, "step": 21975 }, { "epoch": 1294.0, "learning_rate": 7.840402010050252e-06, "loss": 0.0271, "step": 22000 }, { "epoch": 1294.0, "eval_loss": 0.478964626789093, "eval_runtime": 164.8228, "eval_samples_per_second": 0.607, "eval_steps_per_second": 0.103, "eval_wer": 28.114285714285714, "step": 22000 }, { "epoch": 1295.0, "learning_rate": 7.837889447236181e-06, "loss": 0.0171, "step": 22025 }, { "epoch": 1297.0, "learning_rate": 7.83537688442211e-06, "loss": 0.023, "step": 22050 }, { "epoch": 1298.0, "learning_rate": 7.832864321608041e-06, "loss": 0.0213, "step": 22075 }, { "epoch": 1299.0, "learning_rate": 7.83035175879397e-06, "loss": 0.0289, "step": 22100 }, { "epoch": 1301.0, "learning_rate": 7.8278391959799e-06, "loss": 0.0284, "step": 22125 }, { "epoch": 1302.0, "learning_rate": 7.82532663316583e-06, "loss": 0.0201, "step": 22150 }, { "epoch": 1304.0, "learning_rate": 7.82281407035176e-06, "loss": 0.0298, "step": 22175 }, { "epoch": 1305.0, "learning_rate": 7.820301507537688e-06, "loss": 0.0386, "step": 22200 }, { "epoch": 1307.0, "learning_rate": 7.817788944723619e-06, "loss": 0.0267, "step": 22225 }, { "epoch": 1308.0, "learning_rate": 7.815276381909548e-06, "loss": 0.0197, "step": 22250 }, { "epoch": 1310.0, "learning_rate": 7.812763819095478e-06, "loss": 0.0176, "step": 22275 }, { "epoch": 1311.0, "learning_rate": 7.810251256281409e-06, "loss": 0.0198, "step": 22300 }, { "epoch": 1313.0, "learning_rate": 7.807738693467336e-06, "loss": 0.0295, "step": 22325 }, { "epoch": 1314.0, "learning_rate": 7.805226130653267e-06, "loss": 0.022, "step": 22350 }, { "epoch": 1316.0, "learning_rate": 7.802713567839197e-06, "loss": 0.0177, "step": 22375 }, { "epoch": 1317.0, "learning_rate": 7.800201005025126e-06, "loss": 0.0207, "step": 22400 }, { "epoch": 1319.0, "learning_rate": 7.797688442211055e-06, "loss": 0.0284, "step": 22425 }, { "epoch": 1320.0, "learning_rate": 7.795175879396986e-06, "loss": 0.038, "step": 22450 }, { "epoch": 1322.0, "learning_rate": 7.792663316582916e-06, "loss": 0.0301, "step": 22475 }, { "epoch": 1323.0, "learning_rate": 7.790150753768845e-06, "loss": 0.0298, "step": 22500 }, { "epoch": 1324.0, "learning_rate": 7.787638190954774e-06, "loss": 0.0219, "step": 22525 }, { "epoch": 1326.0, "learning_rate": 7.785125628140704e-06, "loss": 0.0323, "step": 22550 }, { "epoch": 1327.0, "learning_rate": 7.782613065326635e-06, "loss": 0.0212, "step": 22575 }, { "epoch": 1329.0, "learning_rate": 7.780100502512562e-06, "loss": 0.0218, "step": 22600 }, { "epoch": 1330.0, "learning_rate": 7.777587939698493e-06, "loss": 0.0198, "step": 22625 }, { "epoch": 1332.0, "learning_rate": 7.775075376884423e-06, "loss": 0.0231, "step": 22650 }, { "epoch": 1333.0, "learning_rate": 7.772562814070352e-06, "loss": 0.0212, "step": 22675 }, { "epoch": 1335.0, "learning_rate": 7.770050251256283e-06, "loss": 0.0321, "step": 22700 }, { "epoch": 1336.0, "learning_rate": 7.767537688442212e-06, "loss": 0.0192, "step": 22725 }, { "epoch": 1338.0, "learning_rate": 7.765025125628142e-06, "loss": 0.0189, "step": 22750 }, { "epoch": 1339.0, "learning_rate": 7.762512562814071e-06, "loss": 0.0218, "step": 22775 }, { "epoch": 1341.0, "learning_rate": 7.76e-06, "loss": 0.0286, "step": 22800 }, { "epoch": 1342.0, "learning_rate": 7.75748743718593e-06, "loss": 0.0253, "step": 22825 }, { "epoch": 1344.0, "learning_rate": 7.75497487437186e-06, "loss": 0.0204, "step": 22850 }, { "epoch": 1345.0, "learning_rate": 7.752462311557788e-06, "loss": 0.0272, "step": 22875 }, { "epoch": 1347.0, "learning_rate": 7.74994974874372e-06, "loss": 0.0249, "step": 22900 }, { "epoch": 1348.0, "learning_rate": 7.747437185929649e-06, "loss": 0.0348, "step": 22925 }, { "epoch": 1349.0, "learning_rate": 7.744924623115578e-06, "loss": 0.0197, "step": 22950 }, { "epoch": 1351.0, "learning_rate": 7.742412060301509e-06, "loss": 0.0244, "step": 22975 }, { "epoch": 1352.0, "learning_rate": 7.739899497487438e-06, "loss": 0.0271, "step": 23000 }, { "epoch": 1352.0, "eval_loss": 0.5011751651763916, "eval_runtime": 170.2406, "eval_samples_per_second": 0.587, "eval_steps_per_second": 0.1, "eval_wer": 30.17142857142857, "step": 23000 }, { "epoch": 1354.0, "learning_rate": 7.737386934673368e-06, "loss": 0.0264, "step": 23025 }, { "epoch": 1355.0, "learning_rate": 7.734874371859297e-06, "loss": 0.0135, "step": 23050 }, { "epoch": 1357.0, "learning_rate": 7.732361809045226e-06, "loss": 0.0111, "step": 23075 }, { "epoch": 1358.0, "learning_rate": 7.729849246231157e-06, "loss": 0.0164, "step": 23100 }, { "epoch": 1360.0, "learning_rate": 7.727336683417087e-06, "loss": 0.0229, "step": 23125 }, { "epoch": 1361.0, "learning_rate": 7.724824120603016e-06, "loss": 0.0232, "step": 23150 }, { "epoch": 1363.0, "learning_rate": 7.722311557788945e-06, "loss": 0.0206, "step": 23175 }, { "epoch": 1364.0, "learning_rate": 7.719798994974874e-06, "loss": 0.0242, "step": 23200 }, { "epoch": 1366.0, "learning_rate": 7.717286432160804e-06, "loss": 0.0308, "step": 23225 }, { "epoch": 1367.0, "learning_rate": 7.714773869346735e-06, "loss": 0.0108, "step": 23250 }, { "epoch": 1369.0, "learning_rate": 7.712261306532664e-06, "loss": 0.0264, "step": 23275 }, { "epoch": 1370.0, "learning_rate": 7.709748743718593e-06, "loss": 0.02, "step": 23300 }, { "epoch": 1372.0, "learning_rate": 7.707236180904525e-06, "loss": 0.0279, "step": 23325 }, { "epoch": 1373.0, "learning_rate": 7.704723618090452e-06, "loss": 0.0236, "step": 23350 }, { "epoch": 1374.0, "learning_rate": 7.702211055276383e-06, "loss": 0.0189, "step": 23375 }, { "epoch": 1376.0, "learning_rate": 7.699698492462312e-06, "loss": 0.0203, "step": 23400 }, { "epoch": 1377.0, "learning_rate": 7.697185929648242e-06, "loss": 0.034, "step": 23425 }, { "epoch": 1379.0, "learning_rate": 7.694673366834171e-06, "loss": 0.0226, "step": 23450 }, { "epoch": 1380.0, "learning_rate": 7.6921608040201e-06, "loss": 0.0237, "step": 23475 }, { "epoch": 1382.0, "learning_rate": 7.68964824120603e-06, "loss": 0.0216, "step": 23500 }, { "epoch": 1383.0, "learning_rate": 7.68713567839196e-06, "loss": 0.0208, "step": 23525 }, { "epoch": 1385.0, "learning_rate": 7.68462311557789e-06, "loss": 0.0216, "step": 23550 }, { "epoch": 1386.0, "learning_rate": 7.68211055276382e-06, "loss": 0.0198, "step": 23575 }, { "epoch": 1388.0, "learning_rate": 7.67959798994975e-06, "loss": 0.0157, "step": 23600 }, { "epoch": 1389.0, "learning_rate": 7.677085427135678e-06, "loss": 0.024, "step": 23625 }, { "epoch": 1391.0, "learning_rate": 7.674572864321609e-06, "loss": 0.0237, "step": 23650 }, { "epoch": 1392.0, "learning_rate": 7.672060301507538e-06, "loss": 0.0202, "step": 23675 }, { "epoch": 1394.0, "learning_rate": 7.669547738693468e-06, "loss": 0.0203, "step": 23700 }, { "epoch": 1395.0, "learning_rate": 7.667035175879399e-06, "loss": 0.0328, "step": 23725 }, { "epoch": 1397.0, "learning_rate": 7.664522613065326e-06, "loss": 0.0261, "step": 23750 }, { "epoch": 1398.0, "learning_rate": 7.662010050251257e-06, "loss": 0.0234, "step": 23775 }, { "epoch": 1399.0, "learning_rate": 7.659497487437187e-06, "loss": 0.0277, "step": 23800 }, { "epoch": 1401.0, "learning_rate": 7.656984924623116e-06, "loss": 0.0286, "step": 23825 }, { "epoch": 1402.0, "learning_rate": 7.654472361809045e-06, "loss": 0.0201, "step": 23850 }, { "epoch": 1404.0, "learning_rate": 7.651959798994976e-06, "loss": 0.0178, "step": 23875 }, { "epoch": 1405.0, "learning_rate": 7.649447236180904e-06, "loss": 0.0162, "step": 23900 }, { "epoch": 1407.0, "learning_rate": 7.646934673366835e-06, "loss": 0.0282, "step": 23925 }, { "epoch": 1408.0, "learning_rate": 7.644422110552764e-06, "loss": 0.0187, "step": 23950 }, { "epoch": 1410.0, "learning_rate": 7.641909547738694e-06, "loss": 0.0175, "step": 23975 }, { "epoch": 1411.0, "learning_rate": 7.639396984924625e-06, "loss": 0.0184, "step": 24000 }, { "epoch": 1411.0, "eval_loss": 0.5008236169815063, "eval_runtime": 169.1896, "eval_samples_per_second": 0.591, "eval_steps_per_second": 0.1, "eval_wer": 27.314285714285713, "step": 24000 }, { "epoch": 1413.0, "learning_rate": 7.636884422110552e-06, "loss": 0.0271, "step": 24025 }, { "epoch": 1414.0, "learning_rate": 7.634371859296483e-06, "loss": 0.0211, "step": 24050 }, { "epoch": 1416.0, "learning_rate": 7.631859296482413e-06, "loss": 0.0147, "step": 24075 }, { "epoch": 1417.0, "learning_rate": 7.629346733668343e-06, "loss": 0.0222, "step": 24100 }, { "epoch": 1419.0, "learning_rate": 7.626834170854271e-06, "loss": 0.0224, "step": 24125 }, { "epoch": 1420.0, "learning_rate": 7.6243216080402015e-06, "loss": 0.0204, "step": 24150 }, { "epoch": 1422.0, "learning_rate": 7.621809045226132e-06, "loss": 0.0222, "step": 24175 }, { "epoch": 1423.0, "learning_rate": 7.619296482412061e-06, "loss": 0.0204, "step": 24200 }, { "epoch": 1424.0, "learning_rate": 7.616783919597991e-06, "loss": 0.0185, "step": 24225 }, { "epoch": 1426.0, "learning_rate": 7.61427135678392e-06, "loss": 0.018, "step": 24250 }, { "epoch": 1427.0, "learning_rate": 7.61175879396985e-06, "loss": 0.0139, "step": 24275 }, { "epoch": 1429.0, "learning_rate": 7.609246231155779e-06, "loss": 0.0175, "step": 24300 }, { "epoch": 1430.0, "learning_rate": 7.606733668341709e-06, "loss": 0.016, "step": 24325 }, { "epoch": 1432.0, "learning_rate": 7.604221105527639e-06, "loss": 0.0258, "step": 24350 }, { "epoch": 1433.0, "learning_rate": 7.601708542713569e-06, "loss": 0.0169, "step": 24375 }, { "epoch": 1435.0, "learning_rate": 7.599195979899499e-06, "loss": 0.0208, "step": 24400 }, { "epoch": 1436.0, "learning_rate": 7.5966834170854274e-06, "loss": 0.0215, "step": 24425 }, { "epoch": 1438.0, "learning_rate": 7.594170854271358e-06, "loss": 0.0192, "step": 24450 }, { "epoch": 1439.0, "learning_rate": 7.591658291457287e-06, "loss": 0.0236, "step": 24475 }, { "epoch": 1441.0, "learning_rate": 7.589145728643217e-06, "loss": 0.0253, "step": 24500 }, { "epoch": 1442.0, "learning_rate": 7.5866331658291456e-06, "loss": 0.02, "step": 24525 }, { "epoch": 1444.0, "learning_rate": 7.584120603015076e-06, "loss": 0.0142, "step": 24550 }, { "epoch": 1445.0, "learning_rate": 7.581608040201006e-06, "loss": 0.0234, "step": 24575 }, { "epoch": 1447.0, "learning_rate": 7.579095477386935e-06, "loss": 0.0192, "step": 24600 }, { "epoch": 1448.0, "learning_rate": 7.576582914572865e-06, "loss": 0.0161, "step": 24625 }, { "epoch": 1449.0, "learning_rate": 7.574070351758795e-06, "loss": 0.0201, "step": 24650 }, { "epoch": 1451.0, "learning_rate": 7.571557788944725e-06, "loss": 0.0214, "step": 24675 }, { "epoch": 1452.0, "learning_rate": 7.569045226130653e-06, "loss": 0.0242, "step": 24700 }, { "epoch": 1454.0, "learning_rate": 7.5665326633165835e-06, "loss": 0.0168, "step": 24725 }, { "epoch": 1455.0, "learning_rate": 7.564020100502513e-06, "loss": 0.0166, "step": 24750 }, { "epoch": 1457.0, "learning_rate": 7.561507537688443e-06, "loss": 0.0223, "step": 24775 }, { "epoch": 1458.0, "learning_rate": 7.558994974874373e-06, "loss": 0.0214, "step": 24800 }, { "epoch": 1460.0, "learning_rate": 7.556482412060302e-06, "loss": 0.0174, "step": 24825 }, { "epoch": 1461.0, "learning_rate": 7.553969849246232e-06, "loss": 0.0245, "step": 24850 }, { "epoch": 1463.0, "learning_rate": 7.551457286432161e-06, "loss": 0.0137, "step": 24875 }, { "epoch": 1464.0, "learning_rate": 7.548944723618091e-06, "loss": 0.0186, "step": 24900 }, { "epoch": 1466.0, "learning_rate": 7.546432160804021e-06, "loss": 0.0196, "step": 24925 }, { "epoch": 1467.0, "learning_rate": 7.543919597989951e-06, "loss": 0.0244, "step": 24950 }, { "epoch": 1469.0, "learning_rate": 7.541407035175879e-06, "loss": 0.0127, "step": 24975 }, { "epoch": 1470.0, "learning_rate": 7.5388944723618095e-06, "loss": 0.0211, "step": 25000 }, { "epoch": 1470.0, "eval_loss": 0.5118334293365479, "eval_runtime": 167.4206, "eval_samples_per_second": 0.597, "eval_steps_per_second": 0.102, "eval_wer": 27.65714285714286, "step": 25000 }, { "epoch": 1472.0, "learning_rate": 7.53638190954774e-06, "loss": 0.0262, "step": 25025 }, { "epoch": 1473.0, "learning_rate": 7.533869346733669e-06, "loss": 0.014, "step": 25050 }, { "epoch": 1474.0, "learning_rate": 7.531356783919599e-06, "loss": 0.0144, "step": 25075 }, { "epoch": 1476.0, "learning_rate": 7.528844221105528e-06, "loss": 0.0164, "step": 25100 }, { "epoch": 1477.0, "learning_rate": 7.526331658291458e-06, "loss": 0.0167, "step": 25125 }, { "epoch": 1479.0, "learning_rate": 7.523819095477387e-06, "loss": 0.0145, "step": 25150 }, { "epoch": 1480.0, "learning_rate": 7.521306532663317e-06, "loss": 0.0138, "step": 25175 }, { "epoch": 1482.0, "learning_rate": 7.5187939698492475e-06, "loss": 0.0232, "step": 25200 }, { "epoch": 1483.0, "learning_rate": 7.516281407035177e-06, "loss": 0.0176, "step": 25225 }, { "epoch": 1485.0, "learning_rate": 7.513768844221106e-06, "loss": 0.0201, "step": 25250 }, { "epoch": 1486.0, "learning_rate": 7.5112562814070354e-06, "loss": 0.0249, "step": 25275 }, { "epoch": 1488.0, "learning_rate": 7.508743718592966e-06, "loss": 0.0304, "step": 25300 }, { "epoch": 1489.0, "learning_rate": 7.506231155778895e-06, "loss": 0.0157, "step": 25325 }, { "epoch": 1491.0, "learning_rate": 7.503718592964825e-06, "loss": 0.0157, "step": 25350 }, { "epoch": 1492.0, "learning_rate": 7.5012060301507536e-06, "loss": 0.0132, "step": 25375 }, { "epoch": 1494.0, "learning_rate": 7.498693467336684e-06, "loss": 0.0273, "step": 25400 }, { "epoch": 1495.0, "learning_rate": 7.496180904522614e-06, "loss": 0.0186, "step": 25425 }, { "epoch": 1497.0, "learning_rate": 7.493668341708543e-06, "loss": 0.0116, "step": 25450 }, { "epoch": 1498.0, "learning_rate": 7.491155778894473e-06, "loss": 0.0209, "step": 25475 }, { "epoch": 1499.0, "learning_rate": 7.488643216080403e-06, "loss": 0.018, "step": 25500 }, { "epoch": 1501.0, "learning_rate": 7.486130653266333e-06, "loss": 0.0155, "step": 25525 }, { "epoch": 1502.0, "learning_rate": 7.483618090452261e-06, "loss": 0.0205, "step": 25550 }, { "epoch": 1504.0, "learning_rate": 7.4811055276381915e-06, "loss": 0.0221, "step": 25575 }, { "epoch": 1505.0, "learning_rate": 7.478592964824121e-06, "loss": 0.0205, "step": 25600 }, { "epoch": 1507.0, "learning_rate": 7.476080402010051e-06, "loss": 0.016, "step": 25625 }, { "epoch": 1508.0, "learning_rate": 7.473567839195981e-06, "loss": 0.0171, "step": 25650 }, { "epoch": 1510.0, "learning_rate": 7.47105527638191e-06, "loss": 0.021, "step": 25675 }, { "epoch": 1511.0, "learning_rate": 7.46854271356784e-06, "loss": 0.0165, "step": 25700 }, { "epoch": 1513.0, "learning_rate": 7.466030150753769e-06, "loss": 0.0132, "step": 25725 }, { "epoch": 1514.0, "learning_rate": 7.463517587939699e-06, "loss": 0.0151, "step": 25750 }, { "epoch": 1516.0, "learning_rate": 7.461005025125629e-06, "loss": 0.0207, "step": 25775 }, { "epoch": 1517.0, "learning_rate": 7.458492462311559e-06, "loss": 0.0146, "step": 25800 }, { "epoch": 1519.0, "learning_rate": 7.455979899497488e-06, "loss": 0.0145, "step": 25825 }, { "epoch": 1520.0, "learning_rate": 7.4534673366834175e-06, "loss": 0.0144, "step": 25850 }, { "epoch": 1522.0, "learning_rate": 7.450954773869348e-06, "loss": 0.0152, "step": 25875 }, { "epoch": 1523.0, "learning_rate": 7.448442211055277e-06, "loss": 0.015, "step": 25900 }, { "epoch": 1524.0, "learning_rate": 7.445929648241207e-06, "loss": 0.019, "step": 25925 }, { "epoch": 1526.0, "learning_rate": 7.443417085427136e-06, "loss": 0.013, "step": 25950 }, { "epoch": 1527.0, "learning_rate": 7.440904522613066e-06, "loss": 0.0125, "step": 25975 }, { "epoch": 1529.0, "learning_rate": 7.438391959798995e-06, "loss": 0.0183, "step": 26000 }, { "epoch": 1529.0, "eval_loss": 0.5397529602050781, "eval_runtime": 170.1683, "eval_samples_per_second": 0.588, "eval_steps_per_second": 0.1, "eval_wer": 30.057142857142853, "step": 26000 }, { "epoch": 1530.0, "learning_rate": 7.435879396984925e-06, "loss": 0.022, "step": 26025 }, { "epoch": 1532.0, "learning_rate": 7.4333668341708555e-06, "loss": 0.0227, "step": 26050 }, { "epoch": 1533.0, "learning_rate": 7.430854271356785e-06, "loss": 0.0128, "step": 26075 }, { "epoch": 1535.0, "learning_rate": 7.428341708542714e-06, "loss": 0.0137, "step": 26100 }, { "epoch": 1536.0, "learning_rate": 7.4258291457286434e-06, "loss": 0.0155, "step": 26125 }, { "epoch": 1538.0, "learning_rate": 7.423316582914574e-06, "loss": 0.0226, "step": 26150 }, { "epoch": 1539.0, "learning_rate": 7.420804020100503e-06, "loss": 0.0159, "step": 26175 }, { "epoch": 1541.0, "learning_rate": 7.418291457286433e-06, "loss": 0.016, "step": 26200 }, { "epoch": 1542.0, "learning_rate": 7.4157788944723616e-06, "loss": 0.0152, "step": 26225 }, { "epoch": 1544.0, "learning_rate": 7.413266331658292e-06, "loss": 0.0184, "step": 26250 }, { "epoch": 1545.0, "learning_rate": 7.410753768844222e-06, "loss": 0.0231, "step": 26275 }, { "epoch": 1547.0, "learning_rate": 7.408241206030151e-06, "loss": 0.0119, "step": 26300 }, { "epoch": 1548.0, "learning_rate": 7.405728643216081e-06, "loss": 0.0243, "step": 26325 }, { "epoch": 1549.0, "learning_rate": 7.403216080402011e-06, "loss": 0.0162, "step": 26350 }, { "epoch": 1551.0, "learning_rate": 7.40070351758794e-06, "loss": 0.0179, "step": 26375 }, { "epoch": 1552.0, "learning_rate": 7.398190954773869e-06, "loss": 0.0143, "step": 26400 }, { "epoch": 1554.0, "learning_rate": 7.3956783919597995e-06, "loss": 0.0124, "step": 26425 }, { "epoch": 1555.0, "learning_rate": 7.39316582914573e-06, "loss": 0.012, "step": 26450 }, { "epoch": 1557.0, "learning_rate": 7.390653266331659e-06, "loss": 0.01, "step": 26475 }, { "epoch": 1558.0, "learning_rate": 7.388140703517589e-06, "loss": 0.0171, "step": 26500 }, { "epoch": 1560.0, "learning_rate": 7.385628140703518e-06, "loss": 0.0125, "step": 26525 }, { "epoch": 1561.0, "learning_rate": 7.383115577889448e-06, "loss": 0.0175, "step": 26550 }, { "epoch": 1563.0, "learning_rate": 7.380603015075377e-06, "loss": 0.0251, "step": 26575 }, { "epoch": 1564.0, "learning_rate": 7.378090452261307e-06, "loss": 0.0149, "step": 26600 }, { "epoch": 1566.0, "learning_rate": 7.375577889447237e-06, "loss": 0.0132, "step": 26625 }, { "epoch": 1567.0, "learning_rate": 7.373065326633167e-06, "loss": 0.0189, "step": 26650 }, { "epoch": 1569.0, "learning_rate": 7.370653266331658e-06, "loss": 0.0182, "step": 26675 }, { "epoch": 1570.0, "learning_rate": 7.3681407035175886e-06, "loss": 0.0172, "step": 26700 }, { "epoch": 1572.0, "learning_rate": 7.365628140703518e-06, "loss": 0.0121, "step": 26725 }, { "epoch": 1573.0, "learning_rate": 7.363115577889448e-06, "loss": 0.0185, "step": 26750 }, { "epoch": 1574.0, "learning_rate": 7.360603015075377e-06, "loss": 0.0139, "step": 26775 }, { "epoch": 1576.0, "learning_rate": 7.3580904522613075e-06, "loss": 0.0103, "step": 26800 }, { "epoch": 1577.0, "learning_rate": 7.355577889447236e-06, "loss": 0.0158, "step": 26825 }, { "epoch": 1579.0, "learning_rate": 7.353065326633166e-06, "loss": 0.0193, "step": 26850 }, { "epoch": 1580.0, "learning_rate": 7.350552763819096e-06, "loss": 0.024, "step": 26875 }, { "epoch": 1582.0, "learning_rate": 7.348140703517589e-06, "loss": 0.0261, "step": 26900 }, { "epoch": 1583.0, "learning_rate": 7.345628140703518e-06, "loss": 0.0147, "step": 26925 }, { "epoch": 1585.0, "learning_rate": 7.343115577889448e-06, "loss": 0.0167, "step": 26950 }, { "epoch": 1586.0, "learning_rate": 7.340603015075377e-06, "loss": 0.0201, "step": 26975 }, { "epoch": 1588.0, "learning_rate": 7.338090452261307e-06, "loss": 0.0164, "step": 27000 }, { "epoch": 1588.0, "eval_loss": 0.5005923509597778, "eval_runtime": 165.5466, "eval_samples_per_second": 0.604, "eval_steps_per_second": 0.103, "eval_wer": 27.314285714285713, "step": 27000 }, { "epoch": 1589.0, "learning_rate": 7.335577889447236e-06, "loss": 0.0203, "step": 27025 }, { "epoch": 1591.0, "learning_rate": 7.333065326633166e-06, "loss": 0.0219, "step": 27050 }, { "epoch": 1592.0, "learning_rate": 7.3305527638190966e-06, "loss": 0.0134, "step": 27075 }, { "epoch": 1594.0, "learning_rate": 7.328040201005026e-06, "loss": 0.016, "step": 27100 }, { "epoch": 1595.0, "learning_rate": 7.325527638190956e-06, "loss": 0.0111, "step": 27125 }, { "epoch": 1597.0, "learning_rate": 7.3230150753768845e-06, "loss": 0.0153, "step": 27150 }, { "epoch": 1598.0, "learning_rate": 7.320502512562815e-06, "loss": 0.0183, "step": 27175 }, { "epoch": 1599.0, "learning_rate": 7.317989949748744e-06, "loss": 0.0117, "step": 27200 }, { "epoch": 1601.0, "learning_rate": 7.315477386934674e-06, "loss": 0.0263, "step": 27225 }, { "epoch": 1602.0, "learning_rate": 7.312964824120604e-06, "loss": 0.0155, "step": 27250 }, { "epoch": 1604.0, "learning_rate": 7.310452261306533e-06, "loss": 0.0159, "step": 27275 }, { "epoch": 1605.0, "learning_rate": 7.307939698492463e-06, "loss": 0.0251, "step": 27300 }, { "epoch": 1607.0, "learning_rate": 7.305427135678392e-06, "loss": 0.015, "step": 27325 }, { "epoch": 1608.0, "learning_rate": 7.3029145728643225e-06, "loss": 0.0133, "step": 27350 }, { "epoch": 1610.0, "learning_rate": 7.300402010050252e-06, "loss": 0.0163, "step": 27375 }, { "epoch": 1611.0, "learning_rate": 7.297889447236182e-06, "loss": 0.0171, "step": 27400 }, { "epoch": 1613.0, "learning_rate": 7.2953768844221105e-06, "loss": 0.0216, "step": 27425 }, { "epoch": 1614.0, "learning_rate": 7.292864321608041e-06, "loss": 0.0166, "step": 27450 }, { "epoch": 1616.0, "learning_rate": 7.290351758793971e-06, "loss": 0.0132, "step": 27475 }, { "epoch": 1617.0, "learning_rate": 7.2878391959799e-06, "loss": 0.0143, "step": 27500 }, { "epoch": 1619.0, "learning_rate": 7.28532663316583e-06, "loss": 0.0122, "step": 27525 }, { "epoch": 1620.0, "learning_rate": 7.282814070351759e-06, "loss": 0.0166, "step": 27550 }, { "epoch": 1622.0, "learning_rate": 7.280301507537689e-06, "loss": 0.0165, "step": 27575 }, { "epoch": 1623.0, "learning_rate": 7.277788944723618e-06, "loss": 0.0173, "step": 27600 }, { "epoch": 1624.0, "learning_rate": 7.2752763819095484e-06, "loss": 0.017, "step": 27625 }, { "epoch": 1626.0, "learning_rate": 7.272763819095478e-06, "loss": 0.0149, "step": 27650 }, { "epoch": 1627.0, "learning_rate": 7.270251256281408e-06, "loss": 0.0169, "step": 27675 }, { "epoch": 1629.0, "learning_rate": 7.267738693467338e-06, "loss": 0.0192, "step": 27700 }, { "epoch": 1630.0, "learning_rate": 7.265226130653267e-06, "loss": 0.0184, "step": 27725 }, { "epoch": 1632.0, "learning_rate": 7.262713567839197e-06, "loss": 0.0174, "step": 27750 }, { "epoch": 1633.0, "learning_rate": 7.260201005025126e-06, "loss": 0.0146, "step": 27775 }, { "epoch": 1635.0, "learning_rate": 7.257688442211056e-06, "loss": 0.0122, "step": 27800 }, { "epoch": 1636.0, "learning_rate": 7.255175879396985e-06, "loss": 0.0108, "step": 27825 }, { "epoch": 1638.0, "learning_rate": 7.252663316582915e-06, "loss": 0.0166, "step": 27850 }, { "epoch": 1639.0, "learning_rate": 7.250150753768845e-06, "loss": 0.0138, "step": 27875 }, { "epoch": 1641.0, "learning_rate": 7.247638190954774e-06, "loss": 0.0146, "step": 27900 }, { "epoch": 1642.0, "learning_rate": 7.2451256281407046e-06, "loss": 0.0144, "step": 27925 }, { "epoch": 1644.0, "learning_rate": 7.242613065326634e-06, "loss": 0.0136, "step": 27950 }, { "epoch": 1645.0, "learning_rate": 7.240100502512564e-06, "loss": 0.0231, "step": 27975 }, { "epoch": 1647.0, "learning_rate": 7.2375879396984925e-06, "loss": 0.0169, "step": 28000 }, { "epoch": 1647.0, "eval_loss": 0.5059393048286438, "eval_runtime": 166.3618, "eval_samples_per_second": 0.601, "eval_steps_per_second": 0.102, "eval_wer": 27.085714285714285, "step": 28000 }, { "epoch": 1648.0, "learning_rate": 7.235075376884423e-06, "loss": 0.0115, "step": 28025 }, { "epoch": 1649.0, "learning_rate": 7.232562814070352e-06, "loss": 0.02, "step": 28050 }, { "epoch": 1651.0, "learning_rate": 7.230050251256282e-06, "loss": 0.0163, "step": 28075 }, { "epoch": 1652.0, "learning_rate": 7.227537688442212e-06, "loss": 0.022, "step": 28100 }, { "epoch": 1654.0, "learning_rate": 7.225025125628141e-06, "loss": 0.0141, "step": 28125 }, { "epoch": 1655.0, "learning_rate": 7.222512562814071e-06, "loss": 0.0195, "step": 28150 }, { "epoch": 1657.0, "learning_rate": 7.22e-06, "loss": 0.0186, "step": 28175 }, { "epoch": 1658.0, "learning_rate": 7.2174874371859305e-06, "loss": 0.0142, "step": 28200 }, { "epoch": 1660.0, "learning_rate": 7.21497487437186e-06, "loss": 0.0131, "step": 28225 }, { "epoch": 1661.0, "learning_rate": 7.21246231155779e-06, "loss": 0.0109, "step": 28250 }, { "epoch": 1663.0, "learning_rate": 7.2099497487437185e-06, "loss": 0.0168, "step": 28275 }, { "epoch": 1664.0, "learning_rate": 7.207437185929649e-06, "loss": 0.0176, "step": 28300 }, { "epoch": 1666.0, "learning_rate": 7.204924623115579e-06, "loss": 0.0084, "step": 28325 }, { "epoch": 1667.0, "learning_rate": 7.202412060301508e-06, "loss": 0.0159, "step": 28350 }, { "epoch": 1669.0, "learning_rate": 7.199899497487438e-06, "loss": 0.0185, "step": 28375 }, { "epoch": 1670.0, "learning_rate": 7.197386934673367e-06, "loss": 0.0188, "step": 28400 }, { "epoch": 1672.0, "learning_rate": 7.194874371859297e-06, "loss": 0.0145, "step": 28425 }, { "epoch": 1673.0, "learning_rate": 7.192361809045226e-06, "loss": 0.0184, "step": 28450 }, { "epoch": 1674.0, "learning_rate": 7.1898492462311564e-06, "loss": 0.013, "step": 28475 }, { "epoch": 1676.0, "learning_rate": 7.187336683417087e-06, "loss": 0.012, "step": 28500 }, { "epoch": 1677.0, "learning_rate": 7.184824120603016e-06, "loss": 0.0134, "step": 28525 }, { "epoch": 1679.0, "learning_rate": 7.182311557788946e-06, "loss": 0.0125, "step": 28550 }, { "epoch": 1680.0, "learning_rate": 7.179798994974875e-06, "loss": 0.0119, "step": 28575 }, { "epoch": 1682.0, "learning_rate": 7.177286432160805e-06, "loss": 0.013, "step": 28600 }, { "epoch": 1683.0, "learning_rate": 7.174773869346734e-06, "loss": 0.0158, "step": 28625 }, { "epoch": 1685.0, "learning_rate": 7.172261306532664e-06, "loss": 0.0142, "step": 28650 }, { "epoch": 1686.0, "learning_rate": 7.169748743718593e-06, "loss": 0.0138, "step": 28675 }, { "epoch": 1688.0, "learning_rate": 7.167236180904523e-06, "loss": 0.0115, "step": 28700 }, { "epoch": 1689.0, "learning_rate": 7.164723618090453e-06, "loss": 0.0108, "step": 28725 }, { "epoch": 1691.0, "learning_rate": 7.162211055276382e-06, "loss": 0.0237, "step": 28750 }, { "epoch": 1692.0, "learning_rate": 7.1596984924623126e-06, "loss": 0.014, "step": 28775 }, { "epoch": 1694.0, "learning_rate": 7.157185929648242e-06, "loss": 0.0162, "step": 28800 }, { "epoch": 1695.0, "learning_rate": 7.154673366834172e-06, "loss": 0.0167, "step": 28825 }, { "epoch": 1697.0, "learning_rate": 7.1521608040201005e-06, "loss": 0.0095, "step": 28850 }, { "epoch": 1698.0, "learning_rate": 7.149648241206031e-06, "loss": 0.0148, "step": 28875 }, { "epoch": 1699.0, "learning_rate": 7.14713567839196e-06, "loss": 0.011, "step": 28900 }, { "epoch": 1701.0, "learning_rate": 7.14462311557789e-06, "loss": 0.0146, "step": 28925 }, { "epoch": 1702.0, "learning_rate": 7.14211055276382e-06, "loss": 0.011, "step": 28950 }, { "epoch": 1704.0, "learning_rate": 7.139597989949749e-06, "loss": 0.0208, "step": 28975 }, { "epoch": 1705.0, "learning_rate": 7.137085427135679e-06, "loss": 0.0147, "step": 29000 }, { "epoch": 1705.0, "eval_loss": 0.5324943661689758, "eval_runtime": 172.5244, "eval_samples_per_second": 0.58, "eval_steps_per_second": 0.099, "eval_wer": 27.77142857142857, "step": 29000 }, { "epoch": 1707.0, "learning_rate": 7.134572864321608e-06, "loss": 0.0119, "step": 29025 }, { "epoch": 1708.0, "learning_rate": 7.1320603015075385e-06, "loss": 0.0147, "step": 29050 }, { "epoch": 1710.0, "learning_rate": 7.129547738693468e-06, "loss": 0.0148, "step": 29075 }, { "epoch": 1711.0, "learning_rate": 7.127035175879398e-06, "loss": 0.0093, "step": 29100 }, { "epoch": 1713.0, "learning_rate": 7.1245226130653265e-06, "loss": 0.0089, "step": 29125 }, { "epoch": 1714.0, "learning_rate": 7.122010050251257e-06, "loss": 0.0098, "step": 29150 }, { "epoch": 1716.0, "learning_rate": 7.119497487437187e-06, "loss": 0.0132, "step": 29175 }, { "epoch": 1717.0, "learning_rate": 7.116984924623116e-06, "loss": 0.0129, "step": 29200 }, { "epoch": 1719.0, "learning_rate": 7.114472361809046e-06, "loss": 0.0203, "step": 29225 }, { "epoch": 1720.0, "learning_rate": 7.111959798994975e-06, "loss": 0.018, "step": 29250 }, { "epoch": 1722.0, "learning_rate": 7.109447236180905e-06, "loss": 0.0143, "step": 29275 }, { "epoch": 1723.0, "learning_rate": 7.106934673366834e-06, "loss": 0.0089, "step": 29300 }, { "epoch": 1724.0, "learning_rate": 7.1044221105527644e-06, "loss": 0.0106, "step": 29325 }, { "epoch": 1726.0, "learning_rate": 7.101909547738695e-06, "loss": 0.0071, "step": 29350 }, { "epoch": 1727.0, "learning_rate": 7.099396984924624e-06, "loss": 0.0121, "step": 29375 }, { "epoch": 1729.0, "learning_rate": 7.096884422110554e-06, "loss": 0.0135, "step": 29400 }, { "epoch": 1730.0, "learning_rate": 7.094371859296483e-06, "loss": 0.0197, "step": 29425 }, { "epoch": 1732.0, "learning_rate": 7.091859296482413e-06, "loss": 0.0136, "step": 29450 }, { "epoch": 1733.0, "learning_rate": 7.089346733668342e-06, "loss": 0.018, "step": 29475 }, { "epoch": 1735.0, "learning_rate": 7.086834170854272e-06, "loss": 0.0212, "step": 29500 }, { "epoch": 1736.0, "learning_rate": 7.084321608040201e-06, "loss": 0.0113, "step": 29525 }, { "epoch": 1738.0, "learning_rate": 7.081809045226131e-06, "loss": 0.016, "step": 29550 }, { "epoch": 1739.0, "learning_rate": 7.079296482412061e-06, "loss": 0.0116, "step": 29575 }, { "epoch": 1741.0, "learning_rate": 7.0768844221105535e-06, "loss": 0.0216, "step": 29600 }, { "epoch": 1742.0, "learning_rate": 7.074371859296483e-06, "loss": 0.0214, "step": 29625 }, { "epoch": 1744.0, "learning_rate": 7.071859296482413e-06, "loss": 0.015, "step": 29650 }, { "epoch": 1745.0, "learning_rate": 7.069346733668342e-06, "loss": 0.0164, "step": 29675 }, { "epoch": 1747.0, "learning_rate": 7.0668341708542724e-06, "loss": 0.0151, "step": 29700 }, { "epoch": 1748.0, "learning_rate": 7.064321608040201e-06, "loss": 0.0089, "step": 29725 }, { "epoch": 1749.0, "learning_rate": 7.061809045226131e-06, "loss": 0.0088, "step": 29750 }, { "epoch": 1751.0, "learning_rate": 7.059296482412061e-06, "loss": 0.013, "step": 29775 }, { "epoch": 1752.0, "learning_rate": 7.056783919597991e-06, "loss": 0.0105, "step": 29800 }, { "epoch": 1754.0, "learning_rate": 7.054271356783921e-06, "loss": 0.0097, "step": 29825 }, { "epoch": 1755.0, "learning_rate": 7.051758793969849e-06, "loss": 0.0091, "step": 29850 }, { "epoch": 1757.0, "learning_rate": 7.049246231155779e-06, "loss": 0.013, "step": 29875 }, { "epoch": 1758.0, "learning_rate": 7.046733668341709e-06, "loss": 0.0102, "step": 29900 }, { "epoch": 1760.0, "learning_rate": 7.044221105527639e-06, "loss": 0.0133, "step": 29925 }, { "epoch": 1761.0, "learning_rate": 7.041708542713569e-06, "loss": 0.0158, "step": 29950 }, { "epoch": 1763.0, "learning_rate": 7.039195979899498e-06, "loss": 0.0132, "step": 29975 }, { "epoch": 1764.0, "learning_rate": 7.036683417085428e-06, "loss": 0.0104, "step": 30000 }, { "epoch": 1764.0, "eval_loss": 0.4817672073841095, "eval_runtime": 167.8285, "eval_samples_per_second": 0.596, "eval_steps_per_second": 0.101, "eval_wer": 26.171428571428574, "step": 30000 }, { "epoch": 1766.0, "learning_rate": 7.034170854271357e-06, "loss": 0.0122, "step": 30025 }, { "epoch": 1767.0, "learning_rate": 7.031658291457287e-06, "loss": 0.0105, "step": 30050 }, { "epoch": 1769.0, "learning_rate": 7.0291457286432165e-06, "loss": 0.0103, "step": 30075 }, { "epoch": 1770.0, "learning_rate": 7.026633165829147e-06, "loss": 0.0129, "step": 30100 }, { "epoch": 1772.0, "learning_rate": 7.024120603015075e-06, "loss": 0.01, "step": 30125 }, { "epoch": 1773.0, "learning_rate": 7.021608040201005e-06, "loss": 0.0132, "step": 30150 }, { "epoch": 1774.0, "learning_rate": 7.0190954773869355e-06, "loss": 0.0125, "step": 30175 }, { "epoch": 1776.0, "learning_rate": 7.016582914572865e-06, "loss": 0.0118, "step": 30200 }, { "epoch": 1777.0, "learning_rate": 7.014070351758795e-06, "loss": 0.0132, "step": 30225 }, { "epoch": 1779.0, "learning_rate": 7.011557788944724e-06, "loss": 0.0162, "step": 30250 }, { "epoch": 1780.0, "learning_rate": 7.0090452261306545e-06, "loss": 0.0072, "step": 30275 }, { "epoch": 1782.0, "learning_rate": 7.006532663316583e-06, "loss": 0.0134, "step": 30300 }, { "epoch": 1783.0, "learning_rate": 7.004020100502513e-06, "loss": 0.0145, "step": 30325 }, { "epoch": 1785.0, "learning_rate": 7.0015075376884425e-06, "loss": 0.0151, "step": 30350 }, { "epoch": 1786.0, "learning_rate": 6.998994974874373e-06, "loss": 0.008, "step": 30375 }, { "epoch": 1788.0, "learning_rate": 6.996482412060303e-06, "loss": 0.0113, "step": 30400 }, { "epoch": 1789.0, "learning_rate": 6.993969849246231e-06, "loss": 0.0109, "step": 30425 }, { "epoch": 1791.0, "learning_rate": 6.9914572864321615e-06, "loss": 0.009, "step": 30450 }, { "epoch": 1792.0, "learning_rate": 6.988944723618091e-06, "loss": 0.0098, "step": 30475 }, { "epoch": 1794.0, "learning_rate": 6.986432160804021e-06, "loss": 0.0124, "step": 30500 }, { "epoch": 1795.0, "learning_rate": 6.98391959798995e-06, "loss": 0.0145, "step": 30525 }, { "epoch": 1797.0, "learning_rate": 6.9814070351758804e-06, "loss": 0.0162, "step": 30550 }, { "epoch": 1798.0, "learning_rate": 6.97889447236181e-06, "loss": 0.0116, "step": 30575 }, { "epoch": 1799.0, "learning_rate": 6.976381909547739e-06, "loss": 0.0139, "step": 30600 }, { "epoch": 1801.0, "learning_rate": 6.973869346733669e-06, "loss": 0.0141, "step": 30625 }, { "epoch": 1802.0, "learning_rate": 6.971356783919599e-06, "loss": 0.0164, "step": 30650 }, { "epoch": 1804.0, "learning_rate": 6.968844221105529e-06, "loss": 0.0135, "step": 30675 }, { "epoch": 1805.0, "learning_rate": 6.966331658291457e-06, "loss": 0.0096, "step": 30700 }, { "epoch": 1807.0, "learning_rate": 6.963819095477387e-06, "loss": 0.017, "step": 30725 }, { "epoch": 1808.0, "learning_rate": 6.961306532663317e-06, "loss": 0.0149, "step": 30750 }, { "epoch": 1810.0, "learning_rate": 6.958793969849247e-06, "loss": 0.0162, "step": 30775 }, { "epoch": 1811.0, "learning_rate": 6.956281407035177e-06, "loss": 0.0084, "step": 30800 }, { "epoch": 1813.0, "learning_rate": 6.953768844221106e-06, "loss": 0.0129, "step": 30825 }, { "epoch": 1814.0, "learning_rate": 6.951256281407036e-06, "loss": 0.0092, "step": 30850 }, { "epoch": 1816.0, "learning_rate": 6.948743718592965e-06, "loss": 0.013, "step": 30875 }, { "epoch": 1817.0, "learning_rate": 6.946231155778895e-06, "loss": 0.0113, "step": 30900 }, { "epoch": 1819.0, "learning_rate": 6.9437185929648245e-06, "loss": 0.0077, "step": 30925 }, { "epoch": 1820.0, "learning_rate": 6.941206030150755e-06, "loss": 0.0157, "step": 30950 }, { "epoch": 1822.0, "learning_rate": 6.938693467336683e-06, "loss": 0.01, "step": 30975 }, { "epoch": 1823.0, "learning_rate": 6.936180904522613e-06, "loss": 0.0128, "step": 31000 }, { "epoch": 1823.0, "eval_loss": 0.5259056091308594, "eval_runtime": 171.4433, "eval_samples_per_second": 0.583, "eval_steps_per_second": 0.099, "eval_wer": 28.34285714285714, "step": 31000 }, { "epoch": 1824.0, "learning_rate": 6.9336683417085435e-06, "loss": 0.0097, "step": 31025 }, { "epoch": 1826.0, "learning_rate": 6.931155778894473e-06, "loss": 0.0088, "step": 31050 }, { "epoch": 1827.0, "learning_rate": 6.928643216080403e-06, "loss": 0.0137, "step": 31075 }, { "epoch": 1829.0, "learning_rate": 6.926130653266332e-06, "loss": 0.0124, "step": 31100 }, { "epoch": 1830.0, "learning_rate": 6.923618090452262e-06, "loss": 0.0102, "step": 31125 }, { "epoch": 1832.0, "learning_rate": 6.921105527638191e-06, "loss": 0.0108, "step": 31150 }, { "epoch": 1833.0, "learning_rate": 6.918592964824121e-06, "loss": 0.0108, "step": 31175 }, { "epoch": 1835.0, "learning_rate": 6.9160804020100505e-06, "loss": 0.0113, "step": 31200 }, { "epoch": 1836.0, "learning_rate": 6.913567839195981e-06, "loss": 0.0115, "step": 31225 }, { "epoch": 1838.0, "learning_rate": 6.911055276381911e-06, "loss": 0.013, "step": 31250 }, { "epoch": 1839.0, "learning_rate": 6.908542713567839e-06, "loss": 0.0118, "step": 31275 }, { "epoch": 1841.0, "learning_rate": 6.9060301507537695e-06, "loss": 0.008, "step": 31300 }, { "epoch": 1842.0, "learning_rate": 6.903517587939699e-06, "loss": 0.0101, "step": 31325 }, { "epoch": 1844.0, "learning_rate": 6.901005025125629e-06, "loss": 0.0116, "step": 31350 }, { "epoch": 1845.0, "learning_rate": 6.898492462311558e-06, "loss": 0.0108, "step": 31375 }, { "epoch": 1847.0, "learning_rate": 6.8959798994974884e-06, "loss": 0.0099, "step": 31400 }, { "epoch": 1848.0, "learning_rate": 6.893467336683418e-06, "loss": 0.0091, "step": 31425 }, { "epoch": 1849.0, "learning_rate": 6.890954773869347e-06, "loss": 0.0072, "step": 31450 }, { "epoch": 1851.0, "learning_rate": 6.888442211055277e-06, "loss": 0.0153, "step": 31475 }, { "epoch": 1852.0, "learning_rate": 6.885929648241207e-06, "loss": 0.0085, "step": 31500 }, { "epoch": 1854.0, "learning_rate": 6.883417085427137e-06, "loss": 0.0079, "step": 31525 }, { "epoch": 1855.0, "learning_rate": 6.880904522613065e-06, "loss": 0.0073, "step": 31550 }, { "epoch": 1857.0, "learning_rate": 6.878391959798995e-06, "loss": 0.0098, "step": 31575 }, { "epoch": 1858.0, "learning_rate": 6.875879396984925e-06, "loss": 0.0074, "step": 31600 }, { "epoch": 1860.0, "learning_rate": 6.873366834170855e-06, "loss": 0.0078, "step": 31625 }, { "epoch": 1861.0, "learning_rate": 6.870854271356785e-06, "loss": 0.0075, "step": 31650 }, { "epoch": 1863.0, "learning_rate": 6.868341708542714e-06, "loss": 0.0109, "step": 31675 }, { "epoch": 1864.0, "learning_rate": 6.865829145728644e-06, "loss": 0.0098, "step": 31700 }, { "epoch": 1866.0, "learning_rate": 6.863316582914573e-06, "loss": 0.0092, "step": 31725 }, { "epoch": 1867.0, "learning_rate": 6.860804020100503e-06, "loss": 0.0094, "step": 31750 }, { "epoch": 1869.0, "learning_rate": 6.8582914572864325e-06, "loss": 0.0095, "step": 31775 }, { "epoch": 1870.0, "learning_rate": 6.855778894472363e-06, "loss": 0.0111, "step": 31800 }, { "epoch": 1872.0, "learning_rate": 6.853266331658291e-06, "loss": 0.0131, "step": 31825 }, { "epoch": 1873.0, "learning_rate": 6.850753768844221e-06, "loss": 0.0075, "step": 31850 }, { "epoch": 1874.0, "learning_rate": 6.8482412060301515e-06, "loss": 0.0153, "step": 31875 }, { "epoch": 1876.0, "learning_rate": 6.845728643216081e-06, "loss": 0.0093, "step": 31900 }, { "epoch": 1877.0, "learning_rate": 6.843216080402011e-06, "loss": 0.0098, "step": 31925 }, { "epoch": 1879.0, "learning_rate": 6.84070351758794e-06, "loss": 0.0074, "step": 31950 }, { "epoch": 1880.0, "learning_rate": 6.83819095477387e-06, "loss": 0.0106, "step": 31975 }, { "epoch": 1882.0, "learning_rate": 6.835678391959799e-06, "loss": 0.0145, "step": 32000 }, { "epoch": 1882.0, "eval_loss": 0.5298639535903931, "eval_runtime": 168.3817, "eval_samples_per_second": 0.594, "eval_steps_per_second": 0.101, "eval_wer": 26.285714285714285, "step": 32000 }, { "epoch": 1883.0, "learning_rate": 6.833165829145729e-06, "loss": 0.0126, "step": 32025 }, { "epoch": 1885.0, "learning_rate": 6.830653266331659e-06, "loss": 0.0138, "step": 32050 }, { "epoch": 1886.0, "learning_rate": 6.828140703517589e-06, "loss": 0.0226, "step": 32075 }, { "epoch": 1888.0, "learning_rate": 6.825628140703519e-06, "loss": 0.0069, "step": 32100 }, { "epoch": 1889.0, "learning_rate": 6.823115577889447e-06, "loss": 0.0126, "step": 32125 }, { "epoch": 1891.0, "learning_rate": 6.8206030150753775e-06, "loss": 0.0102, "step": 32150 }, { "epoch": 1892.0, "learning_rate": 6.818090452261307e-06, "loss": 0.0079, "step": 32175 }, { "epoch": 1894.0, "learning_rate": 6.815577889447237e-06, "loss": 0.0109, "step": 32200 }, { "epoch": 1895.0, "learning_rate": 6.813065326633166e-06, "loss": 0.0111, "step": 32225 }, { "epoch": 1897.0, "learning_rate": 6.810552763819096e-06, "loss": 0.0068, "step": 32250 }, { "epoch": 1898.0, "learning_rate": 6.808040201005026e-06, "loss": 0.0076, "step": 32275 }, { "epoch": 1899.0, "learning_rate": 6.805527638190955e-06, "loss": 0.0116, "step": 32300 }, { "epoch": 1901.0, "learning_rate": 6.803015075376885e-06, "loss": 0.011, "step": 32325 }, { "epoch": 1902.0, "learning_rate": 6.800502512562815e-06, "loss": 0.0159, "step": 32350 }, { "epoch": 1904.0, "learning_rate": 6.797989949748745e-06, "loss": 0.0138, "step": 32375 }, { "epoch": 1905.0, "learning_rate": 6.795477386934673e-06, "loss": 0.0157, "step": 32400 }, { "epoch": 1907.0, "learning_rate": 6.792964824120603e-06, "loss": 0.0082, "step": 32425 }, { "epoch": 1908.0, "learning_rate": 6.790452261306533e-06, "loss": 0.0107, "step": 32450 }, { "epoch": 1910.0, "learning_rate": 6.787939698492463e-06, "loss": 0.009, "step": 32475 }, { "epoch": 1911.0, "learning_rate": 6.785427135678393e-06, "loss": 0.01, "step": 32500 }, { "epoch": 1913.0, "learning_rate": 6.782914572864322e-06, "loss": 0.0092, "step": 32525 }, { "epoch": 1914.0, "learning_rate": 6.780402010050252e-06, "loss": 0.0105, "step": 32550 }, { "epoch": 1916.0, "learning_rate": 6.777889447236181e-06, "loss": 0.0104, "step": 32575 }, { "epoch": 1917.0, "learning_rate": 6.775376884422111e-06, "loss": 0.0107, "step": 32600 }, { "epoch": 1919.0, "learning_rate": 6.7728643216080405e-06, "loss": 0.0133, "step": 32625 }, { "epoch": 1920.0, "learning_rate": 6.770351758793971e-06, "loss": 0.0084, "step": 32650 }, { "epoch": 1922.0, "learning_rate": 6.767839195979901e-06, "loss": 0.0083, "step": 32675 }, { "epoch": 1923.0, "learning_rate": 6.765326633165829e-06, "loss": 0.0105, "step": 32700 }, { "epoch": 1924.0, "learning_rate": 6.7628140703517595e-06, "loss": 0.0076, "step": 32725 }, { "epoch": 1926.0, "learning_rate": 6.760301507537689e-06, "loss": 0.0115, "step": 32750 }, { "epoch": 1927.0, "learning_rate": 6.757788944723619e-06, "loss": 0.0136, "step": 32775 }, { "epoch": 1929.0, "learning_rate": 6.755276381909548e-06, "loss": 0.0165, "step": 32800 }, { "epoch": 1930.0, "learning_rate": 6.752763819095478e-06, "loss": 0.0066, "step": 32825 }, { "epoch": 1932.0, "learning_rate": 6.750251256281407e-06, "loss": 0.0104, "step": 32850 }, { "epoch": 1933.0, "learning_rate": 6.747738693467337e-06, "loss": 0.0082, "step": 32875 }, { "epoch": 1935.0, "learning_rate": 6.745226130653267e-06, "loss": 0.0103, "step": 32900 }, { "epoch": 1936.0, "learning_rate": 6.742713567839197e-06, "loss": 0.0088, "step": 32925 }, { "epoch": 1938.0, "learning_rate": 6.740201005025127e-06, "loss": 0.0111, "step": 32950 }, { "epoch": 1939.0, "learning_rate": 6.737688442211055e-06, "loss": 0.0067, "step": 32975 }, { "epoch": 1941.0, "learning_rate": 6.7351758793969855e-06, "loss": 0.0075, "step": 33000 }, { "epoch": 1941.0, "eval_loss": 0.5082035660743713, "eval_runtime": 168.1697, "eval_samples_per_second": 0.595, "eval_steps_per_second": 0.101, "eval_wer": 27.42857142857143, "step": 33000 }, { "epoch": 1942.0, "learning_rate": 6.732663316582915e-06, "loss": 0.0126, "step": 33025 }, { "epoch": 1944.0, "learning_rate": 6.730150753768845e-06, "loss": 0.0074, "step": 33050 }, { "epoch": 1945.0, "learning_rate": 6.727638190954774e-06, "loss": 0.0122, "step": 33075 }, { "epoch": 1947.0, "learning_rate": 6.725125628140704e-06, "loss": 0.0089, "step": 33100 }, { "epoch": 1948.0, "learning_rate": 6.722613065326634e-06, "loss": 0.0103, "step": 33125 }, { "epoch": 1949.0, "learning_rate": 6.720100502512563e-06, "loss": 0.0085, "step": 33150 }, { "epoch": 1951.0, "learning_rate": 6.717587939698493e-06, "loss": 0.0095, "step": 33175 }, { "epoch": 1952.0, "learning_rate": 6.715075376884423e-06, "loss": 0.0055, "step": 33200 }, { "epoch": 1954.0, "learning_rate": 6.712562814070353e-06, "loss": 0.0064, "step": 33225 }, { "epoch": 1955.0, "learning_rate": 6.710050251256281e-06, "loss": 0.0097, "step": 33250 }, { "epoch": 1957.0, "learning_rate": 6.707537688442211e-06, "loss": 0.012, "step": 33275 }, { "epoch": 1958.0, "learning_rate": 6.705025125628142e-06, "loss": 0.0105, "step": 33300 }, { "epoch": 1960.0, "learning_rate": 6.702512562814071e-06, "loss": 0.0083, "step": 33325 }, { "epoch": 1961.0, "learning_rate": 6.700000000000001e-06, "loss": 0.011, "step": 33350 }, { "epoch": 1963.0, "learning_rate": 6.69748743718593e-06, "loss": 0.009, "step": 33375 }, { "epoch": 1964.0, "learning_rate": 6.69497487437186e-06, "loss": 0.0144, "step": 33400 }, { "epoch": 1966.0, "learning_rate": 6.692462311557789e-06, "loss": 0.0122, "step": 33425 }, { "epoch": 1967.0, "learning_rate": 6.689949748743719e-06, "loss": 0.0109, "step": 33450 }, { "epoch": 1969.0, "learning_rate": 6.6874371859296485e-06, "loss": 0.0095, "step": 33475 }, { "epoch": 1970.0, "learning_rate": 6.684924623115579e-06, "loss": 0.0081, "step": 33500 }, { "epoch": 1972.0, "learning_rate": 6.682412060301509e-06, "loss": 0.0105, "step": 33525 }, { "epoch": 1973.0, "learning_rate": 6.679899497487437e-06, "loss": 0.0103, "step": 33550 }, { "epoch": 1974.0, "learning_rate": 6.67748743718593e-06, "loss": 0.0094, "step": 33575 }, { "epoch": 1976.0, "learning_rate": 6.67497487437186e-06, "loss": 0.0134, "step": 33600 }, { "epoch": 1977.0, "learning_rate": 6.672462311557789e-06, "loss": 0.0081, "step": 33625 }, { "epoch": 1979.0, "learning_rate": 6.669949748743719e-06, "loss": 0.0104, "step": 33650 }, { "epoch": 1980.0, "learning_rate": 6.667437185929648e-06, "loss": 0.0081, "step": 33675 }, { "epoch": 1982.0, "learning_rate": 6.664924623115578e-06, "loss": 0.0086, "step": 33700 }, { "epoch": 1983.0, "learning_rate": 6.662412060301508e-06, "loss": 0.0104, "step": 33725 }, { "epoch": 1985.0, "learning_rate": 6.6598994974874375e-06, "loss": 0.012, "step": 33750 }, { "epoch": 1986.0, "learning_rate": 6.657386934673368e-06, "loss": 0.007, "step": 33775 }, { "epoch": 1988.0, "learning_rate": 6.654874371859297e-06, "loss": 0.0114, "step": 33800 }, { "epoch": 1989.0, "learning_rate": 6.652361809045227e-06, "loss": 0.0113, "step": 33825 }, { "epoch": 1991.0, "learning_rate": 6.649849246231156e-06, "loss": 0.0078, "step": 33850 }, { "epoch": 1992.0, "learning_rate": 6.647336683417086e-06, "loss": 0.0045, "step": 33875 }, { "epoch": 1994.0, "learning_rate": 6.644824120603015e-06, "loss": 0.009, "step": 33900 }, { "epoch": 1995.0, "learning_rate": 6.642311557788945e-06, "loss": 0.0088, "step": 33925 }, { "epoch": 1997.0, "learning_rate": 6.6397989949748755e-06, "loss": 0.0065, "step": 33950 }, { "epoch": 1998.0, "learning_rate": 6.637286432160804e-06, "loss": 0.0094, "step": 33975 }, { "epoch": 1999.0, "learning_rate": 6.634773869346734e-06, "loss": 0.0087, "step": 34000 }, { "epoch": 1999.0, "eval_loss": 0.514407753944397, "eval_runtime": 168.9801, "eval_samples_per_second": 0.592, "eval_steps_per_second": 0.101, "eval_wer": 26.62857142857143, "step": 34000 }, { "epoch": 2001.0, "learning_rate": 6.6322613065326635e-06, "loss": 0.0073, "step": 34025 }, { "epoch": 2002.0, "learning_rate": 6.629748743718594e-06, "loss": 0.011, "step": 34050 }, { "epoch": 2004.0, "learning_rate": 6.627236180904523e-06, "loss": 0.0129, "step": 34075 }, { "epoch": 2005.0, "learning_rate": 6.624723618090453e-06, "loss": 0.0104, "step": 34100 }, { "epoch": 2007.0, "learning_rate": 6.622211055276383e-06, "loss": 0.0108, "step": 34125 }, { "epoch": 2008.0, "learning_rate": 6.619698492462312e-06, "loss": 0.0092, "step": 34150 }, { "epoch": 2010.0, "learning_rate": 6.617185929648242e-06, "loss": 0.0076, "step": 34175 }, { "epoch": 2011.0, "learning_rate": 6.614673366834171e-06, "loss": 0.0086, "step": 34200 }, { "epoch": 2013.0, "learning_rate": 6.6121608040201015e-06, "loss": 0.0103, "step": 34225 }, { "epoch": 2014.0, "learning_rate": 6.60964824120603e-06, "loss": 0.0075, "step": 34250 }, { "epoch": 2016.0, "learning_rate": 6.60713567839196e-06, "loss": 0.012, "step": 34275 }, { "epoch": 2017.0, "learning_rate": 6.6046231155778894e-06, "loss": 0.0098, "step": 34300 }, { "epoch": 2019.0, "learning_rate": 6.60211055276382e-06, "loss": 0.0111, "step": 34325 }, { "epoch": 2020.0, "learning_rate": 6.59959798994975e-06, "loss": 0.0105, "step": 34350 }, { "epoch": 2022.0, "learning_rate": 6.597085427135679e-06, "loss": 0.0042, "step": 34375 }, { "epoch": 2023.0, "learning_rate": 6.594572864321609e-06, "loss": 0.0098, "step": 34400 }, { "epoch": 2024.0, "learning_rate": 6.592060301507538e-06, "loss": 0.0081, "step": 34425 }, { "epoch": 2026.0, "learning_rate": 6.589547738693468e-06, "loss": 0.0077, "step": 34450 }, { "epoch": 2027.0, "learning_rate": 6.587035175879397e-06, "loss": 0.0084, "step": 34475 }, { "epoch": 2029.0, "learning_rate": 6.584522613065327e-06, "loss": 0.0081, "step": 34500 }, { "epoch": 2030.0, "learning_rate": 6.582010050251256e-06, "loss": 0.0042, "step": 34525 }, { "epoch": 2032.0, "learning_rate": 6.579497487437186e-06, "loss": 0.0101, "step": 34550 }, { "epoch": 2033.0, "learning_rate": 6.576984924623116e-06, "loss": 0.0098, "step": 34575 }, { "epoch": 2035.0, "learning_rate": 6.5744723618090455e-06, "loss": 0.0163, "step": 34600 }, { "epoch": 2036.0, "learning_rate": 6.571959798994976e-06, "loss": 0.006, "step": 34625 }, { "epoch": 2038.0, "learning_rate": 6.569447236180905e-06, "loss": 0.008, "step": 34650 }, { "epoch": 2039.0, "learning_rate": 6.566934673366835e-06, "loss": 0.0083, "step": 34675 }, { "epoch": 2041.0, "learning_rate": 6.564422110552764e-06, "loss": 0.0103, "step": 34700 }, { "epoch": 2042.0, "learning_rate": 6.561909547738694e-06, "loss": 0.0082, "step": 34725 }, { "epoch": 2044.0, "learning_rate": 6.559396984924624e-06, "loss": 0.0089, "step": 34750 }, { "epoch": 2045.0, "learning_rate": 6.556884422110553e-06, "loss": 0.0114, "step": 34775 }, { "epoch": 2047.0, "learning_rate": 6.5543718592964835e-06, "loss": 0.0095, "step": 34800 }, { "epoch": 2048.0, "learning_rate": 6.551859296482412e-06, "loss": 0.0112, "step": 34825 }, { "epoch": 2049.0, "learning_rate": 6.549346733668342e-06, "loss": 0.0091, "step": 34850 }, { "epoch": 2051.0, "learning_rate": 6.5468341708542715e-06, "loss": 0.0093, "step": 34875 }, { "epoch": 2052.0, "learning_rate": 6.544321608040202e-06, "loss": 0.0057, "step": 34900 }, { "epoch": 2054.0, "learning_rate": 6.541809045226131e-06, "loss": 0.0058, "step": 34925 }, { "epoch": 2055.0, "learning_rate": 6.539296482412061e-06, "loss": 0.0055, "step": 34950 }, { "epoch": 2057.0, "learning_rate": 6.536783919597991e-06, "loss": 0.0123, "step": 34975 }, { "epoch": 2058.0, "learning_rate": 6.534371859296484e-06, "loss": 0.005, "step": 35000 }, { "epoch": 2058.0, "eval_loss": 0.5590147376060486, "eval_runtime": 167.2891, "eval_samples_per_second": 0.598, "eval_steps_per_second": 0.102, "eval_wer": 27.085714285714285, "step": 35000 }, { "epoch": 2060.0, "learning_rate": 6.531859296482412e-06, "loss": 0.0055, "step": 35025 }, { "epoch": 2061.0, "learning_rate": 6.529346733668342e-06, "loss": 0.0084, "step": 35050 }, { "epoch": 2063.0, "learning_rate": 6.526834170854272e-06, "loss": 0.0082, "step": 35075 }, { "epoch": 2064.0, "learning_rate": 6.524321608040202e-06, "loss": 0.0057, "step": 35100 }, { "epoch": 2066.0, "learning_rate": 6.52180904522613e-06, "loss": 0.0062, "step": 35125 }, { "epoch": 2067.0, "learning_rate": 6.5192964824120605e-06, "loss": 0.0068, "step": 35150 }, { "epoch": 2069.0, "learning_rate": 6.516783919597991e-06, "loss": 0.0063, "step": 35175 }, { "epoch": 2070.0, "learning_rate": 6.51427135678392e-06, "loss": 0.0071, "step": 35200 }, { "epoch": 2072.0, "learning_rate": 6.51175879396985e-06, "loss": 0.0035, "step": 35225 }, { "epoch": 2073.0, "learning_rate": 6.5092462311557795e-06, "loss": 0.0145, "step": 35250 }, { "epoch": 2074.0, "learning_rate": 6.50673366834171e-06, "loss": 0.0135, "step": 35275 }, { "epoch": 2076.0, "learning_rate": 6.504221105527638e-06, "loss": 0.0071, "step": 35300 }, { "epoch": 2077.0, "learning_rate": 6.501708542713568e-06, "loss": 0.012, "step": 35325 }, { "epoch": 2079.0, "learning_rate": 6.499195979899498e-06, "loss": 0.0073, "step": 35350 }, { "epoch": 2080.0, "learning_rate": 6.496683417085428e-06, "loss": 0.0071, "step": 35375 }, { "epoch": 2082.0, "learning_rate": 6.494170854271358e-06, "loss": 0.0098, "step": 35400 }, { "epoch": 2083.0, "learning_rate": 6.4916582914572864e-06, "loss": 0.0063, "step": 35425 }, { "epoch": 2085.0, "learning_rate": 6.489145728643217e-06, "loss": 0.0073, "step": 35450 }, { "epoch": 2086.0, "learning_rate": 6.486633165829146e-06, "loss": 0.0057, "step": 35475 }, { "epoch": 2088.0, "learning_rate": 6.484120603015076e-06, "loss": 0.0102, "step": 35500 }, { "epoch": 2089.0, "learning_rate": 6.4816080402010054e-06, "loss": 0.0136, "step": 35525 }, { "epoch": 2091.0, "learning_rate": 6.479095477386936e-06, "loss": 0.0104, "step": 35550 }, { "epoch": 2092.0, "learning_rate": 6.476582914572866e-06, "loss": 0.0074, "step": 35575 }, { "epoch": 2094.0, "learning_rate": 6.474070351758794e-06, "loss": 0.0079, "step": 35600 }, { "epoch": 2095.0, "learning_rate": 6.471557788944724e-06, "loss": 0.0079, "step": 35625 }, { "epoch": 2097.0, "learning_rate": 6.469045226130654e-06, "loss": 0.0083, "step": 35650 }, { "epoch": 2098.0, "learning_rate": 6.466532663316584e-06, "loss": 0.0084, "step": 35675 }, { "epoch": 2099.0, "learning_rate": 6.464020100502512e-06, "loss": 0.0114, "step": 35700 }, { "epoch": 2101.0, "learning_rate": 6.4615075376884426e-06, "loss": 0.0096, "step": 35725 }, { "epoch": 2102.0, "learning_rate": 6.458994974874372e-06, "loss": 0.0111, "step": 35750 }, { "epoch": 2104.0, "learning_rate": 6.456482412060302e-06, "loss": 0.0066, "step": 35775 }, { "epoch": 2105.0, "learning_rate": 6.453969849246232e-06, "loss": 0.0071, "step": 35800 }, { "epoch": 2107.0, "learning_rate": 6.4514572864321615e-06, "loss": 0.012, "step": 35825 }, { "epoch": 2108.0, "learning_rate": 6.448944723618092e-06, "loss": 0.0064, "step": 35850 }, { "epoch": 2110.0, "learning_rate": 6.44643216080402e-06, "loss": 0.0105, "step": 35875 }, { "epoch": 2111.0, "learning_rate": 6.44391959798995e-06, "loss": 0.0073, "step": 35900 }, { "epoch": 2113.0, "learning_rate": 6.44140703517588e-06, "loss": 0.0082, "step": 35925 }, { "epoch": 2114.0, "learning_rate": 6.43889447236181e-06, "loss": 0.0064, "step": 35950 }, { "epoch": 2116.0, "learning_rate": 6.436381909547738e-06, "loss": 0.0107, "step": 35975 }, { "epoch": 2117.0, "learning_rate": 6.4338693467336685e-06, "loss": 0.0099, "step": 36000 }, { "epoch": 2117.0, "eval_loss": 0.5545507669448853, "eval_runtime": 166.0781, "eval_samples_per_second": 0.602, "eval_steps_per_second": 0.102, "eval_wer": 28.914285714285715, "step": 36000 }, { "epoch": 2119.0, "learning_rate": 6.431356783919599e-06, "loss": 0.0091, "step": 36025 }, { "epoch": 2120.0, "learning_rate": 6.428844221105528e-06, "loss": 0.0069, "step": 36050 }, { "epoch": 2122.0, "learning_rate": 6.426331658291458e-06, "loss": 0.0094, "step": 36075 }, { "epoch": 2123.0, "learning_rate": 6.4238190954773875e-06, "loss": 0.0054, "step": 36100 }, { "epoch": 2124.0, "learning_rate": 6.421306532663318e-06, "loss": 0.0096, "step": 36125 }, { "epoch": 2126.0, "learning_rate": 6.418793969849246e-06, "loss": 0.0062, "step": 36150 }, { "epoch": 2127.0, "learning_rate": 6.416281407035176e-06, "loss": 0.0094, "step": 36175 }, { "epoch": 2129.0, "learning_rate": 6.4137688442211065e-06, "loss": 0.0066, "step": 36200 }, { "epoch": 2130.0, "learning_rate": 6.411256281407036e-06, "loss": 0.0077, "step": 36225 }, { "epoch": 2132.0, "learning_rate": 6.408743718592966e-06, "loss": 0.0076, "step": 36250 }, { "epoch": 2133.0, "learning_rate": 6.4062311557788944e-06, "loss": 0.0082, "step": 36275 }, { "epoch": 2135.0, "learning_rate": 6.403718592964825e-06, "loss": 0.0058, "step": 36300 }, { "epoch": 2136.0, "learning_rate": 6.401206030150754e-06, "loss": 0.0097, "step": 36325 }, { "epoch": 2138.0, "learning_rate": 6.398693467336684e-06, "loss": 0.0075, "step": 36350 }, { "epoch": 2139.0, "learning_rate": 6.3961809045226134e-06, "loss": 0.0051, "step": 36375 }, { "epoch": 2141.0, "learning_rate": 6.393668341708544e-06, "loss": 0.0064, "step": 36400 }, { "epoch": 2142.0, "learning_rate": 6.391155778894474e-06, "loss": 0.0061, "step": 36425 }, { "epoch": 2144.0, "learning_rate": 6.388643216080402e-06, "loss": 0.0069, "step": 36450 }, { "epoch": 2145.0, "learning_rate": 6.386130653266332e-06, "loss": 0.0103, "step": 36475 }, { "epoch": 2147.0, "learning_rate": 6.383618090452262e-06, "loss": 0.007, "step": 36500 }, { "epoch": 2148.0, "learning_rate": 6.381105527638192e-06, "loss": 0.0104, "step": 36525 }, { "epoch": 2149.0, "learning_rate": 6.37859296482412e-06, "loss": 0.007, "step": 36550 }, { "epoch": 2151.0, "learning_rate": 6.3760804020100506e-06, "loss": 0.008, "step": 36575 }, { "epoch": 2152.0, "learning_rate": 6.37356783919598e-06, "loss": 0.0052, "step": 36600 }, { "epoch": 2154.0, "learning_rate": 6.37105527638191e-06, "loss": 0.0119, "step": 36625 }, { "epoch": 2155.0, "learning_rate": 6.36854271356784e-06, "loss": 0.007, "step": 36650 }, { "epoch": 2157.0, "learning_rate": 6.3660301507537695e-06, "loss": 0.0044, "step": 36675 }, { "epoch": 2158.0, "learning_rate": 6.3635175879397e-06, "loss": 0.0102, "step": 36700 }, { "epoch": 2160.0, "learning_rate": 6.361005025125628e-06, "loss": 0.0063, "step": 36725 }, { "epoch": 2161.0, "learning_rate": 6.358492462311558e-06, "loss": 0.0118, "step": 36750 }, { "epoch": 2163.0, "learning_rate": 6.355979899497488e-06, "loss": 0.0037, "step": 36775 }, { "epoch": 2164.0, "learning_rate": 6.353467336683418e-06, "loss": 0.0056, "step": 36800 }, { "epoch": 2166.0, "learning_rate": 6.350954773869348e-06, "loss": 0.0059, "step": 36825 }, { "epoch": 2167.0, "learning_rate": 6.3484422110552765e-06, "loss": 0.0081, "step": 36850 }, { "epoch": 2169.0, "learning_rate": 6.345929648241207e-06, "loss": 0.0091, "step": 36875 }, { "epoch": 2170.0, "learning_rate": 6.343417085427136e-06, "loss": 0.0083, "step": 36900 }, { "epoch": 2172.0, "learning_rate": 6.340904522613066e-06, "loss": 0.015, "step": 36925 }, { "epoch": 2173.0, "learning_rate": 6.3383919597989955e-06, "loss": 0.008, "step": 36950 }, { "epoch": 2174.0, "learning_rate": 6.335879396984926e-06, "loss": 0.0054, "step": 36975 }, { "epoch": 2176.0, "learning_rate": 6.333366834170854e-06, "loss": 0.007, "step": 37000 }, { "epoch": 2176.0, "eval_loss": 0.5364224910736084, "eval_runtime": 166.6326, "eval_samples_per_second": 0.6, "eval_steps_per_second": 0.102, "eval_wer": 26.857142857142858, "step": 37000 }, { "epoch": 2177.0, "learning_rate": 6.330854271356784e-06, "loss": 0.0056, "step": 37025 }, { "epoch": 2179.0, "learning_rate": 6.3283417085427145e-06, "loss": 0.0169, "step": 37050 }, { "epoch": 2180.0, "learning_rate": 6.325829145728644e-06, "loss": 0.0117, "step": 37075 }, { "epoch": 2182.0, "learning_rate": 6.323316582914574e-06, "loss": 0.0067, "step": 37100 }, { "epoch": 2183.0, "learning_rate": 6.3208040201005024e-06, "loss": 0.0105, "step": 37125 }, { "epoch": 2185.0, "learning_rate": 6.318291457286433e-06, "loss": 0.0094, "step": 37150 }, { "epoch": 2186.0, "learning_rate": 6.315778894472362e-06, "loss": 0.0121, "step": 37175 }, { "epoch": 2188.0, "learning_rate": 6.313266331658292e-06, "loss": 0.0092, "step": 37200 }, { "epoch": 2189.0, "learning_rate": 6.3107537688442214e-06, "loss": 0.0048, "step": 37225 }, { "epoch": 2191.0, "learning_rate": 6.308241206030152e-06, "loss": 0.0086, "step": 37250 }, { "epoch": 2192.0, "learning_rate": 6.305728643216082e-06, "loss": 0.0089, "step": 37275 }, { "epoch": 2194.0, "learning_rate": 6.30321608040201e-06, "loss": 0.0069, "step": 37300 }, { "epoch": 2195.0, "learning_rate": 6.30070351758794e-06, "loss": 0.0078, "step": 37325 }, { "epoch": 2197.0, "learning_rate": 6.29819095477387e-06, "loss": 0.0074, "step": 37350 }, { "epoch": 2198.0, "learning_rate": 6.2956783919598e-06, "loss": 0.0079, "step": 37375 }, { "epoch": 2199.0, "learning_rate": 6.293165829145728e-06, "loss": 0.006, "step": 37400 }, { "epoch": 2201.0, "learning_rate": 6.2906532663316586e-06, "loss": 0.0065, "step": 37425 }, { "epoch": 2202.0, "learning_rate": 6.288140703517589e-06, "loss": 0.0048, "step": 37450 }, { "epoch": 2204.0, "learning_rate": 6.285628140703518e-06, "loss": 0.0061, "step": 37475 }, { "epoch": 2205.0, "learning_rate": 6.283115577889448e-06, "loss": 0.0049, "step": 37500 }, { "epoch": 2207.0, "learning_rate": 6.2806030150753776e-06, "loss": 0.005, "step": 37525 }, { "epoch": 2208.0, "learning_rate": 6.278090452261308e-06, "loss": 0.0057, "step": 37550 }, { "epoch": 2210.0, "learning_rate": 6.275577889447236e-06, "loss": 0.0062, "step": 37575 }, { "epoch": 2211.0, "learning_rate": 6.273065326633166e-06, "loss": 0.007, "step": 37600 }, { "epoch": 2213.0, "learning_rate": 6.270552763819096e-06, "loss": 0.0054, "step": 37625 }, { "epoch": 2214.0, "learning_rate": 6.268040201005026e-06, "loss": 0.0062, "step": 37650 }, { "epoch": 2216.0, "learning_rate": 6.265527638190956e-06, "loss": 0.0057, "step": 37675 }, { "epoch": 2217.0, "learning_rate": 6.2630150753768845e-06, "loss": 0.0102, "step": 37700 }, { "epoch": 2219.0, "learning_rate": 6.260502512562815e-06, "loss": 0.0072, "step": 37725 }, { "epoch": 2220.0, "learning_rate": 6.257989949748744e-06, "loss": 0.0109, "step": 37750 }, { "epoch": 2222.0, "learning_rate": 6.255477386934674e-06, "loss": 0.007, "step": 37775 }, { "epoch": 2223.0, "learning_rate": 6.2529648241206035e-06, "loss": 0.0096, "step": 37800 }, { "epoch": 2224.0, "learning_rate": 6.250452261306534e-06, "loss": 0.0098, "step": 37825 }, { "epoch": 2226.0, "learning_rate": 6.247939698492462e-06, "loss": 0.0062, "step": 37850 }, { "epoch": 2227.0, "learning_rate": 6.245427135678392e-06, "loss": 0.0069, "step": 37875 }, { "epoch": 2229.0, "learning_rate": 6.2429145728643225e-06, "loss": 0.0093, "step": 37900 }, { "epoch": 2230.0, "learning_rate": 6.240402010050252e-06, "loss": 0.0084, "step": 37925 }, { "epoch": 2232.0, "learning_rate": 6.237889447236182e-06, "loss": 0.0059, "step": 37950 }, { "epoch": 2233.0, "learning_rate": 6.2353768844221105e-06, "loss": 0.0071, "step": 37975 }, { "epoch": 2235.0, "learning_rate": 6.232864321608041e-06, "loss": 0.0045, "step": 38000 }, { "epoch": 2235.0, "eval_loss": 0.557407796382904, "eval_runtime": 167.0508, "eval_samples_per_second": 0.599, "eval_steps_per_second": 0.102, "eval_wer": 27.200000000000003, "step": 38000 }, { "epoch": 2236.0, "learning_rate": 6.23035175879397e-06, "loss": 0.006, "step": 38025 }, { "epoch": 2238.0, "learning_rate": 6.2278391959799e-06, "loss": 0.0072, "step": 38050 }, { "epoch": 2239.0, "learning_rate": 6.22532663316583e-06, "loss": 0.0054, "step": 38075 }, { "epoch": 2241.0, "learning_rate": 6.22281407035176e-06, "loss": 0.0044, "step": 38100 }, { "epoch": 2242.0, "learning_rate": 6.220301507537689e-06, "loss": 0.0088, "step": 38125 }, { "epoch": 2244.0, "learning_rate": 6.217788944723618e-06, "loss": 0.0085, "step": 38150 }, { "epoch": 2245.0, "learning_rate": 6.2152763819095484e-06, "loss": 0.0111, "step": 38175 }, { "epoch": 2247.0, "learning_rate": 6.212763819095478e-06, "loss": 0.0074, "step": 38200 }, { "epoch": 2248.0, "learning_rate": 6.210251256281408e-06, "loss": 0.0095, "step": 38225 }, { "epoch": 2249.0, "learning_rate": 6.207738693467336e-06, "loss": 0.0051, "step": 38250 }, { "epoch": 2251.0, "learning_rate": 6.2052261306532666e-06, "loss": 0.0146, "step": 38275 }, { "epoch": 2252.0, "learning_rate": 6.202713567839197e-06, "loss": 0.0094, "step": 38300 }, { "epoch": 2254.0, "learning_rate": 6.200201005025126e-06, "loss": 0.0105, "step": 38325 }, { "epoch": 2255.0, "learning_rate": 6.197688442211056e-06, "loss": 0.006, "step": 38350 }, { "epoch": 2257.0, "learning_rate": 6.1951758793969856e-06, "loss": 0.0111, "step": 38375 }, { "epoch": 2258.0, "learning_rate": 6.192663316582916e-06, "loss": 0.0072, "step": 38400 }, { "epoch": 2260.0, "learning_rate": 6.190150753768844e-06, "loss": 0.0072, "step": 38425 }, { "epoch": 2261.0, "learning_rate": 6.187638190954774e-06, "loss": 0.0056, "step": 38450 }, { "epoch": 2263.0, "learning_rate": 6.185125628140704e-06, "loss": 0.0059, "step": 38475 }, { "epoch": 2264.0, "learning_rate": 6.182613065326634e-06, "loss": 0.0076, "step": 38500 }, { "epoch": 2266.0, "learning_rate": 6.180100502512564e-06, "loss": 0.008, "step": 38525 }, { "epoch": 2267.0, "learning_rate": 6.1775879396984925e-06, "loss": 0.0088, "step": 38550 }, { "epoch": 2269.0, "learning_rate": 6.175075376884423e-06, "loss": 0.0067, "step": 38575 }, { "epoch": 2270.0, "learning_rate": 6.172562814070352e-06, "loss": 0.008, "step": 38600 }, { "epoch": 2272.0, "learning_rate": 6.170050251256282e-06, "loss": 0.0088, "step": 38625 }, { "epoch": 2273.0, "learning_rate": 6.1675376884422115e-06, "loss": 0.0113, "step": 38650 }, { "epoch": 2274.0, "learning_rate": 6.165025125628142e-06, "loss": 0.0093, "step": 38675 }, { "epoch": 2276.0, "learning_rate": 6.162512562814071e-06, "loss": 0.0083, "step": 38700 }, { "epoch": 2277.0, "learning_rate": 6.16e-06, "loss": 0.0061, "step": 38725 }, { "epoch": 2279.0, "learning_rate": 6.1574874371859305e-06, "loss": 0.0065, "step": 38750 }, { "epoch": 2280.0, "learning_rate": 6.15497487437186e-06, "loss": 0.0055, "step": 38775 }, { "epoch": 2282.0, "learning_rate": 6.15246231155779e-06, "loss": 0.006, "step": 38800 }, { "epoch": 2283.0, "learning_rate": 6.1499497487437185e-06, "loss": 0.0077, "step": 38825 }, { "epoch": 2285.0, "learning_rate": 6.147437185929649e-06, "loss": 0.0082, "step": 38850 }, { "epoch": 2286.0, "learning_rate": 6.144924623115578e-06, "loss": 0.0071, "step": 38875 }, { "epoch": 2288.0, "learning_rate": 6.142412060301508e-06, "loss": 0.006, "step": 38900 }, { "epoch": 2289.0, "learning_rate": 6.139899497487438e-06, "loss": 0.0059, "step": 38925 }, { "epoch": 2291.0, "learning_rate": 6.137386934673368e-06, "loss": 0.0049, "step": 38950 }, { "epoch": 2292.0, "learning_rate": 6.134874371859297e-06, "loss": 0.0061, "step": 38975 }, { "epoch": 2294.0, "learning_rate": 6.132361809045226e-06, "loss": 0.0064, "step": 39000 }, { "epoch": 2294.0, "eval_loss": 0.5051302313804626, "eval_runtime": 164.9112, "eval_samples_per_second": 0.606, "eval_steps_per_second": 0.103, "eval_wer": 25.71428571428571, "step": 39000 }, { "epoch": 2295.0, "learning_rate": 6.1298492462311564e-06, "loss": 0.0083, "step": 39025 }, { "epoch": 2297.0, "learning_rate": 6.127336683417086e-06, "loss": 0.0043, "step": 39050 }, { "epoch": 2298.0, "learning_rate": 6.124824120603016e-06, "loss": 0.0046, "step": 39075 }, { "epoch": 2299.0, "learning_rate": 6.122311557788944e-06, "loss": 0.0069, "step": 39100 }, { "epoch": 2301.0, "learning_rate": 6.1197989949748746e-06, "loss": 0.0107, "step": 39125 }, { "epoch": 2302.0, "learning_rate": 6.117286432160805e-06, "loss": 0.0051, "step": 39150 }, { "epoch": 2304.0, "learning_rate": 6.114773869346734e-06, "loss": 0.0086, "step": 39175 }, { "epoch": 2305.0, "learning_rate": 6.112261306532664e-06, "loss": 0.0061, "step": 39200 }, { "epoch": 2307.0, "learning_rate": 6.1097487437185936e-06, "loss": 0.0088, "step": 39225 }, { "epoch": 2308.0, "learning_rate": 6.107236180904524e-06, "loss": 0.0051, "step": 39250 }, { "epoch": 2310.0, "learning_rate": 6.104723618090452e-06, "loss": 0.007, "step": 39275 }, { "epoch": 2311.0, "learning_rate": 6.102211055276382e-06, "loss": 0.0043, "step": 39300 }, { "epoch": 2313.0, "learning_rate": 6.0996984924623125e-06, "loss": 0.006, "step": 39325 }, { "epoch": 2314.0, "learning_rate": 6.097185929648242e-06, "loss": 0.006, "step": 39350 }, { "epoch": 2316.0, "learning_rate": 6.094673366834172e-06, "loss": 0.0066, "step": 39375 }, { "epoch": 2317.0, "learning_rate": 6.0921608040201005e-06, "loss": 0.0096, "step": 39400 }, { "epoch": 2319.0, "learning_rate": 6.089648241206031e-06, "loss": 0.0089, "step": 39425 }, { "epoch": 2320.0, "learning_rate": 6.08713567839196e-06, "loss": 0.0056, "step": 39450 }, { "epoch": 2322.0, "learning_rate": 6.08462311557789e-06, "loss": 0.0103, "step": 39475 }, { "epoch": 2323.0, "learning_rate": 6.0821105527638195e-06, "loss": 0.0058, "step": 39500 }, { "epoch": 2324.0, "learning_rate": 6.07959798994975e-06, "loss": 0.0062, "step": 39525 }, { "epoch": 2326.0, "learning_rate": 6.077085427135679e-06, "loss": 0.0062, "step": 39550 }, { "epoch": 2327.0, "learning_rate": 6.074572864321608e-06, "loss": 0.0054, "step": 39575 }, { "epoch": 2329.0, "learning_rate": 6.0720603015075385e-06, "loss": 0.0077, "step": 39600 }, { "epoch": 2330.0, "learning_rate": 6.069547738693468e-06, "loss": 0.0046, "step": 39625 }, { "epoch": 2332.0, "learning_rate": 6.067035175879398e-06, "loss": 0.0064, "step": 39650 }, { "epoch": 2333.0, "learning_rate": 6.0645226130653265e-06, "loss": 0.0069, "step": 39675 }, { "epoch": 2335.0, "learning_rate": 6.062010050251257e-06, "loss": 0.0057, "step": 39700 }, { "epoch": 2336.0, "learning_rate": 6.059497487437186e-06, "loss": 0.0066, "step": 39725 }, { "epoch": 2338.0, "learning_rate": 6.056984924623116e-06, "loss": 0.0065, "step": 39750 }, { "epoch": 2339.0, "learning_rate": 6.054472361809046e-06, "loss": 0.0061, "step": 39775 }, { "epoch": 2341.0, "learning_rate": 6.051959798994976e-06, "loss": 0.0081, "step": 39800 }, { "epoch": 2342.0, "learning_rate": 6.049447236180905e-06, "loss": 0.005, "step": 39825 }, { "epoch": 2344.0, "learning_rate": 6.046934673366834e-06, "loss": 0.0085, "step": 39850 }, { "epoch": 2345.0, "learning_rate": 6.0444221105527644e-06, "loss": 0.0052, "step": 39875 }, { "epoch": 2347.0, "learning_rate": 6.041909547738694e-06, "loss": 0.0049, "step": 39900 }, { "epoch": 2348.0, "learning_rate": 6.039396984924624e-06, "loss": 0.007, "step": 39925 }, { "epoch": 2349.0, "learning_rate": 6.036884422110554e-06, "loss": 0.0056, "step": 39950 }, { "epoch": 2351.0, "learning_rate": 6.0343718592964826e-06, "loss": 0.0061, "step": 39975 }, { "epoch": 2352.0, "learning_rate": 6.031859296482413e-06, "loss": 0.0079, "step": 40000 }, { "epoch": 2352.0, "eval_loss": 0.524686872959137, "eval_runtime": 164.0713, "eval_samples_per_second": 0.609, "eval_steps_per_second": 0.104, "eval_wer": 25.942857142857147, "step": 40000 }, { "epoch": 2354.0, "learning_rate": 6.029346733668342e-06, "loss": 0.0053, "step": 40025 }, { "epoch": 2355.0, "learning_rate": 6.026834170854272e-06, "loss": 0.0061, "step": 40050 }, { "epoch": 2357.0, "learning_rate": 6.0243216080402016e-06, "loss": 0.0061, "step": 40075 }, { "epoch": 2358.0, "learning_rate": 6.021809045226131e-06, "loss": 0.0051, "step": 40100 }, { "epoch": 2360.0, "learning_rate": 6.01929648241206e-06, "loss": 0.0041, "step": 40125 }, { "epoch": 2361.0, "learning_rate": 6.01678391959799e-06, "loss": 0.0071, "step": 40150 }, { "epoch": 2363.0, "learning_rate": 6.0142713567839205e-06, "loss": 0.0051, "step": 40175 }, { "epoch": 2364.0, "learning_rate": 6.01175879396985e-06, "loss": 0.0068, "step": 40200 }, { "epoch": 2366.0, "learning_rate": 6.00924623115578e-06, "loss": 0.0089, "step": 40225 }, { "epoch": 2367.0, "learning_rate": 6.0067336683417085e-06, "loss": 0.0043, "step": 40250 }, { "epoch": 2369.0, "learning_rate": 6.004221105527639e-06, "loss": 0.0054, "step": 40275 }, { "epoch": 2370.0, "learning_rate": 6.001708542713568e-06, "loss": 0.0054, "step": 40300 }, { "epoch": 2372.0, "learning_rate": 5.999195979899498e-06, "loss": 0.0058, "step": 40325 }, { "epoch": 2373.0, "learning_rate": 5.9966834170854275e-06, "loss": 0.0075, "step": 40350 }, { "epoch": 2374.0, "learning_rate": 5.994170854271358e-06, "loss": 0.0077, "step": 40375 }, { "epoch": 2376.0, "learning_rate": 5.991658291457287e-06, "loss": 0.0062, "step": 40400 }, { "epoch": 2377.0, "learning_rate": 5.989145728643216e-06, "loss": 0.0052, "step": 40425 }, { "epoch": 2379.0, "learning_rate": 5.9866331658291465e-06, "loss": 0.0057, "step": 40450 }, { "epoch": 2380.0, "learning_rate": 5.984120603015076e-06, "loss": 0.0037, "step": 40475 }, { "epoch": 2382.0, "learning_rate": 5.981608040201006e-06, "loss": 0.0065, "step": 40500 }, { "epoch": 2383.0, "learning_rate": 5.9790954773869345e-06, "loss": 0.0059, "step": 40525 }, { "epoch": 2385.0, "learning_rate": 5.976582914572865e-06, "loss": 0.0134, "step": 40550 }, { "epoch": 2386.0, "learning_rate": 5.974070351758794e-06, "loss": 0.0056, "step": 40575 }, { "epoch": 2388.0, "learning_rate": 5.971557788944724e-06, "loss": 0.0039, "step": 40600 }, { "epoch": 2389.0, "learning_rate": 5.969045226130654e-06, "loss": 0.0072, "step": 40625 }, { "epoch": 2391.0, "learning_rate": 5.966532663316584e-06, "loss": 0.0103, "step": 40650 }, { "epoch": 2392.0, "learning_rate": 5.964020100502513e-06, "loss": 0.0086, "step": 40675 }, { "epoch": 2394.0, "learning_rate": 5.961507537688442e-06, "loss": 0.0024, "step": 40700 }, { "epoch": 2395.0, "learning_rate": 5.9589949748743724e-06, "loss": 0.0038, "step": 40725 }, { "epoch": 2397.0, "learning_rate": 5.956482412060302e-06, "loss": 0.0066, "step": 40750 }, { "epoch": 2398.0, "learning_rate": 5.953969849246232e-06, "loss": 0.0057, "step": 40775 }, { "epoch": 2399.0, "learning_rate": 5.951457286432162e-06, "loss": 0.0086, "step": 40800 }, { "epoch": 2401.0, "learning_rate": 5.9489447236180906e-06, "loss": 0.0176, "step": 40825 }, { "epoch": 2402.0, "learning_rate": 5.946432160804021e-06, "loss": 0.0062, "step": 40850 }, { "epoch": 2404.0, "learning_rate": 5.94391959798995e-06, "loss": 0.0082, "step": 40875 }, { "epoch": 2405.0, "learning_rate": 5.94140703517588e-06, "loss": 0.0063, "step": 40900 }, { "epoch": 2407.0, "learning_rate": 5.9388944723618096e-06, "loss": 0.0052, "step": 40925 }, { "epoch": 2408.0, "learning_rate": 5.936381909547739e-06, "loss": 0.0083, "step": 40950 }, { "epoch": 2410.0, "learning_rate": 5.933869346733668e-06, "loss": 0.0046, "step": 40975 }, { "epoch": 2411.0, "learning_rate": 5.931356783919598e-06, "loss": 0.0083, "step": 41000 }, { "epoch": 2411.0, "eval_loss": 0.5513765811920166, "eval_runtime": 163.2913, "eval_samples_per_second": 0.612, "eval_steps_per_second": 0.104, "eval_wer": 25.6, "step": 41000 }, { "epoch": 2413.0, "learning_rate": 5.9288442211055285e-06, "loss": 0.0043, "step": 41025 }, { "epoch": 2414.0, "learning_rate": 5.926331658291458e-06, "loss": 0.0052, "step": 41050 }, { "epoch": 2416.0, "learning_rate": 5.923819095477388e-06, "loss": 0.0068, "step": 41075 }, { "epoch": 2417.0, "learning_rate": 5.9213065326633165e-06, "loss": 0.0059, "step": 41100 }, { "epoch": 2419.0, "learning_rate": 5.918793969849247e-06, "loss": 0.0072, "step": 41125 }, { "epoch": 2420.0, "learning_rate": 5.916281407035176e-06, "loss": 0.0079, "step": 41150 }, { "epoch": 2422.0, "learning_rate": 5.913768844221106e-06, "loss": 0.0075, "step": 41175 }, { "epoch": 2423.0, "learning_rate": 5.9112562814070355e-06, "loss": 0.0048, "step": 41200 }, { "epoch": 2424.0, "learning_rate": 5.908743718592965e-06, "loss": 0.0069, "step": 41225 }, { "epoch": 2426.0, "learning_rate": 5.906231155778895e-06, "loss": 0.004, "step": 41250 }, { "epoch": 2427.0, "learning_rate": 5.903718592964824e-06, "loss": 0.0068, "step": 41275 }, { "epoch": 2429.0, "learning_rate": 5.9012060301507545e-06, "loss": 0.0066, "step": 41300 }, { "epoch": 2430.0, "learning_rate": 5.898693467336684e-06, "loss": 0.0055, "step": 41325 }, { "epoch": 2432.0, "learning_rate": 5.896180904522614e-06, "loss": 0.0083, "step": 41350 }, { "epoch": 2433.0, "learning_rate": 5.8936683417085425e-06, "loss": 0.0082, "step": 41375 }, { "epoch": 2435.0, "learning_rate": 5.891155778894473e-06, "loss": 0.0046, "step": 41400 }, { "epoch": 2436.0, "learning_rate": 5.888643216080403e-06, "loss": 0.0085, "step": 41425 }, { "epoch": 2438.0, "learning_rate": 5.886130653266332e-06, "loss": 0.0062, "step": 41450 }, { "epoch": 2439.0, "learning_rate": 5.883618090452262e-06, "loss": 0.0068, "step": 41475 }, { "epoch": 2441.0, "learning_rate": 5.881105527638192e-06, "loss": 0.0089, "step": 41500 }, { "epoch": 2442.0, "learning_rate": 5.878592964824121e-06, "loss": 0.0061, "step": 41525 }, { "epoch": 2444.0, "learning_rate": 5.87608040201005e-06, "loss": 0.0077, "step": 41550 }, { "epoch": 2445.0, "learning_rate": 5.8735678391959804e-06, "loss": 0.0052, "step": 41575 }, { "epoch": 2447.0, "learning_rate": 5.87105527638191e-06, "loss": 0.0043, "step": 41600 }, { "epoch": 2448.0, "learning_rate": 5.86854271356784e-06, "loss": 0.0052, "step": 41625 }, { "epoch": 2449.0, "learning_rate": 5.86603015075377e-06, "loss": 0.0046, "step": 41650 }, { "epoch": 2451.0, "learning_rate": 5.8635175879396986e-06, "loss": 0.0051, "step": 41675 }, { "epoch": 2452.0, "learning_rate": 5.861005025125629e-06, "loss": 0.0037, "step": 41700 }, { "epoch": 2454.0, "learning_rate": 5.858492462311558e-06, "loss": 0.004, "step": 41725 }, { "epoch": 2455.0, "learning_rate": 5.855979899497488e-06, "loss": 0.0041, "step": 41750 }, { "epoch": 2457.0, "learning_rate": 5.8534673366834176e-06, "loss": 0.0054, "step": 41775 }, { "epoch": 2458.0, "learning_rate": 5.850954773869347e-06, "loss": 0.005, "step": 41800 }, { "epoch": 2460.0, "learning_rate": 5.848442211055276e-06, "loss": 0.0031, "step": 41825 }, { "epoch": 2461.0, "learning_rate": 5.845929648241206e-06, "loss": 0.0046, "step": 41850 }, { "epoch": 2463.0, "learning_rate": 5.8434170854271366e-06, "loss": 0.0073, "step": 41875 }, { "epoch": 2464.0, "learning_rate": 5.840904522613066e-06, "loss": 0.0071, "step": 41900 }, { "epoch": 2466.0, "learning_rate": 5.838391959798996e-06, "loss": 0.0074, "step": 41925 }, { "epoch": 2467.0, "learning_rate": 5.8358793969849245e-06, "loss": 0.0047, "step": 41950 }, { "epoch": 2469.0, "learning_rate": 5.833366834170855e-06, "loss": 0.0043, "step": 41975 }, { "epoch": 2470.0, "learning_rate": 5.830854271356784e-06, "loss": 0.0101, "step": 42000 }, { "epoch": 2470.0, "eval_loss": 0.5710281133651733, "eval_runtime": 169.1648, "eval_samples_per_second": 0.591, "eval_steps_per_second": 0.1, "eval_wer": 25.6, "step": 42000 }, { "epoch": 2472.0, "learning_rate": 5.828341708542714e-06, "loss": 0.006, "step": 42025 }, { "epoch": 2473.0, "learning_rate": 5.825829145728644e-06, "loss": 0.0079, "step": 42050 }, { "epoch": 2474.0, "learning_rate": 5.823316582914573e-06, "loss": 0.0067, "step": 42075 }, { "epoch": 2476.0, "learning_rate": 5.820804020100503e-06, "loss": 0.0071, "step": 42100 }, { "epoch": 2477.0, "learning_rate": 5.818291457286432e-06, "loss": 0.0057, "step": 42125 }, { "epoch": 2479.0, "learning_rate": 5.8157788944723625e-06, "loss": 0.0055, "step": 42150 }, { "epoch": 2480.0, "learning_rate": 5.813266331658292e-06, "loss": 0.0044, "step": 42175 }, { "epoch": 2482.0, "learning_rate": 5.810753768844222e-06, "loss": 0.0044, "step": 42200 }, { "epoch": 2483.0, "learning_rate": 5.8082412060301505e-06, "loss": 0.0033, "step": 42225 }, { "epoch": 2485.0, "learning_rate": 5.805728643216081e-06, "loss": 0.006, "step": 42250 }, { "epoch": 2486.0, "learning_rate": 5.803216080402011e-06, "loss": 0.005, "step": 42275 }, { "epoch": 2488.0, "learning_rate": 5.80070351758794e-06, "loss": 0.006, "step": 42300 }, { "epoch": 2489.0, "learning_rate": 5.79819095477387e-06, "loss": 0.0036, "step": 42325 }, { "epoch": 2491.0, "learning_rate": 5.7956783919598e-06, "loss": 0.0052, "step": 42350 }, { "epoch": 2492.0, "learning_rate": 5.793165829145729e-06, "loss": 0.0055, "step": 42375 }, { "epoch": 2494.0, "learning_rate": 5.790653266331658e-06, "loss": 0.005, "step": 42400 }, { "epoch": 2495.0, "learning_rate": 5.7881407035175884e-06, "loss": 0.0059, "step": 42425 }, { "epoch": 2497.0, "learning_rate": 5.785628140703518e-06, "loss": 0.0045, "step": 42450 }, { "epoch": 2498.0, "learning_rate": 5.783115577889448e-06, "loss": 0.0051, "step": 42475 }, { "epoch": 2499.0, "learning_rate": 5.780603015075378e-06, "loss": 0.0051, "step": 42500 }, { "epoch": 2501.0, "learning_rate": 5.778090452261307e-06, "loss": 0.0052, "step": 42525 }, { "epoch": 2502.0, "learning_rate": 5.775577889447237e-06, "loss": 0.008, "step": 42550 }, { "epoch": 2504.0, "learning_rate": 5.773065326633166e-06, "loss": 0.0048, "step": 42575 }, { "epoch": 2505.0, "learning_rate": 5.770552763819096e-06, "loss": 0.0035, "step": 42600 }, { "epoch": 2507.0, "learning_rate": 5.7680402010050256e-06, "loss": 0.0051, "step": 42625 }, { "epoch": 2508.0, "learning_rate": 5.765527638190955e-06, "loss": 0.0036, "step": 42650 }, { "epoch": 2510.0, "learning_rate": 5.763015075376885e-06, "loss": 0.0044, "step": 42675 }, { "epoch": 2511.0, "learning_rate": 5.760502512562814e-06, "loss": 0.0047, "step": 42700 }, { "epoch": 2513.0, "learning_rate": 5.7579899497487446e-06, "loss": 0.0079, "step": 42725 }, { "epoch": 2514.0, "learning_rate": 5.755477386934674e-06, "loss": 0.0043, "step": 42750 }, { "epoch": 2516.0, "learning_rate": 5.752964824120604e-06, "loss": 0.0038, "step": 42775 }, { "epoch": 2517.0, "learning_rate": 5.7504522613065325e-06, "loss": 0.0026, "step": 42800 }, { "epoch": 2519.0, "learning_rate": 5.747939698492463e-06, "loss": 0.0038, "step": 42825 }, { "epoch": 2520.0, "learning_rate": 5.745427135678392e-06, "loss": 0.0022, "step": 42850 }, { "epoch": 2522.0, "learning_rate": 5.742914572864322e-06, "loss": 0.0117, "step": 42875 }, { "epoch": 2523.0, "learning_rate": 5.740402010050252e-06, "loss": 0.0039, "step": 42900 }, { "epoch": 2524.0, "learning_rate": 5.737889447236181e-06, "loss": 0.0039, "step": 42925 }, { "epoch": 2526.0, "learning_rate": 5.735376884422111e-06, "loss": 0.0045, "step": 42950 }, { "epoch": 2527.0, "learning_rate": 5.73286432160804e-06, "loss": 0.0058, "step": 42975 }, { "epoch": 2529.0, "learning_rate": 5.7303517587939705e-06, "loss": 0.0062, "step": 43000 }, { "epoch": 2529.0, "eval_loss": 0.5829825401306152, "eval_runtime": 165.1942, "eval_samples_per_second": 0.605, "eval_steps_per_second": 0.103, "eval_wer": 28.000000000000004, "step": 43000 }, { "epoch": 2530.0, "learning_rate": 5.7278391959799e-06, "loss": 0.0038, "step": 43025 }, { "epoch": 2532.0, "learning_rate": 5.72532663316583e-06, "loss": 0.0054, "step": 43050 }, { "epoch": 2533.0, "learning_rate": 5.7228140703517585e-06, "loss": 0.0086, "step": 43075 }, { "epoch": 2535.0, "learning_rate": 5.720301507537689e-06, "loss": 0.0065, "step": 43100 }, { "epoch": 2536.0, "learning_rate": 5.717788944723619e-06, "loss": 0.0055, "step": 43125 }, { "epoch": 2538.0, "learning_rate": 5.715276381909548e-06, "loss": 0.0056, "step": 43150 }, { "epoch": 2539.0, "learning_rate": 5.712763819095478e-06, "loss": 0.0049, "step": 43175 }, { "epoch": 2541.0, "learning_rate": 5.710251256281407e-06, "loss": 0.0037, "step": 43200 }, { "epoch": 2542.0, "learning_rate": 5.707738693467337e-06, "loss": 0.0066, "step": 43225 }, { "epoch": 2544.0, "learning_rate": 5.705226130653266e-06, "loss": 0.0072, "step": 43250 }, { "epoch": 2545.0, "learning_rate": 5.7027135678391964e-06, "loss": 0.0049, "step": 43275 }, { "epoch": 2547.0, "learning_rate": 5.700201005025127e-06, "loss": 0.0037, "step": 43300 }, { "epoch": 2548.0, "learning_rate": 5.697688442211056e-06, "loss": 0.0039, "step": 43325 }, { "epoch": 2549.0, "learning_rate": 5.695175879396986e-06, "loss": 0.0056, "step": 43350 }, { "epoch": 2551.0, "learning_rate": 5.692663316582915e-06, "loss": 0.0061, "step": 43375 }, { "epoch": 2552.0, "learning_rate": 5.690150753768845e-06, "loss": 0.0048, "step": 43400 }, { "epoch": 2554.0, "learning_rate": 5.687638190954774e-06, "loss": 0.0052, "step": 43425 }, { "epoch": 2555.0, "learning_rate": 5.685125628140704e-06, "loss": 0.0066, "step": 43450 }, { "epoch": 2557.0, "learning_rate": 5.6826130653266336e-06, "loss": 0.0078, "step": 43475 }, { "epoch": 2558.0, "learning_rate": 5.680100502512563e-06, "loss": 0.0075, "step": 43500 }, { "epoch": 2560.0, "learning_rate": 5.677587939698493e-06, "loss": 0.0041, "step": 43525 }, { "epoch": 2561.0, "learning_rate": 5.675075376884422e-06, "loss": 0.0057, "step": 43550 }, { "epoch": 2563.0, "learning_rate": 5.6725628140703526e-06, "loss": 0.007, "step": 43575 }, { "epoch": 2564.0, "learning_rate": 5.670050251256282e-06, "loss": 0.0071, "step": 43600 }, { "epoch": 2566.0, "learning_rate": 5.667537688442212e-06, "loss": 0.0042, "step": 43625 }, { "epoch": 2567.0, "learning_rate": 5.6650251256281405e-06, "loss": 0.0029, "step": 43650 }, { "epoch": 2569.0, "learning_rate": 5.662512562814071e-06, "loss": 0.0075, "step": 43675 }, { "epoch": 2570.0, "learning_rate": 5.66e-06, "loss": 0.0045, "step": 43700 }, { "epoch": 2572.0, "learning_rate": 5.65748743718593e-06, "loss": 0.0042, "step": 43725 }, { "epoch": 2573.0, "learning_rate": 5.65497487437186e-06, "loss": 0.0024, "step": 43750 }, { "epoch": 2574.0, "learning_rate": 5.652462311557789e-06, "loss": 0.0038, "step": 43775 }, { "epoch": 2576.0, "learning_rate": 5.649949748743719e-06, "loss": 0.0055, "step": 43800 }, { "epoch": 2577.0, "learning_rate": 5.647437185929648e-06, "loss": 0.0093, "step": 43825 }, { "epoch": 2579.0, "learning_rate": 5.6449246231155785e-06, "loss": 0.0068, "step": 43850 }, { "epoch": 2580.0, "learning_rate": 5.642412060301508e-06, "loss": 0.0091, "step": 43875 }, { "epoch": 2582.0, "learning_rate": 5.639899497487438e-06, "loss": 0.004, "step": 43900 }, { "epoch": 2583.0, "learning_rate": 5.637386934673368e-06, "loss": 0.0032, "step": 43925 }, { "epoch": 2585.0, "learning_rate": 5.634874371859297e-06, "loss": 0.0037, "step": 43950 }, { "epoch": 2586.0, "learning_rate": 5.632361809045227e-06, "loss": 0.0034, "step": 43975 }, { "epoch": 2588.0, "learning_rate": 5.629849246231156e-06, "loss": 0.0046, "step": 44000 }, { "epoch": 2588.0, "eval_loss": 0.5827962756156921, "eval_runtime": 167.175, "eval_samples_per_second": 0.598, "eval_steps_per_second": 0.102, "eval_wer": 26.857142857142858, "step": 44000 }, { "epoch": 2589.0, "learning_rate": 5.627336683417086e-06, "loss": 0.0036, "step": 44025 }, { "epoch": 2591.0, "learning_rate": 5.624824120603015e-06, "loss": 0.008, "step": 44050 }, { "epoch": 2592.0, "learning_rate": 5.622311557788945e-06, "loss": 0.0037, "step": 44075 }, { "epoch": 2594.0, "learning_rate": 5.619798994974874e-06, "loss": 0.0042, "step": 44100 }, { "epoch": 2595.0, "learning_rate": 5.6172864321608044e-06, "loss": 0.0048, "step": 44125 }, { "epoch": 2597.0, "learning_rate": 5.614773869346735e-06, "loss": 0.0045, "step": 44150 }, { "epoch": 2598.0, "learning_rate": 5.612261306532664e-06, "loss": 0.0054, "step": 44175 }, { "epoch": 2599.0, "learning_rate": 5.609748743718594e-06, "loss": 0.0055, "step": 44200 }, { "epoch": 2601.0, "learning_rate": 5.607236180904523e-06, "loss": 0.0041, "step": 44225 }, { "epoch": 2602.0, "learning_rate": 5.604723618090453e-06, "loss": 0.0062, "step": 44250 }, { "epoch": 2604.0, "learning_rate": 5.602211055276382e-06, "loss": 0.0063, "step": 44275 }, { "epoch": 2605.0, "learning_rate": 5.599698492462312e-06, "loss": 0.0062, "step": 44300 }, { "epoch": 2607.0, "learning_rate": 5.597185929648241e-06, "loss": 0.0047, "step": 44325 }, { "epoch": 2608.0, "learning_rate": 5.594673366834171e-06, "loss": 0.0031, "step": 44350 }, { "epoch": 2610.0, "learning_rate": 5.592160804020101e-06, "loss": 0.0067, "step": 44375 }, { "epoch": 2611.0, "learning_rate": 5.58964824120603e-06, "loss": 0.0043, "step": 44400 }, { "epoch": 2613.0, "learning_rate": 5.5871356783919606e-06, "loss": 0.0055, "step": 44425 }, { "epoch": 2614.0, "learning_rate": 5.58462311557789e-06, "loss": 0.0067, "step": 44450 }, { "epoch": 2616.0, "learning_rate": 5.58211055276382e-06, "loss": 0.0052, "step": 44475 }, { "epoch": 2617.0, "learning_rate": 5.5795979899497485e-06, "loss": 0.0056, "step": 44500 }, { "epoch": 2619.0, "learning_rate": 5.577085427135679e-06, "loss": 0.0057, "step": 44525 }, { "epoch": 2620.0, "learning_rate": 5.574572864321609e-06, "loss": 0.0041, "step": 44550 }, { "epoch": 2622.0, "learning_rate": 5.572060301507538e-06, "loss": 0.0035, "step": 44575 }, { "epoch": 2623.0, "learning_rate": 5.569547738693468e-06, "loss": 0.0055, "step": 44600 }, { "epoch": 2624.0, "learning_rate": 5.567035175879397e-06, "loss": 0.0042, "step": 44625 }, { "epoch": 2626.0, "learning_rate": 5.564522613065327e-06, "loss": 0.0038, "step": 44650 }, { "epoch": 2627.0, "learning_rate": 5.562010050251256e-06, "loss": 0.0044, "step": 44675 }, { "epoch": 2629.0, "learning_rate": 5.5594974874371865e-06, "loss": 0.0038, "step": 44700 }, { "epoch": 2630.0, "learning_rate": 5.556984924623116e-06, "loss": 0.006, "step": 44725 }, { "epoch": 2632.0, "learning_rate": 5.554472361809046e-06, "loss": 0.0031, "step": 44750 }, { "epoch": 2633.0, "learning_rate": 5.551959798994976e-06, "loss": 0.0027, "step": 44775 }, { "epoch": 2635.0, "learning_rate": 5.549447236180905e-06, "loss": 0.0063, "step": 44800 }, { "epoch": 2636.0, "learning_rate": 5.546934673366835e-06, "loss": 0.0037, "step": 44825 }, { "epoch": 2638.0, "learning_rate": 5.544422110552764e-06, "loss": 0.0045, "step": 44850 }, { "epoch": 2639.0, "learning_rate": 5.541909547738694e-06, "loss": 0.0053, "step": 44875 }, { "epoch": 2641.0, "learning_rate": 5.539597989949749e-06, "loss": 0.0046, "step": 44900 }, { "epoch": 2642.0, "learning_rate": 5.537085427135679e-06, "loss": 0.0044, "step": 44925 }, { "epoch": 2644.0, "learning_rate": 5.534572864321609e-06, "loss": 0.0036, "step": 44950 }, { "epoch": 2645.0, "learning_rate": 5.532060301507538e-06, "loss": 0.0068, "step": 44975 }, { "epoch": 2647.0, "learning_rate": 5.529547738693468e-06, "loss": 0.0053, "step": 45000 }, { "epoch": 2647.0, "eval_loss": 0.5621368885040283, "eval_runtime": 166.0604, "eval_samples_per_second": 0.602, "eval_steps_per_second": 0.102, "eval_wer": 27.42857142857143, "step": 45000 }, { "epoch": 2648.0, "learning_rate": 5.527035175879397e-06, "loss": 0.0051, "step": 45025 }, { "epoch": 2649.0, "learning_rate": 5.524522613065327e-06, "loss": 0.0039, "step": 45050 }, { "epoch": 2651.0, "learning_rate": 5.522010050251257e-06, "loss": 0.0047, "step": 45075 }, { "epoch": 2652.0, "learning_rate": 5.519497487437187e-06, "loss": 0.0088, "step": 45100 }, { "epoch": 2654.0, "learning_rate": 5.516984924623115e-06, "loss": 0.007, "step": 45125 }, { "epoch": 2655.0, "learning_rate": 5.5144723618090455e-06, "loss": 0.0017, "step": 45150 }, { "epoch": 2657.0, "learning_rate": 5.511959798994976e-06, "loss": 0.0031, "step": 45175 }, { "epoch": 2658.0, "learning_rate": 5.509447236180905e-06, "loss": 0.0048, "step": 45200 }, { "epoch": 2660.0, "learning_rate": 5.506934673366835e-06, "loss": 0.0037, "step": 45225 }, { "epoch": 2661.0, "learning_rate": 5.504422110552764e-06, "loss": 0.0044, "step": 45250 }, { "epoch": 2663.0, "learning_rate": 5.501909547738694e-06, "loss": 0.0021, "step": 45275 }, { "epoch": 2664.0, "learning_rate": 5.499396984924623e-06, "loss": 0.0052, "step": 45300 }, { "epoch": 2666.0, "learning_rate": 5.496884422110553e-06, "loss": 0.0042, "step": 45325 }, { "epoch": 2667.0, "learning_rate": 5.494371859296483e-06, "loss": 0.0043, "step": 45350 }, { "epoch": 2669.0, "learning_rate": 5.491859296482413e-06, "loss": 0.0031, "step": 45375 }, { "epoch": 2670.0, "learning_rate": 5.489346733668343e-06, "loss": 0.0056, "step": 45400 }, { "epoch": 2672.0, "learning_rate": 5.4868341708542715e-06, "loss": 0.0031, "step": 45425 }, { "epoch": 2673.0, "learning_rate": 5.484321608040202e-06, "loss": 0.0032, "step": 45450 }, { "epoch": 2674.0, "learning_rate": 5.481809045226131e-06, "loss": 0.0029, "step": 45475 }, { "epoch": 2676.0, "learning_rate": 5.479296482412061e-06, "loss": 0.0053, "step": 45500 }, { "epoch": 2677.0, "learning_rate": 5.47678391959799e-06, "loss": 0.0038, "step": 45525 }, { "epoch": 2679.0, "learning_rate": 5.47427135678392e-06, "loss": 0.0043, "step": 45550 }, { "epoch": 2680.0, "learning_rate": 5.47175879396985e-06, "loss": 0.0036, "step": 45575 }, { "epoch": 2682.0, "learning_rate": 5.469246231155779e-06, "loss": 0.0055, "step": 45600 }, { "epoch": 2683.0, "learning_rate": 5.4667336683417095e-06, "loss": 0.0037, "step": 45625 }, { "epoch": 2685.0, "learning_rate": 5.464221105527639e-06, "loss": 0.0063, "step": 45650 }, { "epoch": 2686.0, "learning_rate": 5.461708542713569e-06, "loss": 0.0038, "step": 45675 }, { "epoch": 2688.0, "learning_rate": 5.459195979899497e-06, "loss": 0.0044, "step": 45700 }, { "epoch": 2689.0, "learning_rate": 5.456683417085428e-06, "loss": 0.0037, "step": 45725 }, { "epoch": 2691.0, "learning_rate": 5.454170854271357e-06, "loss": 0.003, "step": 45750 }, { "epoch": 2692.0, "learning_rate": 5.451658291457287e-06, "loss": 0.0054, "step": 45775 }, { "epoch": 2694.0, "learning_rate": 5.449145728643217e-06, "loss": 0.0066, "step": 45800 }, { "epoch": 2695.0, "learning_rate": 5.446633165829146e-06, "loss": 0.0042, "step": 45825 }, { "epoch": 2697.0, "learning_rate": 5.444120603015076e-06, "loss": 0.0027, "step": 45850 }, { "epoch": 2698.0, "learning_rate": 5.441608040201005e-06, "loss": 0.0026, "step": 45875 }, { "epoch": 2699.0, "learning_rate": 5.439095477386935e-06, "loss": 0.003, "step": 45900 }, { "epoch": 2701.0, "learning_rate": 5.436582914572865e-06, "loss": 0.0056, "step": 45925 }, { "epoch": 2702.0, "learning_rate": 5.434070351758795e-06, "loss": 0.0042, "step": 45950 }, { "epoch": 2704.0, "learning_rate": 5.431557788944723e-06, "loss": 0.0046, "step": 45975 }, { "epoch": 2705.0, "learning_rate": 5.4290452261306535e-06, "loss": 0.0047, "step": 46000 }, { "epoch": 2705.0, "eval_loss": 0.5672851800918579, "eval_runtime": 168.5135, "eval_samples_per_second": 0.593, "eval_steps_per_second": 0.101, "eval_wer": 25.942857142857147, "step": 46000 }, { "epoch": 2707.0, "learning_rate": 5.426532663316584e-06, "loss": 0.0039, "step": 46025 }, { "epoch": 2708.0, "learning_rate": 5.424020100502513e-06, "loss": 0.0049, "step": 46050 }, { "epoch": 2710.0, "learning_rate": 5.421507537688443e-06, "loss": 0.0062, "step": 46075 }, { "epoch": 2711.0, "learning_rate": 5.418994974874372e-06, "loss": 0.0058, "step": 46100 }, { "epoch": 2713.0, "learning_rate": 5.416482412060302e-06, "loss": 0.0065, "step": 46125 }, { "epoch": 2714.0, "learning_rate": 5.413969849246231e-06, "loss": 0.0046, "step": 46150 }, { "epoch": 2716.0, "learning_rate": 5.411457286432161e-06, "loss": 0.0036, "step": 46175 }, { "epoch": 2717.0, "learning_rate": 5.4089447236180915e-06, "loss": 0.0052, "step": 46200 }, { "epoch": 2719.0, "learning_rate": 5.406432160804021e-06, "loss": 0.003, "step": 46225 }, { "epoch": 2720.0, "learning_rate": 5.403919597989951e-06, "loss": 0.0058, "step": 46250 }, { "epoch": 2722.0, "learning_rate": 5.4014070351758795e-06, "loss": 0.0052, "step": 46275 }, { "epoch": 2723.0, "learning_rate": 5.39889447236181e-06, "loss": 0.0053, "step": 46300 }, { "epoch": 2724.0, "learning_rate": 5.396381909547739e-06, "loss": 0.0059, "step": 46325 }, { "epoch": 2726.0, "learning_rate": 5.393869346733669e-06, "loss": 0.0039, "step": 46350 }, { "epoch": 2727.0, "learning_rate": 5.391356783919598e-06, "loss": 0.0029, "step": 46375 }, { "epoch": 2729.0, "learning_rate": 5.388844221105528e-06, "loss": 0.0044, "step": 46400 }, { "epoch": 2730.0, "learning_rate": 5.386331658291458e-06, "loss": 0.0099, "step": 46425 }, { "epoch": 2732.0, "learning_rate": 5.383819095477387e-06, "loss": 0.0046, "step": 46450 }, { "epoch": 2733.0, "learning_rate": 5.3813065326633175e-06, "loss": 0.0061, "step": 46475 }, { "epoch": 2735.0, "learning_rate": 5.378793969849247e-06, "loss": 0.0044, "step": 46500 }, { "epoch": 2736.0, "learning_rate": 5.376281407035177e-06, "loss": 0.0034, "step": 46525 }, { "epoch": 2738.0, "learning_rate": 5.373768844221105e-06, "loss": 0.0066, "step": 46550 }, { "epoch": 2739.0, "learning_rate": 5.371256281407036e-06, "loss": 0.0044, "step": 46575 }, { "epoch": 2741.0, "learning_rate": 5.368743718592965e-06, "loss": 0.0054, "step": 46600 }, { "epoch": 2742.0, "learning_rate": 5.366231155778895e-06, "loss": 0.0023, "step": 46625 }, { "epoch": 2744.0, "learning_rate": 5.363718592964825e-06, "loss": 0.0034, "step": 46650 }, { "epoch": 2745.0, "learning_rate": 5.361206030150754e-06, "loss": 0.0037, "step": 46675 }, { "epoch": 2747.0, "learning_rate": 5.358693467336684e-06, "loss": 0.0043, "step": 46700 }, { "epoch": 2748.0, "learning_rate": 5.356180904522613e-06, "loss": 0.0034, "step": 46725 }, { "epoch": 2749.0, "learning_rate": 5.353668341708543e-06, "loss": 0.0041, "step": 46750 }, { "epoch": 2751.0, "learning_rate": 5.351155778894473e-06, "loss": 0.0046, "step": 46775 }, { "epoch": 2752.0, "learning_rate": 5.348643216080403e-06, "loss": 0.0048, "step": 46800 }, { "epoch": 2754.0, "learning_rate": 5.346130653266332e-06, "loss": 0.0068, "step": 46825 }, { "epoch": 2755.0, "learning_rate": 5.3436180904522615e-06, "loss": 0.0044, "step": 46850 }, { "epoch": 2757.0, "learning_rate": 5.341105527638192e-06, "loss": 0.005, "step": 46875 }, { "epoch": 2758.0, "learning_rate": 5.338592964824121e-06, "loss": 0.0022, "step": 46900 }, { "epoch": 2760.0, "learning_rate": 5.336080402010051e-06, "loss": 0.0028, "step": 46925 }, { "epoch": 2761.0, "learning_rate": 5.33356783919598e-06, "loss": 0.0033, "step": 46950 }, { "epoch": 2763.0, "learning_rate": 5.33105527638191e-06, "loss": 0.0035, "step": 46975 }, { "epoch": 2764.0, "learning_rate": 5.328542713567839e-06, "loss": 0.0045, "step": 47000 }, { "epoch": 2764.0, "eval_loss": 0.5220341086387634, "eval_runtime": 167.8653, "eval_samples_per_second": 0.596, "eval_steps_per_second": 0.101, "eval_wer": 25.6, "step": 47000 }, { "epoch": 2766.0, "learning_rate": 5.326030150753769e-06, "loss": 0.011, "step": 47025 }, { "epoch": 2767.0, "learning_rate": 5.3235175879396995e-06, "loss": 0.0055, "step": 47050 }, { "epoch": 2769.0, "learning_rate": 5.321005025125629e-06, "loss": 0.002, "step": 47075 }, { "epoch": 2770.0, "learning_rate": 5.318492462311558e-06, "loss": 0.0043, "step": 47100 }, { "epoch": 2772.0, "learning_rate": 5.3159798994974875e-06, "loss": 0.0037, "step": 47125 }, { "epoch": 2773.0, "learning_rate": 5.313467336683418e-06, "loss": 0.0035, "step": 47150 }, { "epoch": 2774.0, "learning_rate": 5.310954773869347e-06, "loss": 0.0043, "step": 47175 }, { "epoch": 2776.0, "learning_rate": 5.308442211055277e-06, "loss": 0.0045, "step": 47200 }, { "epoch": 2777.0, "learning_rate": 5.305929648241206e-06, "loss": 0.0036, "step": 47225 }, { "epoch": 2779.0, "learning_rate": 5.303417085427136e-06, "loss": 0.0035, "step": 47250 }, { "epoch": 2780.0, "learning_rate": 5.300904522613066e-06, "loss": 0.0032, "step": 47275 }, { "epoch": 2782.0, "learning_rate": 5.298391959798995e-06, "loss": 0.0033, "step": 47300 }, { "epoch": 2783.0, "learning_rate": 5.2958793969849255e-06, "loss": 0.0036, "step": 47325 }, { "epoch": 2785.0, "learning_rate": 5.293366834170855e-06, "loss": 0.0054, "step": 47350 }, { "epoch": 2786.0, "learning_rate": 5.290854271356785e-06, "loss": 0.005, "step": 47375 }, { "epoch": 2788.0, "learning_rate": 5.2883417085427134e-06, "loss": 0.0055, "step": 47400 }, { "epoch": 2789.0, "learning_rate": 5.285829145728644e-06, "loss": 0.0041, "step": 47425 }, { "epoch": 2791.0, "learning_rate": 5.283316582914574e-06, "loss": 0.0028, "step": 47450 }, { "epoch": 2792.0, "learning_rate": 5.280804020100503e-06, "loss": 0.0039, "step": 47475 }, { "epoch": 2794.0, "learning_rate": 5.278291457286433e-06, "loss": 0.006, "step": 47500 }, { "epoch": 2795.0, "learning_rate": 5.275778894472362e-06, "loss": 0.0043, "step": 47525 }, { "epoch": 2797.0, "learning_rate": 5.273266331658292e-06, "loss": 0.0053, "step": 47550 }, { "epoch": 2798.0, "learning_rate": 5.270753768844221e-06, "loss": 0.0067, "step": 47575 }, { "epoch": 2799.0, "learning_rate": 5.268241206030151e-06, "loss": 0.0031, "step": 47600 }, { "epoch": 2801.0, "learning_rate": 5.265728643216081e-06, "loss": 0.004, "step": 47625 }, { "epoch": 2802.0, "learning_rate": 5.263216080402011e-06, "loss": 0.0045, "step": 47650 }, { "epoch": 2804.0, "learning_rate": 5.26070351758794e-06, "loss": 0.0054, "step": 47675 }, { "epoch": 2805.0, "learning_rate": 5.2581909547738695e-06, "loss": 0.0054, "step": 47700 }, { "epoch": 2807.0, "learning_rate": 5.2556783919598e-06, "loss": 0.0041, "step": 47725 }, { "epoch": 2808.0, "learning_rate": 5.253165829145729e-06, "loss": 0.0069, "step": 47750 }, { "epoch": 2810.0, "learning_rate": 5.250653266331659e-06, "loss": 0.0034, "step": 47775 }, { "epoch": 2811.0, "learning_rate": 5.248140703517588e-06, "loss": 0.0044, "step": 47800 }, { "epoch": 2813.0, "learning_rate": 5.245628140703518e-06, "loss": 0.0068, "step": 47825 }, { "epoch": 2814.0, "learning_rate": 5.243115577889447e-06, "loss": 0.0028, "step": 47850 }, { "epoch": 2816.0, "learning_rate": 5.240603015075377e-06, "loss": 0.0056, "step": 47875 }, { "epoch": 2817.0, "learning_rate": 5.2380904522613075e-06, "loss": 0.0043, "step": 47900 }, { "epoch": 2819.0, "learning_rate": 5.235577889447237e-06, "loss": 0.0037, "step": 47925 }, { "epoch": 2820.0, "learning_rate": 5.233065326633166e-06, "loss": 0.0037, "step": 47950 }, { "epoch": 2822.0, "learning_rate": 5.2305527638190955e-06, "loss": 0.0053, "step": 47975 }, { "epoch": 2823.0, "learning_rate": 5.228040201005026e-06, "loss": 0.0065, "step": 48000 }, { "epoch": 2823.0, "eval_loss": 0.5704354643821716, "eval_runtime": 169.7154, "eval_samples_per_second": 0.589, "eval_steps_per_second": 0.1, "eval_wer": 27.77142857142857, "step": 48000 }, { "epoch": 2824.0, "learning_rate": 5.225527638190955e-06, "loss": 0.007, "step": 48025 }, { "epoch": 2826.0, "learning_rate": 5.223015075376885e-06, "loss": 0.0055, "step": 48050 }, { "epoch": 2827.0, "learning_rate": 5.220502512562815e-06, "loss": 0.0026, "step": 48075 }, { "epoch": 2829.0, "learning_rate": 5.217989949748744e-06, "loss": 0.0059, "step": 48100 }, { "epoch": 2830.0, "learning_rate": 5.215477386934674e-06, "loss": 0.0043, "step": 48125 }, { "epoch": 2832.0, "learning_rate": 5.212964824120603e-06, "loss": 0.0056, "step": 48150 }, { "epoch": 2833.0, "learning_rate": 5.2104522613065335e-06, "loss": 0.0032, "step": 48175 }, { "epoch": 2835.0, "learning_rate": 5.207939698492463e-06, "loss": 0.0048, "step": 48200 }, { "epoch": 2836.0, "learning_rate": 5.205427135678393e-06, "loss": 0.0037, "step": 48225 }, { "epoch": 2838.0, "learning_rate": 5.2029145728643214e-06, "loss": 0.0062, "step": 48250 }, { "epoch": 2839.0, "learning_rate": 5.200402010050252e-06, "loss": 0.0032, "step": 48275 }, { "epoch": 2841.0, "learning_rate": 5.197889447236182e-06, "loss": 0.0017, "step": 48300 }, { "epoch": 2842.0, "learning_rate": 5.195376884422111e-06, "loss": 0.004, "step": 48325 }, { "epoch": 2844.0, "learning_rate": 5.192864321608041e-06, "loss": 0.0028, "step": 48350 }, { "epoch": 2845.0, "learning_rate": 5.19035175879397e-06, "loss": 0.0029, "step": 48375 }, { "epoch": 2847.0, "learning_rate": 5.1878391959799e-06, "loss": 0.0031, "step": 48400 }, { "epoch": 2848.0, "learning_rate": 5.185326633165829e-06, "loss": 0.004, "step": 48425 }, { "epoch": 2849.0, "learning_rate": 5.182814070351759e-06, "loss": 0.0025, "step": 48450 }, { "epoch": 2851.0, "learning_rate": 5.180301507537689e-06, "loss": 0.0025, "step": 48475 }, { "epoch": 2852.0, "learning_rate": 5.177788944723619e-06, "loss": 0.0032, "step": 48500 }, { "epoch": 2854.0, "learning_rate": 5.175276381909548e-06, "loss": 0.0042, "step": 48525 }, { "epoch": 2855.0, "learning_rate": 5.1727638190954775e-06, "loss": 0.0038, "step": 48550 }, { "epoch": 2857.0, "learning_rate": 5.170251256281408e-06, "loss": 0.007, "step": 48575 }, { "epoch": 2858.0, "learning_rate": 5.167738693467337e-06, "loss": 0.0038, "step": 48600 }, { "epoch": 2860.0, "learning_rate": 5.165226130653267e-06, "loss": 0.0022, "step": 48625 }, { "epoch": 2861.0, "learning_rate": 5.162713567839196e-06, "loss": 0.0023, "step": 48650 }, { "epoch": 2863.0, "learning_rate": 5.160201005025126e-06, "loss": 0.003, "step": 48675 }, { "epoch": 2864.0, "learning_rate": 5.157688442211056e-06, "loss": 0.0062, "step": 48700 }, { "epoch": 2866.0, "learning_rate": 5.155175879396985e-06, "loss": 0.0044, "step": 48725 }, { "epoch": 2867.0, "learning_rate": 5.1526633165829155e-06, "loss": 0.003, "step": 48750 }, { "epoch": 2869.0, "learning_rate": 5.150150753768845e-06, "loss": 0.0057, "step": 48775 }, { "epoch": 2870.0, "learning_rate": 5.147638190954774e-06, "loss": 0.0039, "step": 48800 }, { "epoch": 2872.0, "learning_rate": 5.1451256281407035e-06, "loss": 0.0032, "step": 48825 }, { "epoch": 2873.0, "learning_rate": 5.142613065326634e-06, "loss": 0.0043, "step": 48850 }, { "epoch": 2874.0, "learning_rate": 5.140100502512563e-06, "loss": 0.003, "step": 48875 }, { "epoch": 2876.0, "learning_rate": 5.137587939698493e-06, "loss": 0.0027, "step": 48900 }, { "epoch": 2877.0, "learning_rate": 5.135075376884423e-06, "loss": 0.004, "step": 48925 }, { "epoch": 2879.0, "learning_rate": 5.132663316582916e-06, "loss": 0.0054, "step": 48950 }, { "epoch": 2880.0, "learning_rate": 5.130150753768844e-06, "loss": 0.0071, "step": 48975 }, { "epoch": 2882.0, "learning_rate": 5.127638190954774e-06, "loss": 0.0039, "step": 49000 }, { "epoch": 2882.0, "eval_loss": 0.5740671753883362, "eval_runtime": 165.9532, "eval_samples_per_second": 0.603, "eval_steps_per_second": 0.102, "eval_wer": 27.77142857142857, "step": 49000 }, { "epoch": 2883.0, "learning_rate": 5.125125628140704e-06, "loss": 0.0057, "step": 49025 }, { "epoch": 2885.0, "learning_rate": 5.122613065326634e-06, "loss": 0.0028, "step": 49050 }, { "epoch": 2886.0, "learning_rate": 5.120100502512562e-06, "loss": 0.0035, "step": 49075 }, { "epoch": 2888.0, "learning_rate": 5.1175879396984925e-06, "loss": 0.0062, "step": 49100 }, { "epoch": 2889.0, "learning_rate": 5.115075376884423e-06, "loss": 0.003, "step": 49125 }, { "epoch": 2891.0, "learning_rate": 5.112562814070352e-06, "loss": 0.0028, "step": 49150 }, { "epoch": 2892.0, "learning_rate": 5.110050251256282e-06, "loss": 0.0053, "step": 49175 }, { "epoch": 2894.0, "learning_rate": 5.1075376884422115e-06, "loss": 0.0037, "step": 49200 }, { "epoch": 2895.0, "learning_rate": 5.105025125628142e-06, "loss": 0.0039, "step": 49225 }, { "epoch": 2897.0, "learning_rate": 5.10251256281407e-06, "loss": 0.0019, "step": 49250 }, { "epoch": 2898.0, "learning_rate": 5.1e-06, "loss": 0.0049, "step": 49275 }, { "epoch": 2899.0, "learning_rate": 5.09748743718593e-06, "loss": 0.0045, "step": 49300 }, { "epoch": 2901.0, "learning_rate": 5.09497487437186e-06, "loss": 0.0045, "step": 49325 }, { "epoch": 2902.0, "learning_rate": 5.09246231155779e-06, "loss": 0.0034, "step": 49350 }, { "epoch": 2904.0, "learning_rate": 5.0899497487437184e-06, "loss": 0.0067, "step": 49375 }, { "epoch": 2905.0, "learning_rate": 5.087437185929649e-06, "loss": 0.0028, "step": 49400 }, { "epoch": 2907.0, "learning_rate": 5.084924623115578e-06, "loss": 0.0028, "step": 49425 }, { "epoch": 2908.0, "learning_rate": 5.082412060301508e-06, "loss": 0.0041, "step": 49450 }, { "epoch": 2910.0, "learning_rate": 5.0798994974874374e-06, "loss": 0.0044, "step": 49475 }, { "epoch": 2911.0, "learning_rate": 5.077386934673368e-06, "loss": 0.0031, "step": 49500 }, { "epoch": 2913.0, "learning_rate": 5.074874371859298e-06, "loss": 0.0055, "step": 49525 }, { "epoch": 2914.0, "learning_rate": 5.072361809045226e-06, "loss": 0.0026, "step": 49550 }, { "epoch": 2916.0, "learning_rate": 5.069949748743719e-06, "loss": 0.0015, "step": 49575 }, { "epoch": 2917.0, "learning_rate": 5.067437185929649e-06, "loss": 0.0016, "step": 49600 }, { "epoch": 2919.0, "learning_rate": 5.064924623115578e-06, "loss": 0.0041, "step": 49625 }, { "epoch": 2920.0, "learning_rate": 5.062412060301508e-06, "loss": 0.0037, "step": 49650 }, { "epoch": 2922.0, "learning_rate": 5.059899497487437e-06, "loss": 0.0041, "step": 49675 }, { "epoch": 2923.0, "learning_rate": 5.057386934673367e-06, "loss": 0.0027, "step": 49700 }, { "epoch": 2924.0, "learning_rate": 5.054874371859297e-06, "loss": 0.0021, "step": 49725 }, { "epoch": 2926.0, "learning_rate": 5.0523618090452264e-06, "loss": 0.0026, "step": 49750 }, { "epoch": 2927.0, "learning_rate": 5.049849246231157e-06, "loss": 0.0035, "step": 49775 }, { "epoch": 2929.0, "learning_rate": 5.047336683417086e-06, "loss": 0.0025, "step": 49800 }, { "epoch": 2930.0, "learning_rate": 5.044824120603016e-06, "loss": 0.0018, "step": 49825 }, { "epoch": 2932.0, "learning_rate": 5.0423115577889446e-06, "loss": 0.0023, "step": 49850 }, { "epoch": 2933.0, "learning_rate": 5.039798994974875e-06, "loss": 0.0048, "step": 49875 }, { "epoch": 2935.0, "learning_rate": 5.037286432160804e-06, "loss": 0.003, "step": 49900 }, { "epoch": 2936.0, "learning_rate": 5.034773869346734e-06, "loss": 0.0032, "step": 49925 }, { "epoch": 2938.0, "learning_rate": 5.032261306532664e-06, "loss": 0.0037, "step": 49950 }, { "epoch": 2939.0, "learning_rate": 5.029748743718593e-06, "loss": 0.0026, "step": 49975 }, { "epoch": 2941.0, "learning_rate": 5.027236180904523e-06, "loss": 0.0027, "step": 50000 }, { "epoch": 2941.0, "eval_loss": 0.5762184262275696, "eval_runtime": 167.8168, "eval_samples_per_second": 0.596, "eval_steps_per_second": 0.101, "eval_wer": 26.057142857142857, "step": 50000 }, { "epoch": 2942.0, "learning_rate": 5.024723618090452e-06, "loss": 0.0035, "step": 50025 }, { "epoch": 2944.0, "learning_rate": 5.0222110552763825e-06, "loss": 0.0035, "step": 50050 }, { "epoch": 2945.0, "learning_rate": 5.019698492462312e-06, "loss": 0.0026, "step": 50075 }, { "epoch": 2947.0, "learning_rate": 5.017185929648242e-06, "loss": 0.0042, "step": 50100 }, { "epoch": 2948.0, "learning_rate": 5.0146733668341705e-06, "loss": 0.0037, "step": 50125 }, { "epoch": 2949.0, "learning_rate": 5.012160804020101e-06, "loss": 0.0019, "step": 50150 }, { "epoch": 2951.0, "learning_rate": 5.009648241206031e-06, "loss": 0.0023, "step": 50175 }, { "epoch": 2952.0, "learning_rate": 5.00713567839196e-06, "loss": 0.0037, "step": 50200 }, { "epoch": 2954.0, "learning_rate": 5.00462311557789e-06, "loss": 0.0025, "step": 50225 }, { "epoch": 2955.0, "learning_rate": 5.002110552763819e-06, "loss": 0.0029, "step": 50250 }, { "epoch": 2957.0, "learning_rate": 4.999597989949749e-06, "loss": 0.0047, "step": 50275 }, { "epoch": 2958.0, "learning_rate": 4.997085427135679e-06, "loss": 0.0042, "step": 50300 }, { "epoch": 2960.0, "learning_rate": 4.9945728643216085e-06, "loss": 0.003, "step": 50325 }, { "epoch": 2961.0, "learning_rate": 4.992060301507538e-06, "loss": 0.0028, "step": 50350 }, { "epoch": 2963.0, "learning_rate": 4.989547738693468e-06, "loss": 0.0026, "step": 50375 }, { "epoch": 2964.0, "learning_rate": 4.987035175879397e-06, "loss": 0.0043, "step": 50400 }, { "epoch": 2966.0, "learning_rate": 4.984522613065327e-06, "loss": 0.0027, "step": 50425 }, { "epoch": 2967.0, "learning_rate": 4.982010050251257e-06, "loss": 0.0041, "step": 50450 }, { "epoch": 2969.0, "learning_rate": 4.979497487437186e-06, "loss": 0.0058, "step": 50475 }, { "epoch": 2970.0, "learning_rate": 4.976984924623116e-06, "loss": 0.0052, "step": 50500 }, { "epoch": 2972.0, "learning_rate": 4.974472361809046e-06, "loss": 0.01, "step": 50525 }, { "epoch": 2973.0, "learning_rate": 4.971959798994975e-06, "loss": 0.0059, "step": 50550 }, { "epoch": 2974.0, "learning_rate": 4.969447236180905e-06, "loss": 0.0047, "step": 50575 }, { "epoch": 2976.0, "learning_rate": 4.9669346733668344e-06, "loss": 0.0052, "step": 50600 }, { "epoch": 2977.0, "learning_rate": 4.964422110552764e-06, "loss": 0.0037, "step": 50625 }, { "epoch": 2979.0, "learning_rate": 4.961909547738694e-06, "loss": 0.0053, "step": 50650 }, { "epoch": 2980.0, "learning_rate": 4.959396984924624e-06, "loss": 0.0037, "step": 50675 }, { "epoch": 2982.0, "learning_rate": 4.9568844221105534e-06, "loss": 0.0028, "step": 50700 }, { "epoch": 2983.0, "learning_rate": 4.954371859296483e-06, "loss": 0.0036, "step": 50725 }, { "epoch": 2985.0, "learning_rate": 4.951859296482412e-06, "loss": 0.0042, "step": 50750 }, { "epoch": 2986.0, "learning_rate": 4.949346733668342e-06, "loss": 0.0018, "step": 50775 }, { "epoch": 2988.0, "learning_rate": 4.9468341708542716e-06, "loss": 0.0029, "step": 50800 }, { "epoch": 2989.0, "learning_rate": 4.944321608040201e-06, "loss": 0.0065, "step": 50825 }, { "epoch": 2991.0, "learning_rate": 4.941809045226131e-06, "loss": 0.0021, "step": 50850 }, { "epoch": 2992.0, "learning_rate": 4.939296482412061e-06, "loss": 0.002, "step": 50875 }, { "epoch": 2994.0, "learning_rate": 4.9367839195979906e-06, "loss": 0.0027, "step": 50900 }, { "epoch": 2995.0, "learning_rate": 4.93427135678392e-06, "loss": 0.0039, "step": 50925 }, { "epoch": 2997.0, "learning_rate": 4.93175879396985e-06, "loss": 0.0047, "step": 50950 }, { "epoch": 2998.0, "learning_rate": 4.929246231155779e-06, "loss": 0.003, "step": 50975 }, { "epoch": 2999.0, "learning_rate": 4.926733668341709e-06, "loss": 0.0019, "step": 51000 }, { "epoch": 2999.0, "eval_loss": 0.5558891892433167, "eval_runtime": 165.5315, "eval_samples_per_second": 0.604, "eval_steps_per_second": 0.103, "eval_wer": 24.914285714285715, "step": 51000 }, { "epoch": 3001.0, "learning_rate": 4.924221105527638e-06, "loss": 0.008, "step": 51025 }, { "epoch": 3002.0, "learning_rate": 4.921708542713568e-06, "loss": 0.0036, "step": 51050 }, { "epoch": 3004.0, "learning_rate": 4.919195979899498e-06, "loss": 0.0041, "step": 51075 }, { "epoch": 3005.0, "learning_rate": 4.916683417085428e-06, "loss": 0.0044, "step": 51100 }, { "epoch": 3007.0, "learning_rate": 4.914170854271357e-06, "loss": 0.0021, "step": 51125 }, { "epoch": 3008.0, "learning_rate": 4.911658291457287e-06, "loss": 0.0024, "step": 51150 }, { "epoch": 3010.0, "learning_rate": 4.9091457286432165e-06, "loss": 0.002, "step": 51175 }, { "epoch": 3011.0, "learning_rate": 4.906633165829146e-06, "loss": 0.0051, "step": 51200 }, { "epoch": 3013.0, "learning_rate": 4.904120603015076e-06, "loss": 0.002, "step": 51225 }, { "epoch": 3014.0, "learning_rate": 4.901608040201005e-06, "loss": 0.0038, "step": 51250 }, { "epoch": 3016.0, "learning_rate": 4.899095477386935e-06, "loss": 0.0035, "step": 51275 }, { "epoch": 3017.0, "learning_rate": 4.896582914572865e-06, "loss": 0.0025, "step": 51300 }, { "epoch": 3019.0, "learning_rate": 4.894070351758794e-06, "loss": 0.0031, "step": 51325 }, { "epoch": 3020.0, "learning_rate": 4.891557788944724e-06, "loss": 0.0034, "step": 51350 }, { "epoch": 3022.0, "learning_rate": 4.889045226130654e-06, "loss": 0.002, "step": 51375 }, { "epoch": 3023.0, "learning_rate": 4.886532663316583e-06, "loss": 0.0022, "step": 51400 }, { "epoch": 3024.0, "learning_rate": 4.884020100502513e-06, "loss": 0.0018, "step": 51425 }, { "epoch": 3026.0, "learning_rate": 4.8815075376884424e-06, "loss": 0.0022, "step": 51450 }, { "epoch": 3027.0, "learning_rate": 4.878994974874372e-06, "loss": 0.0017, "step": 51475 }, { "epoch": 3029.0, "learning_rate": 4.876482412060302e-06, "loss": 0.0025, "step": 51500 }, { "epoch": 3030.0, "learning_rate": 4.873969849246232e-06, "loss": 0.0023, "step": 51525 }, { "epoch": 3032.0, "learning_rate": 4.8714572864321614e-06, "loss": 0.0013, "step": 51550 }, { "epoch": 3033.0, "learning_rate": 4.868944723618091e-06, "loss": 0.0049, "step": 51575 }, { "epoch": 3035.0, "learning_rate": 4.86643216080402e-06, "loss": 0.0025, "step": 51600 }, { "epoch": 3036.0, "learning_rate": 4.86391959798995e-06, "loss": 0.0029, "step": 51625 }, { "epoch": 3038.0, "learning_rate": 4.8614070351758796e-06, "loss": 0.0049, "step": 51650 }, { "epoch": 3039.0, "learning_rate": 4.858894472361809e-06, "loss": 0.0052, "step": 51675 }, { "epoch": 3041.0, "learning_rate": 4.856381909547739e-06, "loss": 0.0027, "step": 51700 }, { "epoch": 3042.0, "learning_rate": 4.853869346733669e-06, "loss": 0.0035, "step": 51725 }, { "epoch": 3044.0, "learning_rate": 4.8513567839195986e-06, "loss": 0.0045, "step": 51750 }, { "epoch": 3045.0, "learning_rate": 4.848844221105528e-06, "loss": 0.0047, "step": 51775 }, { "epoch": 3047.0, "learning_rate": 4.846331658291458e-06, "loss": 0.0028, "step": 51800 }, { "epoch": 3048.0, "learning_rate": 4.843819095477387e-06, "loss": 0.0029, "step": 51825 }, { "epoch": 3049.0, "learning_rate": 4.841306532663317e-06, "loss": 0.0034, "step": 51850 }, { "epoch": 3051.0, "learning_rate": 4.838793969849246e-06, "loss": 0.0046, "step": 51875 }, { "epoch": 3052.0, "learning_rate": 4.836281407035176e-06, "loss": 0.0029, "step": 51900 }, { "epoch": 3054.0, "learning_rate": 4.833768844221106e-06, "loss": 0.0033, "step": 51925 }, { "epoch": 3055.0, "learning_rate": 4.831256281407036e-06, "loss": 0.0039, "step": 51950 }, { "epoch": 3057.0, "learning_rate": 4.828743718592965e-06, "loss": 0.0046, "step": 51975 }, { "epoch": 3058.0, "learning_rate": 4.826231155778895e-06, "loss": 0.0015, "step": 52000 }, { "epoch": 3058.0, "eval_loss": 0.5777251124382019, "eval_runtime": 169.1367, "eval_samples_per_second": 0.591, "eval_steps_per_second": 0.101, "eval_wer": 28.57142857142857, "step": 52000 }, { "epoch": 3060.0, "learning_rate": 4.8237185929648245e-06, "loss": 0.0016, "step": 52025 }, { "epoch": 3061.0, "learning_rate": 4.821206030150754e-06, "loss": 0.0048, "step": 52050 }, { "epoch": 3063.0, "learning_rate": 4.818693467336684e-06, "loss": 0.0025, "step": 52075 }, { "epoch": 3064.0, "learning_rate": 4.816180904522613e-06, "loss": 0.0015, "step": 52100 }, { "epoch": 3066.0, "learning_rate": 4.8136683417085435e-06, "loss": 0.001, "step": 52125 }, { "epoch": 3067.0, "learning_rate": 4.811155778894473e-06, "loss": 0.0024, "step": 52150 }, { "epoch": 3069.0, "learning_rate": 4.808643216080402e-06, "loss": 0.0018, "step": 52175 }, { "epoch": 3070.0, "learning_rate": 4.806130653266332e-06, "loss": 0.003, "step": 52200 }, { "epoch": 3072.0, "learning_rate": 4.803618090452262e-06, "loss": 0.0037, "step": 52225 }, { "epoch": 3073.0, "learning_rate": 4.801105527638191e-06, "loss": 0.0019, "step": 52250 }, { "epoch": 3074.0, "learning_rate": 4.798592964824121e-06, "loss": 0.0034, "step": 52275 }, { "epoch": 3076.0, "learning_rate": 4.7960804020100504e-06, "loss": 0.0016, "step": 52300 }, { "epoch": 3077.0, "learning_rate": 4.793567839195981e-06, "loss": 0.0011, "step": 52325 }, { "epoch": 3079.0, "learning_rate": 4.79105527638191e-06, "loss": 0.004, "step": 52350 }, { "epoch": 3080.0, "learning_rate": 4.78854271356784e-06, "loss": 0.0029, "step": 52375 }, { "epoch": 3082.0, "learning_rate": 4.7860301507537694e-06, "loss": 0.0032, "step": 52400 }, { "epoch": 3083.0, "learning_rate": 4.783517587939699e-06, "loss": 0.0016, "step": 52425 }, { "epoch": 3085.0, "learning_rate": 4.781005025125628e-06, "loss": 0.0032, "step": 52450 }, { "epoch": 3086.0, "learning_rate": 4.778492462311558e-06, "loss": 0.0025, "step": 52475 }, { "epoch": 3088.0, "learning_rate": 4.7759798994974876e-06, "loss": 0.0019, "step": 52500 }, { "epoch": 3089.0, "learning_rate": 4.773467336683417e-06, "loss": 0.0032, "step": 52525 }, { "epoch": 3091.0, "learning_rate": 4.770954773869347e-06, "loss": 0.0025, "step": 52550 }, { "epoch": 3092.0, "learning_rate": 4.768442211055277e-06, "loss": 0.0029, "step": 52575 }, { "epoch": 3094.0, "learning_rate": 4.7659296482412066e-06, "loss": 0.0036, "step": 52600 }, { "epoch": 3095.0, "learning_rate": 4.763417085427136e-06, "loss": 0.003, "step": 52625 }, { "epoch": 3097.0, "learning_rate": 4.761005025125628e-06, "loss": 0.003, "step": 52650 }, { "epoch": 3098.0, "learning_rate": 4.7584924623115584e-06, "loss": 0.0021, "step": 52675 }, { "epoch": 3099.0, "learning_rate": 4.755979899497488e-06, "loss": 0.0057, "step": 52700 }, { "epoch": 3101.0, "learning_rate": 4.753467336683417e-06, "loss": 0.0056, "step": 52725 }, { "epoch": 3102.0, "learning_rate": 4.750954773869347e-06, "loss": 0.0047, "step": 52750 }, { "epoch": 3104.0, "learning_rate": 4.748442211055277e-06, "loss": 0.0026, "step": 52775 }, { "epoch": 3105.0, "learning_rate": 4.745929648241207e-06, "loss": 0.0024, "step": 52800 }, { "epoch": 3107.0, "learning_rate": 4.743417085427136e-06, "loss": 0.0026, "step": 52825 }, { "epoch": 3108.0, "learning_rate": 4.740904522613065e-06, "loss": 0.0036, "step": 52850 }, { "epoch": 3110.0, "learning_rate": 4.7383919597989956e-06, "loss": 0.0021, "step": 52875 }, { "epoch": 3111.0, "learning_rate": 4.735879396984925e-06, "loss": 0.0029, "step": 52900 }, { "epoch": 3113.0, "learning_rate": 4.733366834170854e-06, "loss": 0.003, "step": 52925 }, { "epoch": 3114.0, "learning_rate": 4.730854271356784e-06, "loss": 0.004, "step": 52950 }, { "epoch": 3116.0, "learning_rate": 4.728341708542714e-06, "loss": 0.0026, "step": 52975 }, { "epoch": 3117.0, "learning_rate": 4.725829145728644e-06, "loss": 0.0026, "step": 53000 }, { "epoch": 3117.0, "eval_loss": 0.5588864684104919, "eval_runtime": 163.4411, "eval_samples_per_second": 0.612, "eval_steps_per_second": 0.104, "eval_wer": 25.257142857142856, "step": 53000 }, { "epoch": 3119.0, "learning_rate": 4.723316582914573e-06, "loss": 0.0018, "step": 53025 }, { "epoch": 3120.0, "learning_rate": 4.7208040201005025e-06, "loss": 0.0022, "step": 53050 }, { "epoch": 3122.0, "learning_rate": 4.718291457286433e-06, "loss": 0.0015, "step": 53075 }, { "epoch": 3123.0, "learning_rate": 4.715778894472362e-06, "loss": 0.0033, "step": 53100 }, { "epoch": 3124.0, "learning_rate": 4.713266331658291e-06, "loss": 0.0034, "step": 53125 }, { "epoch": 3126.0, "learning_rate": 4.7107537688442215e-06, "loss": 0.0052, "step": 53150 }, { "epoch": 3127.0, "learning_rate": 4.708241206030152e-06, "loss": 0.0038, "step": 53175 }, { "epoch": 3129.0, "learning_rate": 4.705728643216081e-06, "loss": 0.0031, "step": 53200 }, { "epoch": 3130.0, "learning_rate": 4.70321608040201e-06, "loss": 0.0026, "step": 53225 }, { "epoch": 3132.0, "learning_rate": 4.7007035175879405e-06, "loss": 0.0037, "step": 53250 }, { "epoch": 3133.0, "learning_rate": 4.69819095477387e-06, "loss": 0.0033, "step": 53275 }, { "epoch": 3135.0, "learning_rate": 4.695678391959799e-06, "loss": 0.0025, "step": 53300 }, { "epoch": 3136.0, "learning_rate": 4.6931658291457285e-06, "loss": 0.0042, "step": 53325 }, { "epoch": 3138.0, "learning_rate": 4.690653266331659e-06, "loss": 0.0054, "step": 53350 }, { "epoch": 3139.0, "learning_rate": 4.688241206030151e-06, "loss": 0.0041, "step": 53375 }, { "epoch": 3141.0, "learning_rate": 4.685728643216081e-06, "loss": 0.0016, "step": 53400 }, { "epoch": 3142.0, "learning_rate": 4.6832160804020105e-06, "loss": 0.0045, "step": 53425 }, { "epoch": 3144.0, "learning_rate": 4.68070351758794e-06, "loss": 0.0022, "step": 53450 }, { "epoch": 3145.0, "learning_rate": 4.67819095477387e-06, "loss": 0.002, "step": 53475 }, { "epoch": 3147.0, "learning_rate": 4.675678391959799e-06, "loss": 0.0024, "step": 53500 }, { "epoch": 3148.0, "learning_rate": 4.673165829145729e-06, "loss": 0.0035, "step": 53525 }, { "epoch": 3149.0, "learning_rate": 4.670653266331659e-06, "loss": 0.0065, "step": 53550 }, { "epoch": 3151.0, "learning_rate": 4.668140703517588e-06, "loss": 0.0037, "step": 53575 }, { "epoch": 3152.0, "learning_rate": 4.665628140703518e-06, "loss": 0.0016, "step": 53600 }, { "epoch": 3154.0, "learning_rate": 4.663115577889448e-06, "loss": 0.0022, "step": 53625 }, { "epoch": 3155.0, "learning_rate": 4.660603015075377e-06, "loss": 0.0023, "step": 53650 }, { "epoch": 3157.0, "learning_rate": 4.658090452261307e-06, "loss": 0.0027, "step": 53675 }, { "epoch": 3158.0, "learning_rate": 4.6555778894472365e-06, "loss": 0.0023, "step": 53700 }, { "epoch": 3160.0, "learning_rate": 4.653065326633166e-06, "loss": 0.0021, "step": 53725 }, { "epoch": 3161.0, "learning_rate": 4.650552763819096e-06, "loss": 0.002, "step": 53750 }, { "epoch": 3163.0, "learning_rate": 4.648040201005026e-06, "loss": 0.0019, "step": 53775 }, { "epoch": 3164.0, "learning_rate": 4.6455276381909554e-06, "loss": 0.0034, "step": 53800 }, { "epoch": 3166.0, "learning_rate": 4.643015075376885e-06, "loss": 0.002, "step": 53825 }, { "epoch": 3167.0, "learning_rate": 4.640502512562814e-06, "loss": 0.0017, "step": 53850 }, { "epoch": 3169.0, "learning_rate": 4.637989949748744e-06, "loss": 0.0028, "step": 53875 }, { "epoch": 3170.0, "learning_rate": 4.635477386934674e-06, "loss": 0.0023, "step": 53900 }, { "epoch": 3172.0, "learning_rate": 4.632964824120603e-06, "loss": 0.003, "step": 53925 }, { "epoch": 3173.0, "learning_rate": 4.630452261306533e-06, "loss": 0.0017, "step": 53950 }, { "epoch": 3174.0, "learning_rate": 4.627939698492463e-06, "loss": 0.005, "step": 53975 }, { "epoch": 3176.0, "learning_rate": 4.6254271356783926e-06, "loss": 0.0032, "step": 54000 }, { "epoch": 3176.0, "eval_loss": 0.6060987114906311, "eval_runtime": 163.6905, "eval_samples_per_second": 0.611, "eval_steps_per_second": 0.104, "eval_wer": 26.971428571428575, "step": 54000 }, { "epoch": 3177.0, "learning_rate": 4.622914572864322e-06, "loss": 0.0034, "step": 54025 }, { "epoch": 3179.0, "learning_rate": 4.620402010050252e-06, "loss": 0.0027, "step": 54050 }, { "epoch": 3180.0, "learning_rate": 4.617889447236181e-06, "loss": 0.0028, "step": 54075 }, { "epoch": 3182.0, "learning_rate": 4.615376884422111e-06, "loss": 0.0051, "step": 54100 }, { "epoch": 3183.0, "learning_rate": 4.61286432160804e-06, "loss": 0.0036, "step": 54125 }, { "epoch": 3185.0, "learning_rate": 4.61035175879397e-06, "loss": 0.0036, "step": 54150 }, { "epoch": 3186.0, "learning_rate": 4.6078391959799e-06, "loss": 0.0019, "step": 54175 }, { "epoch": 3188.0, "learning_rate": 4.60532663316583e-06, "loss": 0.0028, "step": 54200 }, { "epoch": 3189.0, "learning_rate": 4.602814070351759e-06, "loss": 0.0018, "step": 54225 }, { "epoch": 3191.0, "learning_rate": 4.600301507537689e-06, "loss": 0.002, "step": 54250 }, { "epoch": 3192.0, "learning_rate": 4.5977889447236185e-06, "loss": 0.0017, "step": 54275 }, { "epoch": 3194.0, "learning_rate": 4.595276381909548e-06, "loss": 0.0021, "step": 54300 }, { "epoch": 3195.0, "learning_rate": 4.592763819095478e-06, "loss": 0.0069, "step": 54325 }, { "epoch": 3197.0, "learning_rate": 4.590251256281407e-06, "loss": 0.0036, "step": 54350 }, { "epoch": 3198.0, "learning_rate": 4.587738693467337e-06, "loss": 0.005, "step": 54375 }, { "epoch": 3199.0, "learning_rate": 4.585226130653267e-06, "loss": 0.0034, "step": 54400 }, { "epoch": 3201.0, "learning_rate": 4.582713567839196e-06, "loss": 0.0036, "step": 54425 }, { "epoch": 3202.0, "learning_rate": 4.580201005025126e-06, "loss": 0.0014, "step": 54450 }, { "epoch": 3204.0, "learning_rate": 4.577688442211056e-06, "loss": 0.0046, "step": 54475 }, { "epoch": 3205.0, "learning_rate": 4.575175879396985e-06, "loss": 0.0022, "step": 54500 }, { "epoch": 3207.0, "learning_rate": 4.572663316582915e-06, "loss": 0.0024, "step": 54525 }, { "epoch": 3208.0, "learning_rate": 4.5701507537688445e-06, "loss": 0.0016, "step": 54550 }, { "epoch": 3210.0, "learning_rate": 4.567638190954774e-06, "loss": 0.0019, "step": 54575 }, { "epoch": 3211.0, "learning_rate": 4.565125628140704e-06, "loss": 0.002, "step": 54600 }, { "epoch": 3213.0, "learning_rate": 4.562613065326634e-06, "loss": 0.0035, "step": 54625 }, { "epoch": 3214.0, "learning_rate": 4.5601005025125635e-06, "loss": 0.0029, "step": 54650 }, { "epoch": 3216.0, "learning_rate": 4.557587939698493e-06, "loss": 0.0029, "step": 54675 }, { "epoch": 3217.0, "learning_rate": 4.555075376884422e-06, "loss": 0.002, "step": 54700 }, { "epoch": 3219.0, "learning_rate": 4.552562814070352e-06, "loss": 0.0034, "step": 54725 }, { "epoch": 3220.0, "learning_rate": 4.550050251256282e-06, "loss": 0.003, "step": 54750 }, { "epoch": 3222.0, "learning_rate": 4.547537688442211e-06, "loss": 0.003, "step": 54775 }, { "epoch": 3223.0, "learning_rate": 4.545025125628141e-06, "loss": 0.0023, "step": 54800 }, { "epoch": 3224.0, "learning_rate": 4.542512562814071e-06, "loss": 0.0043, "step": 54825 }, { "epoch": 3226.0, "learning_rate": 4.540000000000001e-06, "loss": 0.0036, "step": 54850 }, { "epoch": 3227.0, "learning_rate": 4.53748743718593e-06, "loss": 0.0038, "step": 54875 }, { "epoch": 3229.0, "learning_rate": 4.53497487437186e-06, "loss": 0.0028, "step": 54900 }, { "epoch": 3230.0, "learning_rate": 4.532462311557789e-06, "loss": 0.0025, "step": 54925 }, { "epoch": 3232.0, "learning_rate": 4.529949748743719e-06, "loss": 0.0026, "step": 54950 }, { "epoch": 3233.0, "learning_rate": 4.527437185929648e-06, "loss": 0.001, "step": 54975 }, { "epoch": 3235.0, "learning_rate": 4.524924623115578e-06, "loss": 0.0025, "step": 55000 }, { "epoch": 3235.0, "eval_loss": 0.5776389241218567, "eval_runtime": 164.1599, "eval_samples_per_second": 0.609, "eval_steps_per_second": 0.104, "eval_wer": 25.142857142857146, "step": 55000 }, { "epoch": 3236.0, "learning_rate": 4.522412060301508e-06, "loss": 0.0041, "step": 55025 }, { "epoch": 3238.0, "learning_rate": 4.519899497487438e-06, "loss": 0.0021, "step": 55050 }, { "epoch": 3239.0, "learning_rate": 4.517386934673367e-06, "loss": 0.0034, "step": 55075 }, { "epoch": 3241.0, "learning_rate": 4.514874371859297e-06, "loss": 0.0025, "step": 55100 }, { "epoch": 3242.0, "learning_rate": 4.5123618090452265e-06, "loss": 0.0024, "step": 55125 }, { "epoch": 3244.0, "learning_rate": 4.509849246231156e-06, "loss": 0.0032, "step": 55150 }, { "epoch": 3245.0, "learning_rate": 4.507336683417086e-06, "loss": 0.0025, "step": 55175 }, { "epoch": 3247.0, "learning_rate": 4.504824120603015e-06, "loss": 0.0042, "step": 55200 }, { "epoch": 3248.0, "learning_rate": 4.5023115577889455e-06, "loss": 0.001, "step": 55225 }, { "epoch": 3249.0, "learning_rate": 4.499798994974875e-06, "loss": 0.0027, "step": 55250 }, { "epoch": 3251.0, "learning_rate": 4.497286432160804e-06, "loss": 0.0022, "step": 55275 }, { "epoch": 3252.0, "learning_rate": 4.494773869346734e-06, "loss": 0.0039, "step": 55300 }, { "epoch": 3254.0, "learning_rate": 4.492261306532664e-06, "loss": 0.0024, "step": 55325 }, { "epoch": 3255.0, "learning_rate": 4.489748743718593e-06, "loss": 0.0018, "step": 55350 }, { "epoch": 3257.0, "learning_rate": 4.487236180904523e-06, "loss": 0.0022, "step": 55375 }, { "epoch": 3258.0, "learning_rate": 4.4847236180904525e-06, "loss": 0.0039, "step": 55400 }, { "epoch": 3260.0, "learning_rate": 4.482211055276382e-06, "loss": 0.0022, "step": 55425 }, { "epoch": 3261.0, "learning_rate": 4.479698492462312e-06, "loss": 0.004, "step": 55450 }, { "epoch": 3263.0, "learning_rate": 4.477185929648242e-06, "loss": 0.0027, "step": 55475 }, { "epoch": 3264.0, "learning_rate": 4.4746733668341715e-06, "loss": 0.0019, "step": 55500 }, { "epoch": 3266.0, "learning_rate": 4.472160804020101e-06, "loss": 0.0017, "step": 55525 }, { "epoch": 3267.0, "learning_rate": 4.46964824120603e-06, "loss": 0.0023, "step": 55550 }, { "epoch": 3269.0, "learning_rate": 4.46713567839196e-06, "loss": 0.0043, "step": 55575 }, { "epoch": 3270.0, "learning_rate": 4.46462311557789e-06, "loss": 0.0024, "step": 55600 }, { "epoch": 3272.0, "learning_rate": 4.462110552763819e-06, "loss": 0.0043, "step": 55625 }, { "epoch": 3273.0, "learning_rate": 4.459597989949749e-06, "loss": 0.0054, "step": 55650 }, { "epoch": 3274.0, "learning_rate": 4.457085427135679e-06, "loss": 0.0016, "step": 55675 }, { "epoch": 3276.0, "learning_rate": 4.454572864321609e-06, "loss": 0.001, "step": 55700 }, { "epoch": 3277.0, "learning_rate": 4.452060301507538e-06, "loss": 0.0027, "step": 55725 }, { "epoch": 3279.0, "learning_rate": 4.449547738693468e-06, "loss": 0.0008, "step": 55750 }, { "epoch": 3280.0, "learning_rate": 4.447035175879397e-06, "loss": 0.0018, "step": 55775 }, { "epoch": 3282.0, "learning_rate": 4.444522613065327e-06, "loss": 0.0024, "step": 55800 }, { "epoch": 3283.0, "learning_rate": 4.442010050251256e-06, "loss": 0.0014, "step": 55825 }, { "epoch": 3285.0, "learning_rate": 4.439497487437186e-06, "loss": 0.0035, "step": 55850 }, { "epoch": 3286.0, "learning_rate": 4.436984924623116e-06, "loss": 0.0043, "step": 55875 }, { "epoch": 3288.0, "learning_rate": 4.434472361809046e-06, "loss": 0.0036, "step": 55900 }, { "epoch": 3289.0, "learning_rate": 4.431959798994975e-06, "loss": 0.0015, "step": 55925 }, { "epoch": 3291.0, "learning_rate": 4.429447236180905e-06, "loss": 0.0047, "step": 55950 }, { "epoch": 3292.0, "learning_rate": 4.4269346733668345e-06, "loss": 0.0036, "step": 55975 }, { "epoch": 3294.0, "learning_rate": 4.424422110552764e-06, "loss": 0.0046, "step": 56000 }, { "epoch": 3294.0, "eval_loss": 0.5753312110900879, "eval_runtime": 164.6461, "eval_samples_per_second": 0.607, "eval_steps_per_second": 0.103, "eval_wer": 27.314285714285713, "step": 56000 }, { "epoch": 3295.0, "learning_rate": 4.421909547738694e-06, "loss": 0.0013, "step": 56025 }, { "epoch": 3297.0, "learning_rate": 4.419396984924623e-06, "loss": 0.0017, "step": 56050 }, { "epoch": 3298.0, "learning_rate": 4.4168844221105535e-06, "loss": 0.0025, "step": 56075 }, { "epoch": 3299.0, "learning_rate": 4.414371859296483e-06, "loss": 0.0037, "step": 56100 }, { "epoch": 3301.0, "learning_rate": 4.411859296482412e-06, "loss": 0.0011, "step": 56125 }, { "epoch": 3302.0, "learning_rate": 4.409346733668342e-06, "loss": 0.0011, "step": 56150 }, { "epoch": 3304.0, "learning_rate": 4.406834170854272e-06, "loss": 0.0022, "step": 56175 }, { "epoch": 3305.0, "learning_rate": 4.404321608040201e-06, "loss": 0.0039, "step": 56200 }, { "epoch": 3307.0, "learning_rate": 4.401809045226131e-06, "loss": 0.0013, "step": 56225 }, { "epoch": 3308.0, "learning_rate": 4.3992964824120605e-06, "loss": 0.002, "step": 56250 }, { "epoch": 3310.0, "learning_rate": 4.396783919597991e-06, "loss": 0.001, "step": 56275 }, { "epoch": 3311.0, "learning_rate": 4.39427135678392e-06, "loss": 0.0032, "step": 56300 }, { "epoch": 3313.0, "learning_rate": 4.39175879396985e-06, "loss": 0.0027, "step": 56325 }, { "epoch": 3314.0, "learning_rate": 4.3892462311557795e-06, "loss": 0.0037, "step": 56350 }, { "epoch": 3316.0, "learning_rate": 4.386733668341709e-06, "loss": 0.0024, "step": 56375 }, { "epoch": 3317.0, "learning_rate": 4.384221105527638e-06, "loss": 0.0031, "step": 56400 }, { "epoch": 3319.0, "learning_rate": 4.381708542713568e-06, "loss": 0.0021, "step": 56425 }, { "epoch": 3320.0, "learning_rate": 4.379195979899498e-06, "loss": 0.0016, "step": 56450 }, { "epoch": 3322.0, "learning_rate": 4.376683417085428e-06, "loss": 0.0017, "step": 56475 }, { "epoch": 3323.0, "learning_rate": 4.374170854271357e-06, "loss": 0.0022, "step": 56500 }, { "epoch": 3324.0, "learning_rate": 4.371658291457287e-06, "loss": 0.0018, "step": 56525 }, { "epoch": 3326.0, "learning_rate": 4.369145728643217e-06, "loss": 0.0029, "step": 56550 }, { "epoch": 3327.0, "learning_rate": 4.366633165829146e-06, "loss": 0.0026, "step": 56575 }, { "epoch": 3329.0, "learning_rate": 4.364120603015076e-06, "loss": 0.0016, "step": 56600 }, { "epoch": 3330.0, "learning_rate": 4.361608040201005e-06, "loss": 0.0022, "step": 56625 }, { "epoch": 3332.0, "learning_rate": 4.359095477386935e-06, "loss": 0.0021, "step": 56650 }, { "epoch": 3333.0, "learning_rate": 4.356582914572864e-06, "loss": 0.0017, "step": 56675 }, { "epoch": 3335.0, "learning_rate": 4.354070351758794e-06, "loss": 0.0045, "step": 56700 }, { "epoch": 3336.0, "learning_rate": 4.351557788944724e-06, "loss": 0.0038, "step": 56725 }, { "epoch": 3338.0, "learning_rate": 4.349045226130654e-06, "loss": 0.0051, "step": 56750 }, { "epoch": 3339.0, "learning_rate": 4.346532663316583e-06, "loss": 0.0032, "step": 56775 }, { "epoch": 3341.0, "learning_rate": 4.344020100502513e-06, "loss": 0.0086, "step": 56800 }, { "epoch": 3342.0, "learning_rate": 4.3415075376884425e-06, "loss": 0.0028, "step": 56825 }, { "epoch": 3344.0, "learning_rate": 4.338994974874372e-06, "loss": 0.003, "step": 56850 }, { "epoch": 3345.0, "learning_rate": 4.336482412060302e-06, "loss": 0.004, "step": 56875 }, { "epoch": 3347.0, "learning_rate": 4.333969849246231e-06, "loss": 0.0039, "step": 56900 }, { "epoch": 3348.0, "learning_rate": 4.3314572864321615e-06, "loss": 0.003, "step": 56925 }, { "epoch": 3349.0, "learning_rate": 4.328944723618091e-06, "loss": 0.0035, "step": 56950 }, { "epoch": 3351.0, "learning_rate": 4.32643216080402e-06, "loss": 0.0052, "step": 56975 }, { "epoch": 3352.0, "learning_rate": 4.32391959798995e-06, "loss": 0.0015, "step": 57000 }, { "epoch": 3352.0, "eval_loss": 0.5735647678375244, "eval_runtime": 164.9088, "eval_samples_per_second": 0.606, "eval_steps_per_second": 0.103, "eval_wer": 27.200000000000003, "step": 57000 }, { "epoch": 3354.0, "learning_rate": 4.32140703517588e-06, "loss": 0.002, "step": 57025 }, { "epoch": 3355.0, "learning_rate": 4.318894472361809e-06, "loss": 0.0042, "step": 57050 }, { "epoch": 3357.0, "learning_rate": 4.316381909547739e-06, "loss": 0.0012, "step": 57075 }, { "epoch": 3358.0, "learning_rate": 4.3138693467336685e-06, "loss": 0.0009, "step": 57100 }, { "epoch": 3360.0, "learning_rate": 4.311356783919599e-06, "loss": 0.0013, "step": 57125 }, { "epoch": 3361.0, "learning_rate": 4.308844221105528e-06, "loss": 0.0019, "step": 57150 }, { "epoch": 3363.0, "learning_rate": 4.306331658291458e-06, "loss": 0.0023, "step": 57175 }, { "epoch": 3364.0, "learning_rate": 4.3038190954773875e-06, "loss": 0.0023, "step": 57200 }, { "epoch": 3366.0, "learning_rate": 4.301306532663317e-06, "loss": 0.003, "step": 57225 }, { "epoch": 3367.0, "learning_rate": 4.298793969849246e-06, "loss": 0.0017, "step": 57250 }, { "epoch": 3369.0, "learning_rate": 4.296281407035176e-06, "loss": 0.0016, "step": 57275 }, { "epoch": 3370.0, "learning_rate": 4.293768844221106e-06, "loss": 0.0044, "step": 57300 }, { "epoch": 3372.0, "learning_rate": 4.291256281407036e-06, "loss": 0.0017, "step": 57325 }, { "epoch": 3373.0, "learning_rate": 4.288743718592965e-06, "loss": 0.0024, "step": 57350 }, { "epoch": 3374.0, "learning_rate": 4.286231155778895e-06, "loss": 0.0017, "step": 57375 }, { "epoch": 3376.0, "learning_rate": 4.283718592964825e-06, "loss": 0.0022, "step": 57400 }, { "epoch": 3377.0, "learning_rate": 4.281206030150754e-06, "loss": 0.0016, "step": 57425 }, { "epoch": 3379.0, "learning_rate": 4.278693467336684e-06, "loss": 0.002, "step": 57450 }, { "epoch": 3380.0, "learning_rate": 4.276180904522613e-06, "loss": 0.002, "step": 57475 }, { "epoch": 3382.0, "learning_rate": 4.273668341708543e-06, "loss": 0.0012, "step": 57500 }, { "epoch": 3383.0, "learning_rate": 4.271155778894473e-06, "loss": 0.0006, "step": 57525 }, { "epoch": 3385.0, "learning_rate": 4.268643216080402e-06, "loss": 0.0009, "step": 57550 }, { "epoch": 3386.0, "learning_rate": 4.266130653266332e-06, "loss": 0.0026, "step": 57575 }, { "epoch": 3388.0, "learning_rate": 4.263618090452262e-06, "loss": 0.0015, "step": 57600 }, { "epoch": 3389.0, "learning_rate": 4.261105527638191e-06, "loss": 0.0026, "step": 57625 }, { "epoch": 3391.0, "learning_rate": 4.258592964824121e-06, "loss": 0.001, "step": 57650 }, { "epoch": 3392.0, "learning_rate": 4.2560804020100505e-06, "loss": 0.0033, "step": 57675 }, { "epoch": 3394.0, "learning_rate": 4.25356783919598e-06, "loss": 0.0014, "step": 57700 }, { "epoch": 3395.0, "learning_rate": 4.25105527638191e-06, "loss": 0.0015, "step": 57725 }, { "epoch": 3397.0, "learning_rate": 4.248542713567839e-06, "loss": 0.0011, "step": 57750 }, { "epoch": 3398.0, "learning_rate": 4.2460301507537695e-06, "loss": 0.0016, "step": 57775 }, { "epoch": 3399.0, "learning_rate": 4.243517587939699e-06, "loss": 0.0032, "step": 57800 }, { "epoch": 3401.0, "learning_rate": 4.241005025125628e-06, "loss": 0.0009, "step": 57825 }, { "epoch": 3402.0, "learning_rate": 4.238492462311558e-06, "loss": 0.0014, "step": 57850 }, { "epoch": 3404.0, "learning_rate": 4.235979899497488e-06, "loss": 0.0019, "step": 57875 }, { "epoch": 3405.0, "learning_rate": 4.233467336683417e-06, "loss": 0.0025, "step": 57900 }, { "epoch": 3407.0, "learning_rate": 4.230954773869347e-06, "loss": 0.0017, "step": 57925 }, { "epoch": 3408.0, "learning_rate": 4.228442211055277e-06, "loss": 0.0018, "step": 57950 }, { "epoch": 3410.0, "learning_rate": 4.225929648241207e-06, "loss": 0.0037, "step": 57975 }, { "epoch": 3411.0, "learning_rate": 4.223417085427136e-06, "loss": 0.003, "step": 58000 }, { "epoch": 3411.0, "eval_loss": 0.5933066010475159, "eval_runtime": 165.5425, "eval_samples_per_second": 0.604, "eval_steps_per_second": 0.103, "eval_wer": 25.6, "step": 58000 }, { "epoch": 3413.0, "learning_rate": 4.220904522613065e-06, "loss": 0.0027, "step": 58025 }, { "epoch": 3414.0, "learning_rate": 4.2183919597989955e-06, "loss": 0.0031, "step": 58050 }, { "epoch": 3416.0, "learning_rate": 4.215879396984925e-06, "loss": 0.0033, "step": 58075 }, { "epoch": 3417.0, "learning_rate": 4.213366834170854e-06, "loss": 0.002, "step": 58100 }, { "epoch": 3419.0, "learning_rate": 4.210854271356784e-06, "loss": 0.0014, "step": 58125 }, { "epoch": 3420.0, "learning_rate": 4.2083417085427144e-06, "loss": 0.0017, "step": 58150 }, { "epoch": 3422.0, "learning_rate": 4.205829145728644e-06, "loss": 0.0012, "step": 58175 }, { "epoch": 3423.0, "learning_rate": 4.203316582914573e-06, "loss": 0.0016, "step": 58200 }, { "epoch": 3424.0, "learning_rate": 4.200804020100503e-06, "loss": 0.0034, "step": 58225 }, { "epoch": 3426.0, "learning_rate": 4.198291457286433e-06, "loss": 0.0035, "step": 58250 }, { "epoch": 3427.0, "learning_rate": 4.195778894472362e-06, "loss": 0.0043, "step": 58275 }, { "epoch": 3429.0, "learning_rate": 4.193266331658292e-06, "loss": 0.0033, "step": 58300 }, { "epoch": 3430.0, "learning_rate": 4.190753768844221e-06, "loss": 0.0035, "step": 58325 }, { "epoch": 3432.0, "learning_rate": 4.188241206030151e-06, "loss": 0.002, "step": 58350 }, { "epoch": 3433.0, "learning_rate": 4.185728643216081e-06, "loss": 0.0016, "step": 58375 }, { "epoch": 3435.0, "learning_rate": 4.18321608040201e-06, "loss": 0.0007, "step": 58400 }, { "epoch": 3436.0, "learning_rate": 4.18070351758794e-06, "loss": 0.0016, "step": 58425 }, { "epoch": 3438.0, "learning_rate": 4.17819095477387e-06, "loss": 0.0013, "step": 58450 }, { "epoch": 3439.0, "learning_rate": 4.175678391959799e-06, "loss": 0.0061, "step": 58475 }, { "epoch": 3441.0, "learning_rate": 4.173165829145729e-06, "loss": 0.0019, "step": 58500 }, { "epoch": 3442.0, "learning_rate": 4.1706532663316585e-06, "loss": 0.0008, "step": 58525 }, { "epoch": 3444.0, "learning_rate": 4.168140703517588e-06, "loss": 0.0019, "step": 58550 }, { "epoch": 3445.0, "learning_rate": 4.165628140703518e-06, "loss": 0.0023, "step": 58575 }, { "epoch": 3447.0, "learning_rate": 4.163115577889447e-06, "loss": 0.0012, "step": 58600 }, { "epoch": 3448.0, "learning_rate": 4.1606030150753775e-06, "loss": 0.0031, "step": 58625 }, { "epoch": 3449.0, "learning_rate": 4.158090452261307e-06, "loss": 0.0038, "step": 58650 }, { "epoch": 3451.0, "learning_rate": 4.155577889447236e-06, "loss": 0.0013, "step": 58675 }, { "epoch": 3452.0, "learning_rate": 4.153065326633166e-06, "loss": 0.0017, "step": 58700 }, { "epoch": 3454.0, "learning_rate": 4.150552763819096e-06, "loss": 0.002, "step": 58725 }, { "epoch": 3455.0, "learning_rate": 4.148040201005025e-06, "loss": 0.0016, "step": 58750 }, { "epoch": 3457.0, "learning_rate": 4.145527638190955e-06, "loss": 0.0018, "step": 58775 }, { "epoch": 3458.0, "learning_rate": 4.143015075376885e-06, "loss": 0.0013, "step": 58800 }, { "epoch": 3460.0, "learning_rate": 4.140502512562815e-06, "loss": 0.0028, "step": 58825 }, { "epoch": 3461.0, "learning_rate": 4.137989949748744e-06, "loss": 0.0008, "step": 58850 }, { "epoch": 3463.0, "learning_rate": 4.135477386934673e-06, "loss": 0.0012, "step": 58875 }, { "epoch": 3464.0, "learning_rate": 4.1329648241206035e-06, "loss": 0.0013, "step": 58900 }, { "epoch": 3466.0, "learning_rate": 4.130452261306533e-06, "loss": 0.0033, "step": 58925 }, { "epoch": 3467.0, "learning_rate": 4.127939698492462e-06, "loss": 0.0024, "step": 58950 }, { "epoch": 3469.0, "learning_rate": 4.125427135678392e-06, "loss": 0.0017, "step": 58975 }, { "epoch": 3470.0, "learning_rate": 4.1229145728643225e-06, "loss": 0.002, "step": 59000 }, { "epoch": 3470.0, "eval_loss": 0.6035776734352112, "eval_runtime": 163.7788, "eval_samples_per_second": 0.611, "eval_steps_per_second": 0.104, "eval_wer": 25.6, "step": 59000 }, { "epoch": 1.0, "learning_rate": 1.6773109243697482e-07, "loss": 0.0021, "step": 59025 }, { "epoch": 2.0, "learning_rate": 1.635294117647059e-07, "loss": 0.0036, "step": 59050 }, { "epoch": 4.0, "learning_rate": 1.5932773109243698e-07, "loss": 0.0017, "step": 59075 }, { "epoch": 5.0, "learning_rate": 1.5512605042016808e-07, "loss": 0.0006, "step": 59100 }, { "epoch": 7.0, "learning_rate": 1.5092436974789917e-07, "loss": 0.0019, "step": 59125 }, { "epoch": 8.0, "learning_rate": 1.4672268907563027e-07, "loss": 0.0021, "step": 59150 }, { "epoch": 10.0, "learning_rate": 1.4252100840336136e-07, "loss": 0.002, "step": 59175 }, { "epoch": 11.0, "learning_rate": 1.3831932773109243e-07, "loss": 0.0019, "step": 59200 }, { "epoch": 13.0, "learning_rate": 1.3411764705882353e-07, "loss": 0.0005, "step": 59225 }, { "epoch": 14.0, "learning_rate": 1.2991596638655465e-07, "loss": 0.0022, "step": 59250 }, { "epoch": 16.0, "learning_rate": 1.2571428571428572e-07, "loss": 0.0007, "step": 59275 }, { "epoch": 17.0, "learning_rate": 1.215126050420168e-07, "loss": 0.0017, "step": 59300 }, { "epoch": 19.0, "learning_rate": 1.1731092436974791e-07, "loss": 0.002, "step": 59325 }, { "epoch": 20.0, "learning_rate": 1.13109243697479e-07, "loss": 0.0011, "step": 59350 }, { "epoch": 22.0, "learning_rate": 1.0890756302521008e-07, "loss": 0.0017, "step": 59375 }, { "epoch": 23.0, "learning_rate": 1.0470588235294118e-07, "loss": 0.0014, "step": 59400 }, { "epoch": 24.0, "learning_rate": 1.0050420168067229e-07, "loss": 0.0006, "step": 59425 }, { "epoch": 26.0, "learning_rate": 9.630252100840337e-08, "loss": 0.0009, "step": 59450 }, { "epoch": 27.0, "learning_rate": 9.210084033613446e-08, "loss": 0.0007, "step": 59475 }, { "epoch": 29.0, "learning_rate": 8.789915966386556e-08, "loss": 0.0007, "step": 59500 }, { "epoch": 30.0, "learning_rate": 8.369747899159664e-08, "loss": 0.0011, "step": 59525 }, { "epoch": 32.0, "learning_rate": 7.949579831932774e-08, "loss": 0.0006, "step": 59550 }, { "epoch": 33.0, "learning_rate": 7.529411764705883e-08, "loss": 0.0009, "step": 59575 }, { "epoch": 35.0, "learning_rate": 7.109243697478993e-08, "loss": 0.0021, "step": 59600 }, { "epoch": 36.0, "learning_rate": 6.689075630252101e-08, "loss": 0.002, "step": 59625 }, { "epoch": 38.0, "learning_rate": 6.26890756302521e-08, "loss": 0.0055, "step": 59650 }, { "epoch": 39.0, "learning_rate": 5.84873949579832e-08, "loss": 0.0012, "step": 59675 }, { "epoch": 41.0, "learning_rate": 5.428571428571429e-08, "loss": 0.0006, "step": 59700 }, { "epoch": 42.0, "learning_rate": 5.0084033613445375e-08, "loss": 0.0016, "step": 59725 }, { "epoch": 44.0, "learning_rate": 4.588235294117648e-08, "loss": 0.0015, "step": 59750 }, { "epoch": 45.0, "learning_rate": 4.1680672268907565e-08, "loss": 0.0009, "step": 59775 }, { "epoch": 47.0, "learning_rate": 3.747899159663866e-08, "loss": 0.0009, "step": 59800 }, { "epoch": 48.0, "learning_rate": 3.327731092436975e-08, "loss": 0.0014, "step": 59825 }, { "epoch": 49.0, "learning_rate": 2.9075630252100844e-08, "loss": 0.0036, "step": 59850 }, { "epoch": 51.0, "learning_rate": 2.4873949579831933e-08, "loss": 0.0028, "step": 59875 }, { "epoch": 52.0, "learning_rate": 2.0672268907563028e-08, "loss": 0.0004, "step": 59900 }, { "epoch": 54.0, "learning_rate": 1.647058823529412e-08, "loss": 0.0013, "step": 59925 }, { "epoch": 55.0, "learning_rate": 1.2268907563025211e-08, "loss": 0.0008, "step": 59950 }, { "epoch": 57.0, "learning_rate": 8.067226890756303e-09, "loss": 0.0014, "step": 59975 }, { "epoch": 58.0, "learning_rate": 3.8655462184873955e-09, "loss": 0.0007, "step": 60000 }, { "epoch": 58.0, "eval_loss": 0.5974761843681335, "eval_runtime": 167.98, "eval_samples_per_second": 0.595, "eval_steps_per_second": 0.101, "eval_wer": 25.257142857142856, "step": 60000 }, { "epoch": 1.0, "step": 60001, "total_flos": 1.498746476474384e+21, "train_loss": 3.482638488374606e-09, "train_runtime": 45.4914, "train_samples_per_second": 15827.168, "train_steps_per_second": 1318.931 } ], "max_steps": 60000, "num_train_epochs": 9223372036854775807, "total_flos": 1.498746476474384e+21, "trial_name": null, "trial_params": null }