diff --git "a/trainer_state.json" "b/trainer_state.json" new file mode 100644--- /dev/null +++ "b/trainer_state.json" @@ -0,0 +1,19933 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 15.0, + "global_step": 3270, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 0.0, + "loss": 16.8021, + "step": 1 + }, + { + "epoch": 0.01, + "learning_rate": 0.0, + "loss": 14.8655, + "step": 2 + }, + { + "epoch": 0.01, + "learning_rate": 0.0, + "loss": 16.0233, + "step": 3 + }, + { + "epoch": 0.02, + "learning_rate": 6e-07, + "loss": 16.0853, + "step": 4 + }, + { + "epoch": 0.02, + "learning_rate": 1.2e-06, + "loss": 14.4195, + "step": 5 + }, + { + "epoch": 0.03, + "learning_rate": 1.8e-06, + "loss": 15.0956, + "step": 6 + }, + { + "epoch": 0.03, + "learning_rate": 2.4e-06, + "loss": 15.4529, + "step": 7 + }, + { + "epoch": 0.04, + "learning_rate": 2.9999999999999997e-06, + "loss": 14.6598, + "step": 8 + }, + { + "epoch": 0.04, + "learning_rate": 3.6e-06, + "loss": 13.3131, + "step": 9 + }, + { + "epoch": 0.05, + "learning_rate": 4.2e-06, + "loss": 13.0855, + "step": 10 + }, + { + "epoch": 0.05, + "learning_rate": 4.8e-06, + "loss": 13.453, + "step": 11 + }, + { + "epoch": 0.06, + "learning_rate": 5.399999999999999e-06, + "loss": 14.372, + "step": 12 + }, + { + "epoch": 0.06, + "learning_rate": 5.999999999999999e-06, + "loss": 16.54, + "step": 13 + }, + { + "epoch": 0.06, + "learning_rate": 6.599999999999999e-06, + "loss": 16.0381, + "step": 14 + }, + { + "epoch": 0.07, + "learning_rate": 7.2e-06, + "loss": 15.8946, + "step": 15 + }, + { + "epoch": 0.07, + "learning_rate": 7.799999999999998e-06, + "loss": 16.1676, + "step": 16 + }, + { + "epoch": 0.08, + "learning_rate": 8.4e-06, + "loss": 14.5807, + "step": 17 + }, + { + "epoch": 0.08, + "learning_rate": 8.999999999999999e-06, + "loss": 14.0519, + "step": 18 + }, + { + "epoch": 0.09, + "learning_rate": 9.6e-06, + "loss": 13.5016, + "step": 19 + }, + { + "epoch": 0.09, + "learning_rate": 1.02e-05, + "loss": 15.7898, + "step": 20 + }, + { + "epoch": 0.1, + "learning_rate": 1.0799999999999998e-05, + "loss": 12.5886, + "step": 21 + }, + { + "epoch": 0.1, + "learning_rate": 1.14e-05, + "loss": 15.3797, + "step": 22 + }, + { + "epoch": 0.11, + "learning_rate": 1.1999999999999999e-05, + "loss": 14.4543, + "step": 23 + }, + { + "epoch": 0.11, + "learning_rate": 1.26e-05, + "loss": 14.2973, + "step": 24 + }, + { + "epoch": 0.11, + "learning_rate": 1.3199999999999997e-05, + "loss": 14.2664, + "step": 25 + }, + { + "epoch": 0.12, + "learning_rate": 1.3799999999999998e-05, + "loss": 16.8258, + "step": 26 + }, + { + "epoch": 0.12, + "learning_rate": 1.44e-05, + "loss": 15.7966, + "step": 27 + }, + { + "epoch": 0.13, + "learning_rate": 1.4999999999999999e-05, + "loss": 15.055, + "step": 28 + }, + { + "epoch": 0.13, + "learning_rate": 1.5599999999999996e-05, + "loss": 15.0205, + "step": 29 + }, + { + "epoch": 0.14, + "learning_rate": 1.6199999999999997e-05, + "loss": 14.2214, + "step": 30 + }, + { + "epoch": 0.14, + "learning_rate": 1.68e-05, + "loss": 15.2074, + "step": 31 + }, + { + "epoch": 0.15, + "learning_rate": 1.74e-05, + "loss": 15.798, + "step": 32 + }, + { + "epoch": 0.15, + "learning_rate": 1.7999999999999997e-05, + "loss": 13.8965, + "step": 33 + }, + { + "epoch": 0.16, + "learning_rate": 1.8599999999999998e-05, + "loss": 14.3536, + "step": 34 + }, + { + "epoch": 0.16, + "learning_rate": 1.92e-05, + "loss": 14.3478, + "step": 35 + }, + { + "epoch": 0.17, + "learning_rate": 1.98e-05, + "loss": 14.9752, + "step": 36 + }, + { + "epoch": 0.17, + "learning_rate": 2.04e-05, + "loss": 18.6472, + "step": 37 + }, + { + "epoch": 0.17, + "learning_rate": 2.1e-05, + "loss": 14.5226, + "step": 38 + }, + { + "epoch": 0.18, + "learning_rate": 2.1599999999999996e-05, + "loss": 14.5589, + "step": 39 + }, + { + "epoch": 0.18, + "learning_rate": 2.2199999999999998e-05, + "loss": 16.0441, + "step": 40 + }, + { + "epoch": 0.19, + "learning_rate": 2.28e-05, + "loss": 13.8213, + "step": 41 + }, + { + "epoch": 0.19, + "learning_rate": 2.34e-05, + "loss": 14.5297, + "step": 42 + }, + { + "epoch": 0.2, + "learning_rate": 2.3999999999999997e-05, + "loss": 13.1724, + "step": 43 + }, + { + "epoch": 0.2, + "learning_rate": 2.4599999999999998e-05, + "loss": 14.2611, + "step": 44 + }, + { + "epoch": 0.21, + "learning_rate": 2.52e-05, + "loss": 11.9516, + "step": 45 + }, + { + "epoch": 0.21, + "learning_rate": 2.5799999999999997e-05, + "loss": 13.0899, + "step": 46 + }, + { + "epoch": 0.22, + "learning_rate": 2.6399999999999995e-05, + "loss": 12.0712, + "step": 47 + }, + { + "epoch": 0.22, + "learning_rate": 2.6999999999999996e-05, + "loss": 12.1539, + "step": 48 + }, + { + "epoch": 0.22, + "learning_rate": 2.7599999999999997e-05, + "loss": 9.8547, + "step": 49 + }, + { + "epoch": 0.23, + "learning_rate": 2.8199999999999998e-05, + "loss": 12.4266, + "step": 50 + }, + { + "epoch": 0.23, + "learning_rate": 2.88e-05, + "loss": 12.3663, + "step": 51 + }, + { + "epoch": 0.24, + "learning_rate": 2.94e-05, + "loss": 10.4339, + "step": 52 + }, + { + "epoch": 0.24, + "learning_rate": 2.9999999999999997e-05, + "loss": 10.4794, + "step": 53 + }, + { + "epoch": 0.25, + "learning_rate": 3.06e-05, + "loss": 10.4132, + "step": 54 + }, + { + "epoch": 0.25, + "learning_rate": 3.119999999999999e-05, + "loss": 9.4857, + "step": 55 + }, + { + "epoch": 0.26, + "learning_rate": 3.1799999999999994e-05, + "loss": 8.9554, + "step": 56 + }, + { + "epoch": 0.26, + "learning_rate": 3.2399999999999995e-05, + "loss": 8.5082, + "step": 57 + }, + { + "epoch": 0.27, + "learning_rate": 3.2999999999999996e-05, + "loss": 7.8569, + "step": 58 + }, + { + "epoch": 0.27, + "learning_rate": 3.36e-05, + "loss": 6.6837, + "step": 59 + }, + { + "epoch": 0.28, + "learning_rate": 3.42e-05, + "loss": 6.4398, + "step": 60 + }, + { + "epoch": 0.28, + "learning_rate": 3.48e-05, + "loss": 8.0112, + "step": 61 + }, + { + "epoch": 0.28, + "learning_rate": 3.539999999999999e-05, + "loss": 6.4081, + "step": 62 + }, + { + "epoch": 0.29, + "learning_rate": 3.5999999999999994e-05, + "loss": 7.1122, + "step": 63 + }, + { + "epoch": 0.29, + "learning_rate": 3.6599999999999995e-05, + "loss": 6.9262, + "step": 64 + }, + { + "epoch": 0.3, + "learning_rate": 3.7199999999999996e-05, + "loss": 5.5841, + "step": 65 + }, + { + "epoch": 0.3, + "learning_rate": 3.78e-05, + "loss": 5.5462, + "step": 66 + }, + { + "epoch": 0.31, + "learning_rate": 3.84e-05, + "loss": 5.4808, + "step": 67 + }, + { + "epoch": 0.31, + "learning_rate": 3.9e-05, + "loss": 5.0315, + "step": 68 + }, + { + "epoch": 0.32, + "learning_rate": 3.96e-05, + "loss": 5.0318, + "step": 69 + }, + { + "epoch": 0.32, + "learning_rate": 4.02e-05, + "loss": 4.9626, + "step": 70 + }, + { + "epoch": 0.33, + "learning_rate": 4.08e-05, + "loss": 4.7453, + "step": 71 + }, + { + "epoch": 0.33, + "learning_rate": 4.14e-05, + "loss": 4.3912, + "step": 72 + }, + { + "epoch": 0.33, + "learning_rate": 4.2e-05, + "loss": 4.3047, + "step": 73 + }, + { + "epoch": 0.34, + "learning_rate": 4.259999999999999e-05, + "loss": 4.5548, + "step": 74 + }, + { + "epoch": 0.34, + "learning_rate": 4.319999999999999e-05, + "loss": 4.508, + "step": 75 + }, + { + "epoch": 0.35, + "learning_rate": 4.3799999999999994e-05, + "loss": 4.4464, + "step": 76 + }, + { + "epoch": 0.35, + "learning_rate": 4.4399999999999995e-05, + "loss": 4.2414, + "step": 77 + }, + { + "epoch": 0.36, + "learning_rate": 4.4999999999999996e-05, + "loss": 4.1008, + "step": 78 + }, + { + "epoch": 0.36, + "learning_rate": 4.56e-05, + "loss": 4.1237, + "step": 79 + }, + { + "epoch": 0.37, + "learning_rate": 4.62e-05, + "loss": 4.0586, + "step": 80 + }, + { + "epoch": 0.37, + "learning_rate": 4.68e-05, + "loss": 3.9452, + "step": 81 + }, + { + "epoch": 0.38, + "learning_rate": 4.7399999999999993e-05, + "loss": 3.9169, + "step": 82 + }, + { + "epoch": 0.38, + "learning_rate": 4.7999999999999994e-05, + "loss": 3.8635, + "step": 83 + }, + { + "epoch": 0.39, + "learning_rate": 4.8599999999999995e-05, + "loss": 3.7665, + "step": 84 + }, + { + "epoch": 0.39, + "learning_rate": 4.9199999999999997e-05, + "loss": 3.8492, + "step": 85 + }, + { + "epoch": 0.39, + "learning_rate": 4.98e-05, + "loss": 3.9107, + "step": 86 + }, + { + "epoch": 0.4, + "learning_rate": 5.04e-05, + "loss": 3.9151, + "step": 87 + }, + { + "epoch": 0.4, + "learning_rate": 5.1e-05, + "loss": 3.8423, + "step": 88 + }, + { + "epoch": 0.41, + "learning_rate": 5.1599999999999994e-05, + "loss": 3.7597, + "step": 89 + }, + { + "epoch": 0.41, + "learning_rate": 5.2199999999999995e-05, + "loss": 3.681, + "step": 90 + }, + { + "epoch": 0.42, + "learning_rate": 5.279999999999999e-05, + "loss": 3.6785, + "step": 91 + }, + { + "epoch": 0.42, + "learning_rate": 5.339999999999999e-05, + "loss": 3.5951, + "step": 92 + }, + { + "epoch": 0.43, + "learning_rate": 5.399999999999999e-05, + "loss": 3.5703, + "step": 93 + }, + { + "epoch": 0.43, + "learning_rate": 5.459999999999999e-05, + "loss": 3.532, + "step": 94 + }, + { + "epoch": 0.44, + "learning_rate": 5.519999999999999e-05, + "loss": 3.5184, + "step": 95 + }, + { + "epoch": 0.44, + "learning_rate": 5.5799999999999994e-05, + "loss": 3.5752, + "step": 96 + }, + { + "epoch": 0.44, + "learning_rate": 5.6399999999999995e-05, + "loss": 3.4547, + "step": 97 + }, + { + "epoch": 0.45, + "learning_rate": 5.6999999999999996e-05, + "loss": 3.4775, + "step": 98 + }, + { + "epoch": 0.45, + "learning_rate": 5.76e-05, + "loss": 3.5405, + "step": 99 + }, + { + "epoch": 0.46, + "learning_rate": 5.82e-05, + "loss": 3.5279, + "step": 100 + }, + { + "epoch": 0.46, + "eval_loss": 3.6259937286376953, + "eval_runtime": 20.4326, + "eval_samples_per_second": 80.606, + "eval_steps_per_second": 2.545, + "eval_wer": 1.0, + "step": 100 + }, + { + "epoch": 0.46, + "learning_rate": 5.88e-05, + "loss": 3.5642, + "step": 101 + }, + { + "epoch": 0.47, + "learning_rate": 5.94e-05, + "loss": 3.4489, + "step": 102 + }, + { + "epoch": 0.47, + "learning_rate": 5.9999999999999995e-05, + "loss": 3.4725, + "step": 103 + }, + { + "epoch": 0.48, + "learning_rate": 6.0599999999999996e-05, + "loss": 3.4266, + "step": 104 + }, + { + "epoch": 0.48, + "learning_rate": 6.12e-05, + "loss": 3.4013, + "step": 105 + }, + { + "epoch": 0.49, + "learning_rate": 6.18e-05, + "loss": 3.4105, + "step": 106 + }, + { + "epoch": 0.49, + "learning_rate": 6.239999999999999e-05, + "loss": 3.3563, + "step": 107 + }, + { + "epoch": 0.5, + "learning_rate": 6.299999999999999e-05, + "loss": 3.3259, + "step": 108 + }, + { + "epoch": 0.5, + "learning_rate": 6.359999999999999e-05, + "loss": 3.3905, + "step": 109 + }, + { + "epoch": 0.5, + "learning_rate": 6.419999999999999e-05, + "loss": 3.3447, + "step": 110 + }, + { + "epoch": 0.51, + "learning_rate": 6.479999999999999e-05, + "loss": 3.2851, + "step": 111 + }, + { + "epoch": 0.51, + "learning_rate": 6.539999999999999e-05, + "loss": 3.3613, + "step": 112 + }, + { + "epoch": 0.52, + "learning_rate": 6.599999999999999e-05, + "loss": 3.3664, + "step": 113 + }, + { + "epoch": 0.52, + "learning_rate": 6.659999999999999e-05, + "loss": 3.2941, + "step": 114 + }, + { + "epoch": 0.53, + "learning_rate": 6.72e-05, + "loss": 3.3653, + "step": 115 + }, + { + "epoch": 0.53, + "learning_rate": 6.78e-05, + "loss": 3.2863, + "step": 116 + }, + { + "epoch": 0.54, + "learning_rate": 6.84e-05, + "loss": 3.2686, + "step": 117 + }, + { + "epoch": 0.54, + "learning_rate": 6.9e-05, + "loss": 3.2546, + "step": 118 + }, + { + "epoch": 0.55, + "learning_rate": 6.96e-05, + "loss": 3.2985, + "step": 119 + }, + { + "epoch": 0.55, + "learning_rate": 7.02e-05, + "loss": 3.2561, + "step": 120 + }, + { + "epoch": 0.56, + "learning_rate": 7.079999999999999e-05, + "loss": 3.3089, + "step": 121 + }, + { + "epoch": 0.56, + "learning_rate": 7.139999999999999e-05, + "loss": 3.1919, + "step": 122 + }, + { + "epoch": 0.56, + "learning_rate": 7.199999999999999e-05, + "loss": 3.2224, + "step": 123 + }, + { + "epoch": 0.57, + "learning_rate": 7.259999999999999e-05, + "loss": 3.2414, + "step": 124 + }, + { + "epoch": 0.57, + "learning_rate": 7.319999999999999e-05, + "loss": 3.4551, + "step": 125 + }, + { + "epoch": 0.58, + "learning_rate": 7.379999999999999e-05, + "loss": 3.2746, + "step": 126 + }, + { + "epoch": 0.58, + "learning_rate": 7.439999999999999e-05, + "loss": 3.1855, + "step": 127 + }, + { + "epoch": 0.59, + "learning_rate": 7.5e-05, + "loss": 3.2839, + "step": 128 + }, + { + "epoch": 0.59, + "learning_rate": 7.56e-05, + "loss": 3.1777, + "step": 129 + }, + { + "epoch": 0.6, + "learning_rate": 7.62e-05, + "loss": 3.2051, + "step": 130 + }, + { + "epoch": 0.6, + "learning_rate": 7.68e-05, + "loss": 3.2333, + "step": 131 + }, + { + "epoch": 0.61, + "learning_rate": 7.74e-05, + "loss": 3.1937, + "step": 132 + }, + { + "epoch": 0.61, + "learning_rate": 7.8e-05, + "loss": 3.2026, + "step": 133 + }, + { + "epoch": 0.61, + "learning_rate": 7.86e-05, + "loss": 3.2164, + "step": 134 + }, + { + "epoch": 0.62, + "learning_rate": 7.92e-05, + "loss": 3.3889, + "step": 135 + }, + { + "epoch": 0.62, + "learning_rate": 7.98e-05, + "loss": 3.209, + "step": 136 + }, + { + "epoch": 0.63, + "learning_rate": 8.04e-05, + "loss": 3.1708, + "step": 137 + }, + { + "epoch": 0.63, + "learning_rate": 8.1e-05, + "loss": 3.1733, + "step": 138 + }, + { + "epoch": 0.64, + "learning_rate": 8.16e-05, + "loss": 3.252, + "step": 139 + }, + { + "epoch": 0.64, + "learning_rate": 8.22e-05, + "loss": 3.1518, + "step": 140 + }, + { + "epoch": 0.65, + "learning_rate": 8.28e-05, + "loss": 3.1317, + "step": 141 + }, + { + "epoch": 0.65, + "learning_rate": 8.34e-05, + "loss": 3.1526, + "step": 142 + }, + { + "epoch": 0.66, + "learning_rate": 8.4e-05, + "loss": 3.1526, + "step": 143 + }, + { + "epoch": 0.66, + "learning_rate": 8.459999999999998e-05, + "loss": 3.1376, + "step": 144 + }, + { + "epoch": 0.67, + "learning_rate": 8.519999999999998e-05, + "loss": 3.1413, + "step": 145 + }, + { + "epoch": 0.67, + "learning_rate": 8.579999999999998e-05, + "loss": 3.1527, + "step": 146 + }, + { + "epoch": 0.67, + "learning_rate": 8.639999999999999e-05, + "loss": 3.1245, + "step": 147 + }, + { + "epoch": 0.68, + "learning_rate": 8.699999999999999e-05, + "loss": 3.1634, + "step": 148 + }, + { + "epoch": 0.68, + "learning_rate": 8.759999999999999e-05, + "loss": 3.1574, + "step": 149 + }, + { + "epoch": 0.69, + "learning_rate": 8.819999999999999e-05, + "loss": 3.1455, + "step": 150 + }, + { + "epoch": 0.69, + "learning_rate": 8.879999999999999e-05, + "loss": 3.1262, + "step": 151 + }, + { + "epoch": 0.7, + "learning_rate": 8.939999999999999e-05, + "loss": 3.126, + "step": 152 + }, + { + "epoch": 0.7, + "learning_rate": 8.999999999999999e-05, + "loss": 3.1169, + "step": 153 + }, + { + "epoch": 0.71, + "learning_rate": 9.059999999999999e-05, + "loss": 3.1067, + "step": 154 + }, + { + "epoch": 0.71, + "learning_rate": 9.12e-05, + "loss": 3.1491, + "step": 155 + }, + { + "epoch": 0.72, + "learning_rate": 9.18e-05, + "loss": 3.1132, + "step": 156 + }, + { + "epoch": 0.72, + "learning_rate": 9.24e-05, + "loss": 3.1862, + "step": 157 + }, + { + "epoch": 0.72, + "learning_rate": 9.3e-05, + "loss": 3.1043, + "step": 158 + }, + { + "epoch": 0.73, + "learning_rate": 9.36e-05, + "loss": 3.1087, + "step": 159 + }, + { + "epoch": 0.73, + "learning_rate": 9.419999999999999e-05, + "loss": 3.1317, + "step": 160 + }, + { + "epoch": 0.74, + "learning_rate": 9.479999999999999e-05, + "loss": 3.1448, + "step": 161 + }, + { + "epoch": 0.74, + "learning_rate": 9.539999999999999e-05, + "loss": 3.2031, + "step": 162 + }, + { + "epoch": 0.75, + "learning_rate": 9.599999999999999e-05, + "loss": 3.1747, + "step": 163 + }, + { + "epoch": 0.75, + "learning_rate": 9.659999999999999e-05, + "loss": 3.123, + "step": 164 + }, + { + "epoch": 0.76, + "learning_rate": 9.719999999999999e-05, + "loss": 3.0936, + "step": 165 + }, + { + "epoch": 0.76, + "learning_rate": 9.779999999999999e-05, + "loss": 3.0991, + "step": 166 + }, + { + "epoch": 0.77, + "learning_rate": 9.839999999999999e-05, + "loss": 3.1379, + "step": 167 + }, + { + "epoch": 0.77, + "learning_rate": 9.9e-05, + "loss": 3.1083, + "step": 168 + }, + { + "epoch": 0.78, + "learning_rate": 9.96e-05, + "loss": 3.113, + "step": 169 + }, + { + "epoch": 0.78, + "learning_rate": 0.0001002, + "loss": 3.112, + "step": 170 + }, + { + "epoch": 0.78, + "learning_rate": 0.0001008, + "loss": 3.1219, + "step": 171 + }, + { + "epoch": 0.79, + "learning_rate": 0.0001014, + "loss": 3.0831, + "step": 172 + }, + { + "epoch": 0.79, + "learning_rate": 0.000102, + "loss": 3.1023, + "step": 173 + }, + { + "epoch": 0.8, + "learning_rate": 0.0001026, + "loss": 3.1149, + "step": 174 + }, + { + "epoch": 0.8, + "learning_rate": 0.00010319999999999999, + "loss": 3.2964, + "step": 175 + }, + { + "epoch": 0.81, + "learning_rate": 0.00010379999999999999, + "loss": 3.0681, + "step": 176 + }, + { + "epoch": 0.81, + "learning_rate": 0.00010439999999999999, + "loss": 3.0941, + "step": 177 + }, + { + "epoch": 0.82, + "learning_rate": 0.00010499999999999999, + "loss": 3.0497, + "step": 178 + }, + { + "epoch": 0.82, + "learning_rate": 0.00010559999999999998, + "loss": 3.1096, + "step": 179 + }, + { + "epoch": 0.83, + "learning_rate": 0.00010619999999999998, + "loss": 3.094, + "step": 180 + }, + { + "epoch": 0.83, + "learning_rate": 0.00010679999999999998, + "loss": 3.0534, + "step": 181 + }, + { + "epoch": 0.83, + "learning_rate": 0.00010739999999999998, + "loss": 3.0854, + "step": 182 + }, + { + "epoch": 0.84, + "learning_rate": 0.00010799999999999998, + "loss": 3.0604, + "step": 183 + }, + { + "epoch": 0.84, + "learning_rate": 0.00010859999999999998, + "loss": 3.065, + "step": 184 + }, + { + "epoch": 0.85, + "learning_rate": 0.00010919999999999998, + "loss": 3.0594, + "step": 185 + }, + { + "epoch": 0.85, + "learning_rate": 0.00010979999999999999, + "loss": 3.0544, + "step": 186 + }, + { + "epoch": 0.86, + "learning_rate": 0.00011039999999999999, + "loss": 3.1025, + "step": 187 + }, + { + "epoch": 0.86, + "learning_rate": 0.00011099999999999999, + "loss": 3.0866, + "step": 188 + }, + { + "epoch": 0.87, + "learning_rate": 0.00011159999999999999, + "loss": 3.0763, + "step": 189 + }, + { + "epoch": 0.87, + "learning_rate": 0.00011219999999999999, + "loss": 3.1308, + "step": 190 + }, + { + "epoch": 0.88, + "learning_rate": 0.00011279999999999999, + "loss": 3.0958, + "step": 191 + }, + { + "epoch": 0.88, + "learning_rate": 0.00011339999999999999, + "loss": 3.0392, + "step": 192 + }, + { + "epoch": 0.89, + "learning_rate": 0.00011399999999999999, + "loss": 3.0337, + "step": 193 + }, + { + "epoch": 0.89, + "learning_rate": 0.0001146, + "loss": 3.073, + "step": 194 + }, + { + "epoch": 0.89, + "learning_rate": 0.0001152, + "loss": 3.0556, + "step": 195 + }, + { + "epoch": 0.9, + "learning_rate": 0.0001158, + "loss": 3.0388, + "step": 196 + }, + { + "epoch": 0.9, + "learning_rate": 0.0001164, + "loss": 3.0549, + "step": 197 + }, + { + "epoch": 0.91, + "learning_rate": 0.000117, + "loss": 3.0708, + "step": 198 + }, + { + "epoch": 0.91, + "learning_rate": 0.0001176, + "loss": 3.0248, + "step": 199 + }, + { + "epoch": 0.92, + "learning_rate": 0.0001182, + "loss": 3.1065, + "step": 200 + }, + { + "epoch": 0.92, + "eval_loss": 3.0854454040527344, + "eval_runtime": 19.3192, + "eval_samples_per_second": 85.252, + "eval_steps_per_second": 2.692, + "eval_wer": 0.9998978653865795, + "step": 200 + }, + { + "epoch": 0.92, + "learning_rate": 0.0001188, + "loss": 2.9984, + "step": 201 + }, + { + "epoch": 0.93, + "learning_rate": 0.0001194, + "loss": 3.0534, + "step": 202 + }, + { + "epoch": 0.93, + "learning_rate": 0.00011999999999999999, + "loss": 3.0231, + "step": 203 + }, + { + "epoch": 0.94, + "learning_rate": 0.00012059999999999999, + "loss": 3.0253, + "step": 204 + }, + { + "epoch": 0.94, + "learning_rate": 0.00012119999999999999, + "loss": 3.039, + "step": 205 + }, + { + "epoch": 0.94, + "learning_rate": 0.00012179999999999999, + "loss": 2.9975, + "step": 206 + }, + { + "epoch": 0.95, + "learning_rate": 0.0001224, + "loss": 3.0295, + "step": 207 + }, + { + "epoch": 0.95, + "learning_rate": 0.00012299999999999998, + "loss": 2.9992, + "step": 208 + }, + { + "epoch": 0.96, + "learning_rate": 0.0001236, + "loss": 3.0003, + "step": 209 + }, + { + "epoch": 0.96, + "learning_rate": 0.00012419999999999998, + "loss": 3.0434, + "step": 210 + }, + { + "epoch": 0.97, + "learning_rate": 0.00012479999999999997, + "loss": 3.0253, + "step": 211 + }, + { + "epoch": 0.97, + "learning_rate": 0.00012539999999999999, + "loss": 2.9991, + "step": 212 + }, + { + "epoch": 0.98, + "learning_rate": 0.00012599999999999997, + "loss": 2.9954, + "step": 213 + }, + { + "epoch": 0.98, + "learning_rate": 0.0001266, + "loss": 2.9762, + "step": 214 + }, + { + "epoch": 0.99, + "learning_rate": 0.00012719999999999997, + "loss": 2.9941, + "step": 215 + }, + { + "epoch": 0.99, + "learning_rate": 0.0001278, + "loss": 2.9615, + "step": 216 + }, + { + "epoch": 1.0, + "learning_rate": 0.00012839999999999998, + "loss": 2.9958, + "step": 217 + }, + { + "epoch": 1.0, + "learning_rate": 0.000129, + "loss": 2.9472, + "step": 218 + }, + { + "epoch": 1.0, + "learning_rate": 0.00012959999999999998, + "loss": 2.9857, + "step": 219 + }, + { + "epoch": 1.01, + "learning_rate": 0.0001302, + "loss": 2.999, + "step": 220 + }, + { + "epoch": 1.01, + "learning_rate": 0.00013079999999999998, + "loss": 2.9784, + "step": 221 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001314, + "loss": 2.9604, + "step": 222 + }, + { + "epoch": 1.02, + "learning_rate": 0.00013199999999999998, + "loss": 2.9818, + "step": 223 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001326, + "loss": 2.9194, + "step": 224 + }, + { + "epoch": 1.03, + "learning_rate": 0.00013319999999999999, + "loss": 2.9667, + "step": 225 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001338, + "loss": 2.9552, + "step": 226 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001344, + "loss": 2.9878, + "step": 227 + }, + { + "epoch": 1.05, + "learning_rate": 0.000135, + "loss": 2.9488, + "step": 228 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001356, + "loss": 2.906, + "step": 229 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001362, + "loss": 2.8929, + "step": 230 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001368, + "loss": 3.1133, + "step": 231 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001374, + "loss": 2.9066, + "step": 232 + }, + { + "epoch": 1.07, + "learning_rate": 0.000138, + "loss": 2.9071, + "step": 233 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001386, + "loss": 2.8765, + "step": 234 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001392, + "loss": 2.9141, + "step": 235 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013979999999999998, + "loss": 2.8857, + "step": 236 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001404, + "loss": 2.9141, + "step": 237 + }, + { + "epoch": 1.09, + "learning_rate": 0.00014099999999999998, + "loss": 2.8668, + "step": 238 + }, + { + "epoch": 1.1, + "learning_rate": 0.00014159999999999997, + "loss": 2.9031, + "step": 239 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001422, + "loss": 2.8726, + "step": 240 + }, + { + "epoch": 1.11, + "learning_rate": 0.00014279999999999997, + "loss": 2.8211, + "step": 241 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001434, + "loss": 2.8378, + "step": 242 + }, + { + "epoch": 1.11, + "learning_rate": 0.00014399999999999998, + "loss": 2.7359, + "step": 243 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001446, + "loss": 2.8586, + "step": 244 + }, + { + "epoch": 1.12, + "learning_rate": 0.00014519999999999998, + "loss": 2.9244, + "step": 245 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001458, + "loss": 2.7991, + "step": 246 + }, + { + "epoch": 1.13, + "learning_rate": 0.00014639999999999998, + "loss": 2.7786, + "step": 247 + }, + { + "epoch": 1.14, + "learning_rate": 0.000147, + "loss": 2.7631, + "step": 248 + }, + { + "epoch": 1.14, + "learning_rate": 0.00014759999999999998, + "loss": 2.7781, + "step": 249 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001482, + "loss": 2.7549, + "step": 250 + }, + { + "epoch": 1.15, + "learning_rate": 0.00014879999999999998, + "loss": 2.7679, + "step": 251 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001494, + "loss": 2.6569, + "step": 252 + }, + { + "epoch": 1.16, + "learning_rate": 0.00015, + "loss": 2.7576, + "step": 253 + }, + { + "epoch": 1.17, + "learning_rate": 0.00015059999999999997, + "loss": 2.6871, + "step": 254 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001512, + "loss": 2.6551, + "step": 255 + }, + { + "epoch": 1.17, + "learning_rate": 0.00015179999999999998, + "loss": 2.7003, + "step": 256 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001524, + "loss": 2.6276, + "step": 257 + }, + { + "epoch": 1.18, + "learning_rate": 0.00015299999999999998, + "loss": 2.5764, + "step": 258 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001536, + "loss": 2.5949, + "step": 259 + }, + { + "epoch": 1.19, + "learning_rate": 0.00015419999999999998, + "loss": 2.6128, + "step": 260 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001548, + "loss": 2.5063, + "step": 261 + }, + { + "epoch": 1.2, + "learning_rate": 0.00015539999999999998, + "loss": 2.5349, + "step": 262 + }, + { + "epoch": 1.21, + "learning_rate": 0.000156, + "loss": 2.4755, + "step": 263 + }, + { + "epoch": 1.21, + "learning_rate": 0.00015659999999999998, + "loss": 2.4868, + "step": 264 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001572, + "loss": 2.4275, + "step": 265 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001578, + "loss": 2.4221, + "step": 266 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001584, + "loss": 2.4349, + "step": 267 + }, + { + "epoch": 1.23, + "learning_rate": 0.000159, + "loss": 2.4545, + "step": 268 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001596, + "loss": 2.2887, + "step": 269 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001602, + "loss": 2.2839, + "step": 270 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001608, + "loss": 2.293, + "step": 271 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001614, + "loss": 2.2178, + "step": 272 + }, + { + "epoch": 1.25, + "learning_rate": 0.000162, + "loss": 2.3226, + "step": 273 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001626, + "loss": 2.1947, + "step": 274 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001632, + "loss": 2.3214, + "step": 275 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001638, + "loss": 2.1865, + "step": 276 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001644, + "loss": 2.1142, + "step": 277 + }, + { + "epoch": 1.28, + "learning_rate": 0.000165, + "loss": 2.1584, + "step": 278 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001656, + "loss": 2.0077, + "step": 279 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001662, + "loss": 2.1195, + "step": 280 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001668, + "loss": 2.0604, + "step": 281 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001674, + "loss": 2.0327, + "step": 282 + }, + { + "epoch": 1.3, + "learning_rate": 0.000168, + "loss": 1.9262, + "step": 283 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001686, + "loss": 1.8818, + "step": 284 + }, + { + "epoch": 1.31, + "learning_rate": 0.00016919999999999997, + "loss": 1.8269, + "step": 285 + }, + { + "epoch": 1.31, + "learning_rate": 0.00016979999999999998, + "loss": 1.8953, + "step": 286 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017039999999999997, + "loss": 1.7336, + "step": 287 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017099999999999998, + "loss": 1.645, + "step": 288 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017159999999999997, + "loss": 1.8061, + "step": 289 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017219999999999998, + "loss": 1.7541, + "step": 290 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017279999999999997, + "loss": 1.6656, + "step": 291 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017339999999999996, + "loss": 1.6104, + "step": 292 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017399999999999997, + "loss": 1.5956, + "step": 293 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017459999999999996, + "loss": 1.5557, + "step": 294 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017519999999999998, + "loss": 1.5096, + "step": 295 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017579999999999996, + "loss": 1.4378, + "step": 296 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017639999999999998, + "loss": 1.3679, + "step": 297 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017699999999999997, + "loss": 1.2993, + "step": 298 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017759999999999998, + "loss": 1.3469, + "step": 299 + }, + { + "epoch": 1.38, + "learning_rate": 0.00017819999999999997, + "loss": 1.4111, + "step": 300 + }, + { + "epoch": 1.38, + "eval_loss": 1.3343250751495361, + "eval_runtime": 19.9971, + "eval_samples_per_second": 82.362, + "eval_steps_per_second": 2.6, + "eval_wer": 0.8838729445409049, + "step": 300 + }, + { + "epoch": 1.38, + "learning_rate": 0.00017879999999999998, + "loss": 1.3293, + "step": 301 + }, + { + "epoch": 1.39, + "learning_rate": 0.00017939999999999997, + "loss": 1.3517, + "step": 302 + }, + { + "epoch": 1.39, + "learning_rate": 0.00017999999999999998, + "loss": 1.4294, + "step": 303 + }, + { + "epoch": 1.39, + "learning_rate": 0.00018059999999999997, + "loss": 1.2516, + "step": 304 + }, + { + "epoch": 1.4, + "learning_rate": 0.00018119999999999999, + "loss": 1.37, + "step": 305 + }, + { + "epoch": 1.4, + "learning_rate": 0.00018179999999999997, + "loss": 1.5296, + "step": 306 + }, + { + "epoch": 1.41, + "learning_rate": 0.0001824, + "loss": 1.3691, + "step": 307 + }, + { + "epoch": 1.41, + "learning_rate": 0.00018299999999999998, + "loss": 1.2799, + "step": 308 + }, + { + "epoch": 1.42, + "learning_rate": 0.0001836, + "loss": 1.0779, + "step": 309 + }, + { + "epoch": 1.42, + "learning_rate": 0.00018419999999999998, + "loss": 1.2617, + "step": 310 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001848, + "loss": 1.3178, + "step": 311 + }, + { + "epoch": 1.43, + "learning_rate": 0.00018539999999999998, + "loss": 1.1695, + "step": 312 + }, + { + "epoch": 1.44, + "learning_rate": 0.000186, + "loss": 1.2951, + "step": 313 + }, + { + "epoch": 1.44, + "learning_rate": 0.00018659999999999998, + "loss": 1.3405, + "step": 314 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001872, + "loss": 1.1029, + "step": 315 + }, + { + "epoch": 1.45, + "learning_rate": 0.00018779999999999998, + "loss": 1.1497, + "step": 316 + }, + { + "epoch": 1.45, + "learning_rate": 0.00018839999999999997, + "loss": 1.4485, + "step": 317 + }, + { + "epoch": 1.46, + "learning_rate": 0.00018899999999999999, + "loss": 1.3151, + "step": 318 + }, + { + "epoch": 1.46, + "learning_rate": 0.00018959999999999997, + "loss": 1.155, + "step": 319 + }, + { + "epoch": 1.47, + "learning_rate": 0.0001902, + "loss": 1.0607, + "step": 320 + }, + { + "epoch": 1.47, + "learning_rate": 0.00019079999999999998, + "loss": 1.0575, + "step": 321 + }, + { + "epoch": 1.48, + "learning_rate": 0.0001914, + "loss": 0.936, + "step": 322 + }, + { + "epoch": 1.48, + "learning_rate": 0.00019199999999999998, + "loss": 1.036, + "step": 323 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001926, + "loss": 1.0238, + "step": 324 + }, + { + "epoch": 1.49, + "learning_rate": 0.00019319999999999998, + "loss": 0.9693, + "step": 325 + }, + { + "epoch": 1.5, + "learning_rate": 0.0001938, + "loss": 1.1125, + "step": 326 + }, + { + "epoch": 1.5, + "learning_rate": 0.00019439999999999998, + "loss": 0.95, + "step": 327 + }, + { + "epoch": 1.5, + "learning_rate": 0.000195, + "loss": 1.1083, + "step": 328 + }, + { + "epoch": 1.51, + "learning_rate": 0.00019559999999999998, + "loss": 1.192, + "step": 329 + }, + { + "epoch": 1.51, + "learning_rate": 0.0001962, + "loss": 1.1514, + "step": 330 + }, + { + "epoch": 1.52, + "learning_rate": 0.00019679999999999999, + "loss": 1.099, + "step": 331 + }, + { + "epoch": 1.52, + "learning_rate": 0.0001974, + "loss": 0.9299, + "step": 332 + }, + { + "epoch": 1.53, + "learning_rate": 0.000198, + "loss": 0.9884, + "step": 333 + }, + { + "epoch": 1.53, + "learning_rate": 0.0001986, + "loss": 0.7696, + "step": 334 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001992, + "loss": 0.9232, + "step": 335 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001998, + "loss": 0.8012, + "step": 336 + }, + { + "epoch": 1.55, + "learning_rate": 0.0002004, + "loss": 0.8451, + "step": 337 + }, + { + "epoch": 1.55, + "learning_rate": 0.000201, + "loss": 1.0069, + "step": 338 + }, + { + "epoch": 1.56, + "learning_rate": 0.0002016, + "loss": 1.0612, + "step": 339 + }, + { + "epoch": 1.56, + "learning_rate": 0.0002022, + "loss": 1.0388, + "step": 340 + }, + { + "epoch": 1.56, + "learning_rate": 0.0002028, + "loss": 0.9696, + "step": 341 + }, + { + "epoch": 1.57, + "learning_rate": 0.00020339999999999998, + "loss": 0.9102, + "step": 342 + }, + { + "epoch": 1.57, + "learning_rate": 0.000204, + "loss": 1.0963, + "step": 343 + }, + { + "epoch": 1.58, + "learning_rate": 0.00020459999999999999, + "loss": 0.8709, + "step": 344 + }, + { + "epoch": 1.58, + "learning_rate": 0.0002052, + "loss": 0.9816, + "step": 345 + }, + { + "epoch": 1.59, + "learning_rate": 0.0002058, + "loss": 1.2273, + "step": 346 + }, + { + "epoch": 1.59, + "learning_rate": 0.00020639999999999998, + "loss": 0.9663, + "step": 347 + }, + { + "epoch": 1.6, + "learning_rate": 0.00020699999999999996, + "loss": 0.9226, + "step": 348 + }, + { + "epoch": 1.6, + "learning_rate": 0.00020759999999999998, + "loss": 1.1023, + "step": 349 + }, + { + "epoch": 1.61, + "learning_rate": 0.00020819999999999996, + "loss": 0.9998, + "step": 350 + }, + { + "epoch": 1.61, + "learning_rate": 0.00020879999999999998, + "loss": 0.8283, + "step": 351 + }, + { + "epoch": 1.61, + "learning_rate": 0.00020939999999999997, + "loss": 0.9796, + "step": 352 + }, + { + "epoch": 1.62, + "learning_rate": 0.00020999999999999998, + "loss": 0.8152, + "step": 353 + }, + { + "epoch": 1.62, + "learning_rate": 0.00021059999999999997, + "loss": 0.8963, + "step": 354 + }, + { + "epoch": 1.63, + "learning_rate": 0.00021119999999999996, + "loss": 1.1644, + "step": 355 + }, + { + "epoch": 1.63, + "learning_rate": 0.00021179999999999997, + "loss": 0.988, + "step": 356 + }, + { + "epoch": 1.64, + "learning_rate": 0.00021239999999999996, + "loss": 0.8421, + "step": 357 + }, + { + "epoch": 1.64, + "learning_rate": 0.00021299999999999997, + "loss": 0.8731, + "step": 358 + }, + { + "epoch": 1.65, + "learning_rate": 0.00021359999999999996, + "loss": 0.8543, + "step": 359 + }, + { + "epoch": 1.65, + "learning_rate": 0.00021419999999999998, + "loss": 0.6779, + "step": 360 + }, + { + "epoch": 1.66, + "learning_rate": 0.00021479999999999996, + "loss": 0.8892, + "step": 361 + }, + { + "epoch": 1.66, + "learning_rate": 0.00021539999999999998, + "loss": 0.8471, + "step": 362 + }, + { + "epoch": 1.67, + "learning_rate": 0.00021599999999999996, + "loss": 0.8519, + "step": 363 + }, + { + "epoch": 1.67, + "learning_rate": 0.00021659999999999998, + "loss": 0.8634, + "step": 364 + }, + { + "epoch": 1.67, + "learning_rate": 0.00021719999999999997, + "loss": 0.9264, + "step": 365 + }, + { + "epoch": 1.68, + "learning_rate": 0.00021779999999999998, + "loss": 0.857, + "step": 366 + }, + { + "epoch": 1.68, + "learning_rate": 0.00021839999999999997, + "loss": 0.9735, + "step": 367 + }, + { + "epoch": 1.69, + "learning_rate": 0.00021899999999999998, + "loss": 0.9344, + "step": 368 + }, + { + "epoch": 1.69, + "learning_rate": 0.00021959999999999997, + "loss": 0.7254, + "step": 369 + }, + { + "epoch": 1.7, + "learning_rate": 0.00022019999999999999, + "loss": 0.7991, + "step": 370 + }, + { + "epoch": 1.7, + "learning_rate": 0.00022079999999999997, + "loss": 0.8007, + "step": 371 + }, + { + "epoch": 1.71, + "learning_rate": 0.0002214, + "loss": 0.8409, + "step": 372 + }, + { + "epoch": 1.71, + "learning_rate": 0.00022199999999999998, + "loss": 0.9158, + "step": 373 + }, + { + "epoch": 1.72, + "learning_rate": 0.0002226, + "loss": 0.7143, + "step": 374 + }, + { + "epoch": 1.72, + "learning_rate": 0.00022319999999999998, + "loss": 0.8136, + "step": 375 + }, + { + "epoch": 1.72, + "learning_rate": 0.0002238, + "loss": 0.7984, + "step": 376 + }, + { + "epoch": 1.73, + "learning_rate": 0.00022439999999999998, + "loss": 0.8392, + "step": 377 + }, + { + "epoch": 1.73, + "learning_rate": 0.000225, + "loss": 0.89, + "step": 378 + }, + { + "epoch": 1.74, + "learning_rate": 0.00022559999999999998, + "loss": 0.9143, + "step": 379 + }, + { + "epoch": 1.74, + "learning_rate": 0.00022619999999999997, + "loss": 0.991, + "step": 380 + }, + { + "epoch": 1.75, + "learning_rate": 0.00022679999999999998, + "loss": 0.8197, + "step": 381 + }, + { + "epoch": 1.75, + "learning_rate": 0.00022739999999999997, + "loss": 0.8955, + "step": 382 + }, + { + "epoch": 1.76, + "learning_rate": 0.00022799999999999999, + "loss": 0.7606, + "step": 383 + }, + { + "epoch": 1.76, + "learning_rate": 0.00022859999999999997, + "loss": 0.7698, + "step": 384 + }, + { + "epoch": 1.77, + "learning_rate": 0.0002292, + "loss": 0.6944, + "step": 385 + }, + { + "epoch": 1.77, + "learning_rate": 0.00022979999999999997, + "loss": 0.7642, + "step": 386 + }, + { + "epoch": 1.78, + "learning_rate": 0.0002304, + "loss": 0.719, + "step": 387 + }, + { + "epoch": 1.78, + "learning_rate": 0.00023099999999999998, + "loss": 0.8895, + "step": 388 + }, + { + "epoch": 1.78, + "learning_rate": 0.0002316, + "loss": 0.7644, + "step": 389 + }, + { + "epoch": 1.79, + "learning_rate": 0.00023219999999999998, + "loss": 0.7878, + "step": 390 + }, + { + "epoch": 1.79, + "learning_rate": 0.0002328, + "loss": 0.873, + "step": 391 + }, + { + "epoch": 1.8, + "learning_rate": 0.00023339999999999998, + "loss": 0.7841, + "step": 392 + }, + { + "epoch": 1.8, + "learning_rate": 0.000234, + "loss": 1.0839, + "step": 393 + }, + { + "epoch": 1.81, + "learning_rate": 0.00023459999999999998, + "loss": 0.7284, + "step": 394 + }, + { + "epoch": 1.81, + "learning_rate": 0.0002352, + "loss": 0.6401, + "step": 395 + }, + { + "epoch": 1.82, + "learning_rate": 0.00023579999999999999, + "loss": 0.7563, + "step": 396 + }, + { + "epoch": 1.82, + "learning_rate": 0.0002364, + "loss": 0.6997, + "step": 397 + }, + { + "epoch": 1.83, + "learning_rate": 0.000237, + "loss": 0.6203, + "step": 398 + }, + { + "epoch": 1.83, + "learning_rate": 0.0002376, + "loss": 0.6935, + "step": 399 + }, + { + "epoch": 1.83, + "learning_rate": 0.0002382, + "loss": 0.8468, + "step": 400 + }, + { + "epoch": 1.83, + "eval_loss": 0.692014753818512, + "eval_runtime": 19.5046, + "eval_samples_per_second": 84.442, + "eval_steps_per_second": 2.666, + "eval_wer": 0.6825656214891227, + "step": 400 + }, + { + "epoch": 1.84, + "learning_rate": 0.0002388, + "loss": 0.6707, + "step": 401 + }, + { + "epoch": 1.84, + "learning_rate": 0.0002394, + "loss": 0.8036, + "step": 402 + }, + { + "epoch": 1.85, + "learning_rate": 0.00023999999999999998, + "loss": 0.971, + "step": 403 + }, + { + "epoch": 1.85, + "learning_rate": 0.0002406, + "loss": 0.6798, + "step": 404 + }, + { + "epoch": 1.86, + "learning_rate": 0.00024119999999999998, + "loss": 0.7999, + "step": 405 + }, + { + "epoch": 1.86, + "learning_rate": 0.0002418, + "loss": 0.9365, + "step": 406 + }, + { + "epoch": 1.87, + "learning_rate": 0.00024239999999999998, + "loss": 0.7161, + "step": 407 + }, + { + "epoch": 1.87, + "learning_rate": 0.000243, + "loss": 0.8427, + "step": 408 + }, + { + "epoch": 1.88, + "learning_rate": 0.00024359999999999999, + "loss": 0.6813, + "step": 409 + }, + { + "epoch": 1.88, + "learning_rate": 0.00024419999999999997, + "loss": 0.6434, + "step": 410 + }, + { + "epoch": 1.89, + "learning_rate": 0.0002448, + "loss": 0.6436, + "step": 411 + }, + { + "epoch": 1.89, + "learning_rate": 0.00024539999999999995, + "loss": 0.7713, + "step": 412 + }, + { + "epoch": 1.89, + "learning_rate": 0.00024599999999999996, + "loss": 0.7949, + "step": 413 + }, + { + "epoch": 1.9, + "learning_rate": 0.0002466, + "loss": 0.7668, + "step": 414 + }, + { + "epoch": 1.9, + "learning_rate": 0.0002472, + "loss": 0.8215, + "step": 415 + }, + { + "epoch": 1.91, + "learning_rate": 0.00024779999999999995, + "loss": 0.8111, + "step": 416 + }, + { + "epoch": 1.91, + "learning_rate": 0.00024839999999999997, + "loss": 0.6129, + "step": 417 + }, + { + "epoch": 1.92, + "learning_rate": 0.000249, + "loss": 0.8391, + "step": 418 + }, + { + "epoch": 1.92, + "learning_rate": 0.00024959999999999994, + "loss": 0.6582, + "step": 419 + }, + { + "epoch": 1.93, + "learning_rate": 0.00025019999999999996, + "loss": 0.7226, + "step": 420 + }, + { + "epoch": 1.93, + "learning_rate": 0.00025079999999999997, + "loss": 0.623, + "step": 421 + }, + { + "epoch": 1.94, + "learning_rate": 0.0002514, + "loss": 0.7838, + "step": 422 + }, + { + "epoch": 1.94, + "learning_rate": 0.00025199999999999995, + "loss": 0.7061, + "step": 423 + }, + { + "epoch": 1.94, + "learning_rate": 0.00025259999999999996, + "loss": 0.6168, + "step": 424 + }, + { + "epoch": 1.95, + "learning_rate": 0.0002532, + "loss": 0.7388, + "step": 425 + }, + { + "epoch": 1.95, + "learning_rate": 0.0002538, + "loss": 0.8077, + "step": 426 + }, + { + "epoch": 1.96, + "learning_rate": 0.00025439999999999995, + "loss": 0.6856, + "step": 427 + }, + { + "epoch": 1.96, + "learning_rate": 0.00025499999999999996, + "loss": 0.7415, + "step": 428 + }, + { + "epoch": 1.97, + "learning_rate": 0.0002556, + "loss": 0.7806, + "step": 429 + }, + { + "epoch": 1.97, + "learning_rate": 0.0002562, + "loss": 0.8834, + "step": 430 + }, + { + "epoch": 1.98, + "learning_rate": 0.00025679999999999995, + "loss": 0.7889, + "step": 431 + }, + { + "epoch": 1.98, + "learning_rate": 0.00025739999999999997, + "loss": 0.7095, + "step": 432 + }, + { + "epoch": 1.99, + "learning_rate": 0.000258, + "loss": 0.6953, + "step": 433 + }, + { + "epoch": 1.99, + "learning_rate": 0.0002586, + "loss": 0.6881, + "step": 434 + }, + { + "epoch": 2.0, + "learning_rate": 0.00025919999999999996, + "loss": 0.7854, + "step": 435 + }, + { + "epoch": 2.0, + "learning_rate": 0.00025979999999999997, + "loss": 0.6099, + "step": 436 + }, + { + "epoch": 2.0, + "learning_rate": 0.0002604, + "loss": 0.5593, + "step": 437 + }, + { + "epoch": 2.01, + "learning_rate": 0.000261, + "loss": 0.5701, + "step": 438 + }, + { + "epoch": 2.01, + "learning_rate": 0.00026159999999999996, + "loss": 0.6773, + "step": 439 + }, + { + "epoch": 2.02, + "learning_rate": 0.0002622, + "loss": 0.5321, + "step": 440 + }, + { + "epoch": 2.02, + "learning_rate": 0.0002628, + "loss": 0.6292, + "step": 441 + }, + { + "epoch": 2.03, + "learning_rate": 0.00026339999999999995, + "loss": 0.6741, + "step": 442 + }, + { + "epoch": 2.03, + "learning_rate": 0.00026399999999999997, + "loss": 0.699, + "step": 443 + }, + { + "epoch": 2.04, + "learning_rate": 0.0002646, + "loss": 0.5483, + "step": 444 + }, + { + "epoch": 2.04, + "learning_rate": 0.0002652, + "loss": 0.8357, + "step": 445 + }, + { + "epoch": 2.05, + "learning_rate": 0.00026579999999999996, + "loss": 0.6346, + "step": 446 + }, + { + "epoch": 2.05, + "learning_rate": 0.00026639999999999997, + "loss": 0.5685, + "step": 447 + }, + { + "epoch": 2.06, + "learning_rate": 0.000267, + "loss": 0.7488, + "step": 448 + }, + { + "epoch": 2.06, + "learning_rate": 0.0002676, + "loss": 0.7929, + "step": 449 + }, + { + "epoch": 2.06, + "learning_rate": 0.00026819999999999996, + "loss": 0.4677, + "step": 450 + }, + { + "epoch": 2.07, + "learning_rate": 0.0002688, + "loss": 0.4193, + "step": 451 + }, + { + "epoch": 2.07, + "learning_rate": 0.0002694, + "loss": 0.5116, + "step": 452 + }, + { + "epoch": 2.08, + "learning_rate": 0.00027, + "loss": 0.5462, + "step": 453 + }, + { + "epoch": 2.08, + "learning_rate": 0.00027059999999999996, + "loss": 0.4695, + "step": 454 + }, + { + "epoch": 2.09, + "learning_rate": 0.0002712, + "loss": 0.549, + "step": 455 + }, + { + "epoch": 2.09, + "learning_rate": 0.0002718, + "loss": 0.5873, + "step": 456 + }, + { + "epoch": 2.1, + "learning_rate": 0.0002724, + "loss": 0.6156, + "step": 457 + }, + { + "epoch": 2.1, + "learning_rate": 0.00027299999999999997, + "loss": 0.4681, + "step": 458 + }, + { + "epoch": 2.11, + "learning_rate": 0.0002736, + "loss": 0.5675, + "step": 459 + }, + { + "epoch": 2.11, + "learning_rate": 0.0002742, + "loss": 0.4059, + "step": 460 + }, + { + "epoch": 2.11, + "learning_rate": 0.0002748, + "loss": 0.7245, + "step": 461 + }, + { + "epoch": 2.12, + "learning_rate": 0.00027539999999999997, + "loss": 0.5192, + "step": 462 + }, + { + "epoch": 2.12, + "learning_rate": 0.000276, + "loss": 0.5812, + "step": 463 + }, + { + "epoch": 2.13, + "learning_rate": 0.0002766, + "loss": 0.5368, + "step": 464 + }, + { + "epoch": 2.13, + "learning_rate": 0.0002772, + "loss": 0.5222, + "step": 465 + }, + { + "epoch": 2.14, + "learning_rate": 0.0002778, + "loss": 0.7377, + "step": 466 + }, + { + "epoch": 2.14, + "learning_rate": 0.0002784, + "loss": 0.5249, + "step": 467 + }, + { + "epoch": 2.15, + "learning_rate": 0.000279, + "loss": 0.6471, + "step": 468 + }, + { + "epoch": 2.15, + "learning_rate": 0.00027959999999999997, + "loss": 0.4833, + "step": 469 + }, + { + "epoch": 2.16, + "learning_rate": 0.0002802, + "loss": 0.5598, + "step": 470 + }, + { + "epoch": 2.16, + "learning_rate": 0.0002808, + "loss": 0.7067, + "step": 471 + }, + { + "epoch": 2.17, + "learning_rate": 0.00028139999999999996, + "loss": 0.6439, + "step": 472 + }, + { + "epoch": 2.17, + "learning_rate": 0.00028199999999999997, + "loss": 0.7628, + "step": 473 + }, + { + "epoch": 2.17, + "learning_rate": 0.0002826, + "loss": 0.7442, + "step": 474 + }, + { + "epoch": 2.18, + "learning_rate": 0.00028319999999999994, + "loss": 0.5266, + "step": 475 + }, + { + "epoch": 2.18, + "learning_rate": 0.00028379999999999996, + "loss": 0.5018, + "step": 476 + }, + { + "epoch": 2.19, + "learning_rate": 0.0002844, + "loss": 0.651, + "step": 477 + }, + { + "epoch": 2.19, + "learning_rate": 0.000285, + "loss": 0.4145, + "step": 478 + }, + { + "epoch": 2.2, + "learning_rate": 0.00028559999999999995, + "loss": 0.4896, + "step": 479 + }, + { + "epoch": 2.2, + "learning_rate": 0.00028619999999999996, + "loss": 0.4544, + "step": 480 + }, + { + "epoch": 2.21, + "learning_rate": 0.0002868, + "loss": 0.6213, + "step": 481 + }, + { + "epoch": 2.21, + "learning_rate": 0.00028739999999999994, + "loss": 0.6391, + "step": 482 + }, + { + "epoch": 2.22, + "learning_rate": 0.00028799999999999995, + "loss": 0.5104, + "step": 483 + }, + { + "epoch": 2.22, + "learning_rate": 0.00028859999999999997, + "loss": 0.5111, + "step": 484 + }, + { + "epoch": 2.22, + "learning_rate": 0.0002892, + "loss": 0.5529, + "step": 485 + }, + { + "epoch": 2.23, + "learning_rate": 0.00028979999999999994, + "loss": 0.6238, + "step": 486 + }, + { + "epoch": 2.23, + "learning_rate": 0.00029039999999999996, + "loss": 0.5365, + "step": 487 + }, + { + "epoch": 2.24, + "learning_rate": 0.00029099999999999997, + "loss": 0.5393, + "step": 488 + }, + { + "epoch": 2.24, + "learning_rate": 0.0002916, + "loss": 0.4915, + "step": 489 + }, + { + "epoch": 2.25, + "learning_rate": 0.00029219999999999995, + "loss": 0.5283, + "step": 490 + }, + { + "epoch": 2.25, + "learning_rate": 0.00029279999999999996, + "loss": 0.4564, + "step": 491 + }, + { + "epoch": 2.26, + "learning_rate": 0.0002934, + "loss": 0.5635, + "step": 492 + }, + { + "epoch": 2.26, + "learning_rate": 0.000294, + "loss": 0.4919, + "step": 493 + }, + { + "epoch": 2.27, + "learning_rate": 0.00029459999999999995, + "loss": 0.5222, + "step": 494 + }, + { + "epoch": 2.27, + "learning_rate": 0.00029519999999999997, + "loss": 0.6204, + "step": 495 + }, + { + "epoch": 2.28, + "learning_rate": 0.0002958, + "loss": 0.5362, + "step": 496 + }, + { + "epoch": 2.28, + "learning_rate": 0.0002964, + "loss": 0.678, + "step": 497 + }, + { + "epoch": 2.28, + "learning_rate": 0.00029699999999999996, + "loss": 0.6999, + "step": 498 + }, + { + "epoch": 2.29, + "learning_rate": 0.00029759999999999997, + "loss": 0.4806, + "step": 499 + }, + { + "epoch": 2.29, + "learning_rate": 0.0002982, + "loss": 0.6242, + "step": 500 + }, + { + "epoch": 2.29, + "eval_loss": 0.6000840663909912, + "eval_runtime": 19.7908, + "eval_samples_per_second": 83.22, + "eval_steps_per_second": 2.627, + "eval_wer": 0.5996323153916863, + "step": 500 + }, + { + "epoch": 2.3, + "learning_rate": 0.0002988, + "loss": 0.6511, + "step": 501 + }, + { + "epoch": 2.3, + "learning_rate": 0.00029939999999999996, + "loss": 0.4897, + "step": 502 + }, + { + "epoch": 2.31, + "learning_rate": 0.0003, + "loss": 0.5596, + "step": 503 + }, + { + "epoch": 2.31, + "learning_rate": 0.0002998916967509025, + "loss": 0.4925, + "step": 504 + }, + { + "epoch": 2.32, + "learning_rate": 0.000299783393501805, + "loss": 0.6507, + "step": 505 + }, + { + "epoch": 2.32, + "learning_rate": 0.00029967509025270755, + "loss": 0.4848, + "step": 506 + }, + { + "epoch": 2.33, + "learning_rate": 0.0002995667870036101, + "loss": 0.6709, + "step": 507 + }, + { + "epoch": 2.33, + "learning_rate": 0.0002994584837545126, + "loss": 0.5344, + "step": 508 + }, + { + "epoch": 2.33, + "learning_rate": 0.0002993501805054151, + "loss": 0.6344, + "step": 509 + }, + { + "epoch": 2.34, + "learning_rate": 0.00029924187725631767, + "loss": 0.5436, + "step": 510 + }, + { + "epoch": 2.34, + "learning_rate": 0.00029913357400722016, + "loss": 0.5667, + "step": 511 + }, + { + "epoch": 2.35, + "learning_rate": 0.0002990252707581227, + "loss": 0.4495, + "step": 512 + }, + { + "epoch": 2.35, + "learning_rate": 0.00029891696750902524, + "loss": 0.5633, + "step": 513 + }, + { + "epoch": 2.36, + "learning_rate": 0.0002988086642599278, + "loss": 0.4858, + "step": 514 + }, + { + "epoch": 2.36, + "learning_rate": 0.00029870036101083033, + "loss": 0.5676, + "step": 515 + }, + { + "epoch": 2.37, + "learning_rate": 0.0002985920577617328, + "loss": 0.503, + "step": 516 + }, + { + "epoch": 2.37, + "learning_rate": 0.00029848375451263536, + "loss": 0.47, + "step": 517 + }, + { + "epoch": 2.38, + "learning_rate": 0.0002983754512635379, + "loss": 0.5169, + "step": 518 + }, + { + "epoch": 2.38, + "learning_rate": 0.0002982671480144404, + "loss": 0.712, + "step": 519 + }, + { + "epoch": 2.39, + "learning_rate": 0.00029815884476534294, + "loss": 0.516, + "step": 520 + }, + { + "epoch": 2.39, + "learning_rate": 0.0002980505415162455, + "loss": 0.564, + "step": 521 + }, + { + "epoch": 2.39, + "learning_rate": 0.00029794223826714797, + "loss": 0.6259, + "step": 522 + }, + { + "epoch": 2.4, + "learning_rate": 0.0002978339350180505, + "loss": 0.7627, + "step": 523 + }, + { + "epoch": 2.4, + "learning_rate": 0.00029772563176895306, + "loss": 0.5792, + "step": 524 + }, + { + "epoch": 2.41, + "learning_rate": 0.00029761732851985555, + "loss": 0.5537, + "step": 525 + }, + { + "epoch": 2.41, + "learning_rate": 0.0002975090252707581, + "loss": 0.4447, + "step": 526 + }, + { + "epoch": 2.42, + "learning_rate": 0.00029740072202166063, + "loss": 0.4556, + "step": 527 + }, + { + "epoch": 2.42, + "learning_rate": 0.0002972924187725631, + "loss": 0.5139, + "step": 528 + }, + { + "epoch": 2.43, + "learning_rate": 0.00029718411552346566, + "loss": 0.4527, + "step": 529 + }, + { + "epoch": 2.43, + "learning_rate": 0.0002970758122743682, + "loss": 0.4748, + "step": 530 + }, + { + "epoch": 2.44, + "learning_rate": 0.0002969675090252707, + "loss": 0.5797, + "step": 531 + }, + { + "epoch": 2.44, + "learning_rate": 0.00029685920577617324, + "loss": 0.4655, + "step": 532 + }, + { + "epoch": 2.44, + "learning_rate": 0.0002967509025270758, + "loss": 0.5742, + "step": 533 + }, + { + "epoch": 2.45, + "learning_rate": 0.0002966425992779783, + "loss": 0.5864, + "step": 534 + }, + { + "epoch": 2.45, + "learning_rate": 0.0002965342960288808, + "loss": 0.764, + "step": 535 + }, + { + "epoch": 2.46, + "learning_rate": 0.00029642599277978336, + "loss": 0.5817, + "step": 536 + }, + { + "epoch": 2.46, + "learning_rate": 0.0002963176895306859, + "loss": 0.4436, + "step": 537 + }, + { + "epoch": 2.47, + "learning_rate": 0.00029620938628158844, + "loss": 0.5775, + "step": 538 + }, + { + "epoch": 2.47, + "learning_rate": 0.00029610108303249093, + "loss": 0.3841, + "step": 539 + }, + { + "epoch": 2.48, + "learning_rate": 0.0002959927797833935, + "loss": 0.4008, + "step": 540 + }, + { + "epoch": 2.48, + "learning_rate": 0.000295884476534296, + "loss": 0.6345, + "step": 541 + }, + { + "epoch": 2.49, + "learning_rate": 0.00029577617328519856, + "loss": 0.5683, + "step": 542 + }, + { + "epoch": 2.49, + "learning_rate": 0.00029566787003610105, + "loss": 0.4884, + "step": 543 + }, + { + "epoch": 2.5, + "learning_rate": 0.0002955595667870036, + "loss": 0.6826, + "step": 544 + }, + { + "epoch": 2.5, + "learning_rate": 0.00029545126353790614, + "loss": 0.5133, + "step": 545 + }, + { + "epoch": 2.5, + "learning_rate": 0.00029534296028880863, + "loss": 0.6574, + "step": 546 + }, + { + "epoch": 2.51, + "learning_rate": 0.00029523465703971117, + "loss": 0.6143, + "step": 547 + }, + { + "epoch": 2.51, + "learning_rate": 0.0002951263537906137, + "loss": 0.5325, + "step": 548 + }, + { + "epoch": 2.52, + "learning_rate": 0.0002950180505415162, + "loss": 0.4957, + "step": 549 + }, + { + "epoch": 2.52, + "learning_rate": 0.00029490974729241875, + "loss": 0.4457, + "step": 550 + }, + { + "epoch": 2.53, + "learning_rate": 0.0002948014440433213, + "loss": 0.3796, + "step": 551 + }, + { + "epoch": 2.53, + "learning_rate": 0.0002946931407942238, + "loss": 0.5252, + "step": 552 + }, + { + "epoch": 2.54, + "learning_rate": 0.0002945848375451263, + "loss": 0.4691, + "step": 553 + }, + { + "epoch": 2.54, + "learning_rate": 0.00029447653429602887, + "loss": 0.4819, + "step": 554 + }, + { + "epoch": 2.55, + "learning_rate": 0.00029436823104693135, + "loss": 0.5265, + "step": 555 + }, + { + "epoch": 2.55, + "learning_rate": 0.0002942599277978339, + "loss": 0.5858, + "step": 556 + }, + { + "epoch": 2.56, + "learning_rate": 0.00029415162454873644, + "loss": 0.4844, + "step": 557 + }, + { + "epoch": 2.56, + "learning_rate": 0.000294043321299639, + "loss": 0.5176, + "step": 558 + }, + { + "epoch": 2.56, + "learning_rate": 0.00029393501805054153, + "loss": 0.4422, + "step": 559 + }, + { + "epoch": 2.57, + "learning_rate": 0.000293826714801444, + "loss": 0.5515, + "step": 560 + }, + { + "epoch": 2.57, + "learning_rate": 0.00029371841155234656, + "loss": 0.5222, + "step": 561 + }, + { + "epoch": 2.58, + "learning_rate": 0.0002936101083032491, + "loss": 0.6092, + "step": 562 + }, + { + "epoch": 2.58, + "learning_rate": 0.0002935018050541516, + "loss": 0.5076, + "step": 563 + }, + { + "epoch": 2.59, + "learning_rate": 0.00029339350180505414, + "loss": 0.4148, + "step": 564 + }, + { + "epoch": 2.59, + "learning_rate": 0.0002932851985559567, + "loss": 0.3874, + "step": 565 + }, + { + "epoch": 2.6, + "learning_rate": 0.00029317689530685917, + "loss": 0.4601, + "step": 566 + }, + { + "epoch": 2.6, + "learning_rate": 0.0002930685920577617, + "loss": 0.4127, + "step": 567 + }, + { + "epoch": 2.61, + "learning_rate": 0.00029296028880866425, + "loss": 0.4375, + "step": 568 + }, + { + "epoch": 2.61, + "learning_rate": 0.00029285198555956674, + "loss": 0.5872, + "step": 569 + }, + { + "epoch": 2.61, + "learning_rate": 0.0002927436823104693, + "loss": 0.5204, + "step": 570 + }, + { + "epoch": 2.62, + "learning_rate": 0.00029263537906137183, + "loss": 0.6556, + "step": 571 + }, + { + "epoch": 2.62, + "learning_rate": 0.0002925270758122743, + "loss": 0.793, + "step": 572 + }, + { + "epoch": 2.63, + "learning_rate": 0.00029241877256317686, + "loss": 0.6039, + "step": 573 + }, + { + "epoch": 2.63, + "learning_rate": 0.0002923104693140794, + "loss": 0.6518, + "step": 574 + }, + { + "epoch": 2.64, + "learning_rate": 0.0002922021660649819, + "loss": 0.4078, + "step": 575 + }, + { + "epoch": 2.64, + "learning_rate": 0.00029209386281588444, + "loss": 0.608, + "step": 576 + }, + { + "epoch": 2.65, + "learning_rate": 0.000291985559566787, + "loss": 0.3842, + "step": 577 + }, + { + "epoch": 2.65, + "learning_rate": 0.00029187725631768947, + "loss": 0.4884, + "step": 578 + }, + { + "epoch": 2.66, + "learning_rate": 0.00029176895306859207, + "loss": 0.4042, + "step": 579 + }, + { + "epoch": 2.66, + "learning_rate": 0.00029166064981949456, + "loss": 0.4497, + "step": 580 + }, + { + "epoch": 2.67, + "learning_rate": 0.0002915523465703971, + "loss": 0.4968, + "step": 581 + }, + { + "epoch": 2.67, + "learning_rate": 0.00029144404332129964, + "loss": 0.5535, + "step": 582 + }, + { + "epoch": 2.67, + "learning_rate": 0.00029133574007220213, + "loss": 0.5891, + "step": 583 + }, + { + "epoch": 2.68, + "learning_rate": 0.0002912274368231047, + "loss": 0.5702, + "step": 584 + }, + { + "epoch": 2.68, + "learning_rate": 0.0002911191335740072, + "loss": 0.5751, + "step": 585 + }, + { + "epoch": 2.69, + "learning_rate": 0.0002910108303249097, + "loss": 0.7514, + "step": 586 + }, + { + "epoch": 2.69, + "learning_rate": 0.00029090252707581225, + "loss": 0.5542, + "step": 587 + }, + { + "epoch": 2.7, + "learning_rate": 0.0002907942238267148, + "loss": 0.5657, + "step": 588 + }, + { + "epoch": 2.7, + "learning_rate": 0.0002906859205776173, + "loss": 0.4795, + "step": 589 + }, + { + "epoch": 2.71, + "learning_rate": 0.0002905776173285198, + "loss": 0.4262, + "step": 590 + }, + { + "epoch": 2.71, + "learning_rate": 0.00029046931407942237, + "loss": 0.5337, + "step": 591 + }, + { + "epoch": 2.72, + "learning_rate": 0.00029036101083032486, + "loss": 0.58, + "step": 592 + }, + { + "epoch": 2.72, + "learning_rate": 0.0002902527075812274, + "loss": 0.4537, + "step": 593 + }, + { + "epoch": 2.72, + "learning_rate": 0.00029014440433212994, + "loss": 0.5398, + "step": 594 + }, + { + "epoch": 2.73, + "learning_rate": 0.00029003610108303243, + "loss": 0.4871, + "step": 595 + }, + { + "epoch": 2.73, + "learning_rate": 0.000289927797833935, + "loss": 0.5195, + "step": 596 + }, + { + "epoch": 2.74, + "learning_rate": 0.0002898194945848375, + "loss": 0.5605, + "step": 597 + }, + { + "epoch": 2.74, + "learning_rate": 0.00028971119133574, + "loss": 0.8264, + "step": 598 + }, + { + "epoch": 2.75, + "learning_rate": 0.00028960288808664255, + "loss": 0.3304, + "step": 599 + }, + { + "epoch": 2.75, + "learning_rate": 0.0002894945848375451, + "loss": 0.4181, + "step": 600 + }, + { + "epoch": 2.75, + "eval_loss": 0.5655181407928467, + "eval_runtime": 19.9711, + "eval_samples_per_second": 82.469, + "eval_steps_per_second": 2.604, + "eval_wer": 0.5679705852313349, + "step": 600 + }, + { + "epoch": 2.76, + "learning_rate": 0.00028938628158844764, + "loss": 0.5162, + "step": 601 + }, + { + "epoch": 2.76, + "learning_rate": 0.0002892779783393502, + "loss": 0.5396, + "step": 602 + }, + { + "epoch": 2.77, + "learning_rate": 0.00028916967509025267, + "loss": 0.3875, + "step": 603 + }, + { + "epoch": 2.77, + "learning_rate": 0.0002890613718411552, + "loss": 0.6693, + "step": 604 + }, + { + "epoch": 2.78, + "learning_rate": 0.00028895306859205776, + "loss": 0.3991, + "step": 605 + }, + { + "epoch": 2.78, + "learning_rate": 0.00028884476534296025, + "loss": 0.6312, + "step": 606 + }, + { + "epoch": 2.78, + "learning_rate": 0.0002887364620938628, + "loss": 0.464, + "step": 607 + }, + { + "epoch": 2.79, + "learning_rate": 0.00028862815884476533, + "loss": 0.6506, + "step": 608 + }, + { + "epoch": 2.79, + "learning_rate": 0.0002885198555956678, + "loss": 0.5566, + "step": 609 + }, + { + "epoch": 2.8, + "learning_rate": 0.00028841155234657036, + "loss": 0.5535, + "step": 610 + }, + { + "epoch": 2.8, + "learning_rate": 0.0002883032490974729, + "loss": 0.5893, + "step": 611 + }, + { + "epoch": 2.81, + "learning_rate": 0.00028819494584837545, + "loss": 0.4431, + "step": 612 + }, + { + "epoch": 2.81, + "learning_rate": 0.00028808664259927794, + "loss": 0.4739, + "step": 613 + }, + { + "epoch": 2.82, + "learning_rate": 0.0002879783393501805, + "loss": 0.384, + "step": 614 + }, + { + "epoch": 2.82, + "learning_rate": 0.000287870036101083, + "loss": 0.3911, + "step": 615 + }, + { + "epoch": 2.83, + "learning_rate": 0.0002877617328519855, + "loss": 0.3936, + "step": 616 + }, + { + "epoch": 2.83, + "learning_rate": 0.00028765342960288806, + "loss": 0.5363, + "step": 617 + }, + { + "epoch": 2.83, + "learning_rate": 0.0002875451263537906, + "loss": 0.4602, + "step": 618 + }, + { + "epoch": 2.84, + "learning_rate": 0.0002874368231046931, + "loss": 0.4991, + "step": 619 + }, + { + "epoch": 2.84, + "learning_rate": 0.00028732851985559563, + "loss": 0.3796, + "step": 620 + }, + { + "epoch": 2.85, + "learning_rate": 0.0002872202166064982, + "loss": 0.5334, + "step": 621 + }, + { + "epoch": 2.85, + "learning_rate": 0.00028711191335740067, + "loss": 0.6248, + "step": 622 + }, + { + "epoch": 2.86, + "learning_rate": 0.00028700361010830326, + "loss": 0.5501, + "step": 623 + }, + { + "epoch": 2.86, + "learning_rate": 0.00028689530685920575, + "loss": 0.5136, + "step": 624 + }, + { + "epoch": 2.87, + "learning_rate": 0.0002867870036101083, + "loss": 0.4279, + "step": 625 + }, + { + "epoch": 2.87, + "learning_rate": 0.00028667870036101084, + "loss": 0.4217, + "step": 626 + }, + { + "epoch": 2.88, + "learning_rate": 0.00028657039711191333, + "loss": 0.463, + "step": 627 + }, + { + "epoch": 2.88, + "learning_rate": 0.00028646209386281587, + "loss": 0.4229, + "step": 628 + }, + { + "epoch": 2.89, + "learning_rate": 0.0002863537906137184, + "loss": 0.4861, + "step": 629 + }, + { + "epoch": 2.89, + "learning_rate": 0.0002862454873646209, + "loss": 0.5143, + "step": 630 + }, + { + "epoch": 2.89, + "learning_rate": 0.00028613718411552345, + "loss": 0.4451, + "step": 631 + }, + { + "epoch": 2.9, + "learning_rate": 0.000286028880866426, + "loss": 0.4398, + "step": 632 + }, + { + "epoch": 2.9, + "learning_rate": 0.0002859205776173285, + "loss": 0.5457, + "step": 633 + }, + { + "epoch": 2.91, + "learning_rate": 0.000285812274368231, + "loss": 0.5604, + "step": 634 + }, + { + "epoch": 2.91, + "learning_rate": 0.00028570397111913357, + "loss": 0.5485, + "step": 635 + }, + { + "epoch": 2.92, + "learning_rate": 0.00028559566787003606, + "loss": 0.593, + "step": 636 + }, + { + "epoch": 2.92, + "learning_rate": 0.0002854873646209386, + "loss": 0.512, + "step": 637 + }, + { + "epoch": 2.93, + "learning_rate": 0.00028537906137184114, + "loss": 0.5294, + "step": 638 + }, + { + "epoch": 2.93, + "learning_rate": 0.00028527075812274363, + "loss": 0.4985, + "step": 639 + }, + { + "epoch": 2.94, + "learning_rate": 0.0002851624548736462, + "loss": 0.384, + "step": 640 + }, + { + "epoch": 2.94, + "learning_rate": 0.0002850541516245487, + "loss": 0.481, + "step": 641 + }, + { + "epoch": 2.94, + "learning_rate": 0.0002849458483754512, + "loss": 0.5185, + "step": 642 + }, + { + "epoch": 2.95, + "learning_rate": 0.00028483754512635375, + "loss": 0.4804, + "step": 643 + }, + { + "epoch": 2.95, + "learning_rate": 0.0002847292418772563, + "loss": 0.4808, + "step": 644 + }, + { + "epoch": 2.96, + "learning_rate": 0.00028462093862815884, + "loss": 0.3256, + "step": 645 + }, + { + "epoch": 2.96, + "learning_rate": 0.0002845126353790614, + "loss": 0.5852, + "step": 646 + }, + { + "epoch": 2.97, + "learning_rate": 0.00028440433212996387, + "loss": 0.5344, + "step": 647 + }, + { + "epoch": 2.97, + "learning_rate": 0.0002842960288808664, + "loss": 0.5453, + "step": 648 + }, + { + "epoch": 2.98, + "learning_rate": 0.00028418772563176895, + "loss": 0.7126, + "step": 649 + }, + { + "epoch": 2.98, + "learning_rate": 0.00028407942238267144, + "loss": 0.3433, + "step": 650 + }, + { + "epoch": 2.99, + "learning_rate": 0.000283971119133574, + "loss": 0.3986, + "step": 651 + }, + { + "epoch": 2.99, + "learning_rate": 0.00028386281588447653, + "loss": 0.4164, + "step": 652 + }, + { + "epoch": 3.0, + "learning_rate": 0.000283754512635379, + "loss": 0.6289, + "step": 653 + }, + { + "epoch": 3.0, + "learning_rate": 0.00028364620938628156, + "loss": 0.2716, + "step": 654 + }, + { + "epoch": 3.0, + "learning_rate": 0.0002835379061371841, + "loss": 0.3405, + "step": 655 + }, + { + "epoch": 3.01, + "learning_rate": 0.0002834296028880866, + "loss": 0.2922, + "step": 656 + }, + { + "epoch": 3.01, + "learning_rate": 0.00028332129963898914, + "loss": 0.3421, + "step": 657 + }, + { + "epoch": 3.02, + "learning_rate": 0.0002832129963898917, + "loss": 0.3598, + "step": 658 + }, + { + "epoch": 3.02, + "learning_rate": 0.00028310469314079417, + "loss": 0.3437, + "step": 659 + }, + { + "epoch": 3.03, + "learning_rate": 0.0002829963898916967, + "loss": 0.3243, + "step": 660 + }, + { + "epoch": 3.03, + "learning_rate": 0.00028288808664259926, + "loss": 0.3734, + "step": 661 + }, + { + "epoch": 3.04, + "learning_rate": 0.00028277978339350175, + "loss": 0.367, + "step": 662 + }, + { + "epoch": 3.04, + "learning_rate": 0.0002826714801444043, + "loss": 0.4269, + "step": 663 + }, + { + "epoch": 3.05, + "learning_rate": 0.00028256317689530683, + "loss": 0.3289, + "step": 664 + }, + { + "epoch": 3.05, + "learning_rate": 0.0002824548736462093, + "loss": 0.4578, + "step": 665 + }, + { + "epoch": 3.06, + "learning_rate": 0.0002823465703971119, + "loss": 0.5304, + "step": 666 + }, + { + "epoch": 3.06, + "learning_rate": 0.0002822382671480144, + "loss": 0.383, + "step": 667 + }, + { + "epoch": 3.06, + "learning_rate": 0.00028212996389891695, + "loss": 0.2455, + "step": 668 + }, + { + "epoch": 3.07, + "learning_rate": 0.0002820216606498195, + "loss": 0.263, + "step": 669 + }, + { + "epoch": 3.07, + "learning_rate": 0.000281913357400722, + "loss": 0.3725, + "step": 670 + }, + { + "epoch": 3.08, + "learning_rate": 0.0002818050541516245, + "loss": 0.2746, + "step": 671 + }, + { + "epoch": 3.08, + "learning_rate": 0.00028169675090252707, + "loss": 0.3551, + "step": 672 + }, + { + "epoch": 3.09, + "learning_rate": 0.00028158844765342956, + "loss": 0.3843, + "step": 673 + }, + { + "epoch": 3.09, + "learning_rate": 0.0002814801444043321, + "loss": 0.4519, + "step": 674 + }, + { + "epoch": 3.1, + "learning_rate": 0.00028137184115523464, + "loss": 0.3327, + "step": 675 + }, + { + "epoch": 3.1, + "learning_rate": 0.00028126353790613713, + "loss": 0.4053, + "step": 676 + }, + { + "epoch": 3.11, + "learning_rate": 0.0002811552346570397, + "loss": 0.3607, + "step": 677 + }, + { + "epoch": 3.11, + "learning_rate": 0.0002810469314079422, + "loss": 0.2963, + "step": 678 + }, + { + "epoch": 3.11, + "learning_rate": 0.0002809386281588447, + "loss": 0.6399, + "step": 679 + }, + { + "epoch": 3.12, + "learning_rate": 0.00028083032490974725, + "loss": 0.2759, + "step": 680 + }, + { + "epoch": 3.12, + "learning_rate": 0.0002807220216606498, + "loss": 0.3783, + "step": 681 + }, + { + "epoch": 3.13, + "learning_rate": 0.00028061371841155234, + "loss": 0.3471, + "step": 682 + }, + { + "epoch": 3.13, + "learning_rate": 0.00028050541516245483, + "loss": 0.2981, + "step": 683 + }, + { + "epoch": 3.14, + "learning_rate": 0.00028039711191335737, + "loss": 0.3588, + "step": 684 + }, + { + "epoch": 3.14, + "learning_rate": 0.0002802888086642599, + "loss": 0.3476, + "step": 685 + }, + { + "epoch": 3.15, + "learning_rate": 0.0002801805054151624, + "loss": 0.2562, + "step": 686 + }, + { + "epoch": 3.15, + "learning_rate": 0.000280072202166065, + "loss": 0.3765, + "step": 687 + }, + { + "epoch": 3.16, + "learning_rate": 0.0002799638989169675, + "loss": 0.3134, + "step": 688 + }, + { + "epoch": 3.16, + "learning_rate": 0.00027985559566787003, + "loss": 0.377, + "step": 689 + }, + { + "epoch": 3.17, + "learning_rate": 0.0002797472924187726, + "loss": 0.3129, + "step": 690 + }, + { + "epoch": 3.17, + "learning_rate": 0.00027963898916967507, + "loss": 0.4633, + "step": 691 + }, + { + "epoch": 3.17, + "learning_rate": 0.0002795306859205776, + "loss": 0.558, + "step": 692 + }, + { + "epoch": 3.18, + "learning_rate": 0.00027942238267148015, + "loss": 0.2914, + "step": 693 + }, + { + "epoch": 3.18, + "learning_rate": 0.00027931407942238264, + "loss": 0.3383, + "step": 694 + }, + { + "epoch": 3.19, + "learning_rate": 0.0002792057761732852, + "loss": 0.3544, + "step": 695 + }, + { + "epoch": 3.19, + "learning_rate": 0.00027909747292418773, + "loss": 0.299, + "step": 696 + }, + { + "epoch": 3.2, + "learning_rate": 0.0002789891696750902, + "loss": 0.3876, + "step": 697 + }, + { + "epoch": 3.2, + "learning_rate": 0.00027888086642599276, + "loss": 0.249, + "step": 698 + }, + { + "epoch": 3.21, + "learning_rate": 0.0002787725631768953, + "loss": 0.3505, + "step": 699 + }, + { + "epoch": 3.21, + "learning_rate": 0.0002786642599277978, + "loss": 0.4311, + "step": 700 + }, + { + "epoch": 3.21, + "eval_loss": 0.44779741764068604, + "eval_runtime": 20.0012, + "eval_samples_per_second": 82.345, + "eval_steps_per_second": 2.6, + "eval_wer": 0.5002553365335513, + "step": 700 + }, + { + "epoch": 3.22, + "learning_rate": 0.00027855595667870034, + "loss": 0.3386, + "step": 701 + }, + { + "epoch": 3.22, + "learning_rate": 0.0002784476534296029, + "loss": 0.3837, + "step": 702 + }, + { + "epoch": 3.22, + "learning_rate": 0.00027833935018050537, + "loss": 0.45, + "step": 703 + }, + { + "epoch": 3.23, + "learning_rate": 0.0002782310469314079, + "loss": 0.3722, + "step": 704 + }, + { + "epoch": 3.23, + "learning_rate": 0.00027812274368231045, + "loss": 0.2731, + "step": 705 + }, + { + "epoch": 3.24, + "learning_rate": 0.00027801444043321294, + "loss": 0.3827, + "step": 706 + }, + { + "epoch": 3.24, + "learning_rate": 0.0002779061371841155, + "loss": 0.2535, + "step": 707 + }, + { + "epoch": 3.25, + "learning_rate": 0.00027779783393501803, + "loss": 0.3389, + "step": 708 + }, + { + "epoch": 3.25, + "learning_rate": 0.00027768953068592057, + "loss": 0.4179, + "step": 709 + }, + { + "epoch": 3.26, + "learning_rate": 0.0002775812274368231, + "loss": 0.3804, + "step": 710 + }, + { + "epoch": 3.26, + "learning_rate": 0.0002774729241877256, + "loss": 0.4061, + "step": 711 + }, + { + "epoch": 3.27, + "learning_rate": 0.00027736462093862815, + "loss": 0.4442, + "step": 712 + }, + { + "epoch": 3.27, + "learning_rate": 0.0002772563176895307, + "loss": 0.43, + "step": 713 + }, + { + "epoch": 3.28, + "learning_rate": 0.0002771480144404332, + "loss": 0.2428, + "step": 714 + }, + { + "epoch": 3.28, + "learning_rate": 0.0002770397111913357, + "loss": 0.49, + "step": 715 + }, + { + "epoch": 3.28, + "learning_rate": 0.00027693140794223827, + "loss": 0.5203, + "step": 716 + }, + { + "epoch": 3.29, + "learning_rate": 0.00027682310469314076, + "loss": 0.3733, + "step": 717 + }, + { + "epoch": 3.29, + "learning_rate": 0.0002767148014440433, + "loss": 0.3149, + "step": 718 + }, + { + "epoch": 3.3, + "learning_rate": 0.00027660649819494584, + "loss": 0.3167, + "step": 719 + }, + { + "epoch": 3.3, + "learning_rate": 0.00027649819494584833, + "loss": 0.2529, + "step": 720 + }, + { + "epoch": 3.31, + "learning_rate": 0.0002763898916967509, + "loss": 0.2426, + "step": 721 + }, + { + "epoch": 3.31, + "learning_rate": 0.0002762815884476534, + "loss": 0.3321, + "step": 722 + }, + { + "epoch": 3.32, + "learning_rate": 0.0002761732851985559, + "loss": 0.434, + "step": 723 + }, + { + "epoch": 3.32, + "learning_rate": 0.00027606498194945845, + "loss": 0.2556, + "step": 724 + }, + { + "epoch": 3.33, + "learning_rate": 0.000275956678700361, + "loss": 0.2861, + "step": 725 + }, + { + "epoch": 3.33, + "learning_rate": 0.0002758483754512635, + "loss": 0.4216, + "step": 726 + }, + { + "epoch": 3.33, + "learning_rate": 0.000275740072202166, + "loss": 0.2906, + "step": 727 + }, + { + "epoch": 3.34, + "learning_rate": 0.00027563176895306857, + "loss": 0.2919, + "step": 728 + }, + { + "epoch": 3.34, + "learning_rate": 0.00027552346570397106, + "loss": 0.3153, + "step": 729 + }, + { + "epoch": 3.35, + "learning_rate": 0.0002754151624548736, + "loss": 0.3382, + "step": 730 + }, + { + "epoch": 3.35, + "learning_rate": 0.00027530685920577614, + "loss": 0.2369, + "step": 731 + }, + { + "epoch": 3.36, + "learning_rate": 0.0002751985559566787, + "loss": 0.2926, + "step": 732 + }, + { + "epoch": 3.36, + "learning_rate": 0.00027509025270758123, + "loss": 0.2799, + "step": 733 + }, + { + "epoch": 3.37, + "learning_rate": 0.0002749819494584837, + "loss": 0.3164, + "step": 734 + }, + { + "epoch": 3.37, + "learning_rate": 0.00027487364620938626, + "loss": 0.3825, + "step": 735 + }, + { + "epoch": 3.38, + "learning_rate": 0.0002747653429602888, + "loss": 0.3105, + "step": 736 + }, + { + "epoch": 3.38, + "learning_rate": 0.0002746570397111913, + "loss": 0.3794, + "step": 737 + }, + { + "epoch": 3.39, + "learning_rate": 0.00027454873646209384, + "loss": 0.26, + "step": 738 + }, + { + "epoch": 3.39, + "learning_rate": 0.0002744404332129964, + "loss": 0.3872, + "step": 739 + }, + { + "epoch": 3.39, + "learning_rate": 0.00027433212996389887, + "loss": 0.4146, + "step": 740 + }, + { + "epoch": 3.4, + "learning_rate": 0.0002742238267148014, + "loss": 0.4495, + "step": 741 + }, + { + "epoch": 3.4, + "learning_rate": 0.00027411552346570396, + "loss": 0.5478, + "step": 742 + }, + { + "epoch": 3.41, + "learning_rate": 0.00027400722021660645, + "loss": 0.4425, + "step": 743 + }, + { + "epoch": 3.41, + "learning_rate": 0.000273898916967509, + "loss": 0.3123, + "step": 744 + }, + { + "epoch": 3.42, + "learning_rate": 0.00027379061371841153, + "loss": 0.3453, + "step": 745 + }, + { + "epoch": 3.42, + "learning_rate": 0.000273682310469314, + "loss": 0.314, + "step": 746 + }, + { + "epoch": 3.43, + "learning_rate": 0.00027357400722021656, + "loss": 0.3172, + "step": 747 + }, + { + "epoch": 3.43, + "learning_rate": 0.0002734657039711191, + "loss": 0.3136, + "step": 748 + }, + { + "epoch": 3.44, + "learning_rate": 0.00027335740072202165, + "loss": 0.4644, + "step": 749 + }, + { + "epoch": 3.44, + "learning_rate": 0.00027324909747292414, + "loss": 0.4007, + "step": 750 + }, + { + "epoch": 3.44, + "learning_rate": 0.0002731407942238267, + "loss": 0.3443, + "step": 751 + }, + { + "epoch": 3.45, + "learning_rate": 0.0002730324909747292, + "loss": 0.2997, + "step": 752 + }, + { + "epoch": 3.45, + "learning_rate": 0.00027292418772563177, + "loss": 0.4435, + "step": 753 + }, + { + "epoch": 3.46, + "learning_rate": 0.00027281588447653426, + "loss": 0.3587, + "step": 754 + }, + { + "epoch": 3.46, + "learning_rate": 0.0002727075812274368, + "loss": 0.2643, + "step": 755 + }, + { + "epoch": 3.47, + "learning_rate": 0.00027259927797833935, + "loss": 0.257, + "step": 756 + }, + { + "epoch": 3.47, + "learning_rate": 0.0002724909747292419, + "loss": 0.3726, + "step": 757 + }, + { + "epoch": 3.48, + "learning_rate": 0.0002723826714801444, + "loss": 0.3071, + "step": 758 + }, + { + "epoch": 3.48, + "learning_rate": 0.0002722743682310469, + "loss": 0.2505, + "step": 759 + }, + { + "epoch": 3.49, + "learning_rate": 0.00027216606498194946, + "loss": 0.3168, + "step": 760 + }, + { + "epoch": 3.49, + "learning_rate": 0.00027205776173285195, + "loss": 0.4075, + "step": 761 + }, + { + "epoch": 3.5, + "learning_rate": 0.0002719494584837545, + "loss": 0.2564, + "step": 762 + }, + { + "epoch": 3.5, + "learning_rate": 0.00027184115523465704, + "loss": 0.3366, + "step": 763 + }, + { + "epoch": 3.5, + "learning_rate": 0.00027173285198555953, + "loss": 0.4375, + "step": 764 + }, + { + "epoch": 3.51, + "learning_rate": 0.00027162454873646207, + "loss": 0.3942, + "step": 765 + }, + { + "epoch": 3.51, + "learning_rate": 0.0002715162454873646, + "loss": 0.4108, + "step": 766 + }, + { + "epoch": 3.52, + "learning_rate": 0.0002714079422382671, + "loss": 0.2857, + "step": 767 + }, + { + "epoch": 3.52, + "learning_rate": 0.00027129963898916965, + "loss": 0.2876, + "step": 768 + }, + { + "epoch": 3.53, + "learning_rate": 0.0002711913357400722, + "loss": 0.259, + "step": 769 + }, + { + "epoch": 3.53, + "learning_rate": 0.0002710830324909747, + "loss": 0.2747, + "step": 770 + }, + { + "epoch": 3.54, + "learning_rate": 0.0002709747292418772, + "loss": 0.3624, + "step": 771 + }, + { + "epoch": 3.54, + "learning_rate": 0.00027086642599277977, + "loss": 0.3212, + "step": 772 + }, + { + "epoch": 3.55, + "learning_rate": 0.00027075812274368226, + "loss": 0.3189, + "step": 773 + }, + { + "epoch": 3.55, + "learning_rate": 0.00027064981949458485, + "loss": 0.4975, + "step": 774 + }, + { + "epoch": 3.56, + "learning_rate": 0.00027054151624548734, + "loss": 0.3971, + "step": 775 + }, + { + "epoch": 3.56, + "learning_rate": 0.0002704332129963899, + "loss": 0.4076, + "step": 776 + }, + { + "epoch": 3.56, + "learning_rate": 0.00027032490974729243, + "loss": 0.3208, + "step": 777 + }, + { + "epoch": 3.57, + "learning_rate": 0.0002702166064981949, + "loss": 0.3849, + "step": 778 + }, + { + "epoch": 3.57, + "learning_rate": 0.00027010830324909746, + "loss": 0.6146, + "step": 779 + }, + { + "epoch": 3.58, + "learning_rate": 0.00027, + "loss": 0.3471, + "step": 780 + }, + { + "epoch": 3.58, + "learning_rate": 0.0002698916967509025, + "loss": 0.3029, + "step": 781 + }, + { + "epoch": 3.59, + "learning_rate": 0.00026978339350180504, + "loss": 0.2863, + "step": 782 + }, + { + "epoch": 3.59, + "learning_rate": 0.0002696750902527076, + "loss": 0.2311, + "step": 783 + }, + { + "epoch": 3.6, + "learning_rate": 0.00026956678700361007, + "loss": 0.3261, + "step": 784 + }, + { + "epoch": 3.6, + "learning_rate": 0.0002694584837545126, + "loss": 0.3336, + "step": 785 + }, + { + "epoch": 3.61, + "learning_rate": 0.00026935018050541515, + "loss": 0.2629, + "step": 786 + }, + { + "epoch": 3.61, + "learning_rate": 0.00026924187725631764, + "loss": 0.3281, + "step": 787 + }, + { + "epoch": 3.61, + "learning_rate": 0.0002691335740072202, + "loss": 0.4322, + "step": 788 + }, + { + "epoch": 3.62, + "learning_rate": 0.00026902527075812273, + "loss": 0.4366, + "step": 789 + }, + { + "epoch": 3.62, + "learning_rate": 0.0002689169675090252, + "loss": 0.4905, + "step": 790 + }, + { + "epoch": 3.63, + "learning_rate": 0.00026880866425992776, + "loss": 0.5752, + "step": 791 + }, + { + "epoch": 3.63, + "learning_rate": 0.0002687003610108303, + "loss": 0.4722, + "step": 792 + }, + { + "epoch": 3.64, + "learning_rate": 0.0002685920577617328, + "loss": 0.3058, + "step": 793 + }, + { + "epoch": 3.64, + "learning_rate": 0.00026848375451263534, + "loss": 0.3482, + "step": 794 + }, + { + "epoch": 3.65, + "learning_rate": 0.0002683754512635379, + "loss": 0.3407, + "step": 795 + }, + { + "epoch": 3.65, + "learning_rate": 0.0002682671480144404, + "loss": 0.2049, + "step": 796 + }, + { + "epoch": 3.66, + "learning_rate": 0.00026815884476534297, + "loss": 0.478, + "step": 797 + }, + { + "epoch": 3.66, + "learning_rate": 0.00026805054151624546, + "loss": 0.3157, + "step": 798 + }, + { + "epoch": 3.67, + "learning_rate": 0.000267942238267148, + "loss": 0.3692, + "step": 799 + }, + { + "epoch": 3.67, + "learning_rate": 0.00026783393501805054, + "loss": 0.3601, + "step": 800 + }, + { + "epoch": 3.67, + "eval_loss": 0.45478907227516174, + "eval_runtime": 19.7962, + "eval_samples_per_second": 83.198, + "eval_steps_per_second": 2.627, + "eval_wer": 0.5010724134409151, + "step": 800 + }, + { + "epoch": 3.67, + "learning_rate": 0.00026772563176895303, + "loss": 0.3703, + "step": 801 + }, + { + "epoch": 3.68, + "learning_rate": 0.0002676173285198556, + "loss": 0.398, + "step": 802 + }, + { + "epoch": 3.68, + "learning_rate": 0.0002675090252707581, + "loss": 0.4373, + "step": 803 + }, + { + "epoch": 3.69, + "learning_rate": 0.0002674007220216606, + "loss": 0.3731, + "step": 804 + }, + { + "epoch": 3.69, + "learning_rate": 0.00026729241877256315, + "loss": 0.2735, + "step": 805 + }, + { + "epoch": 3.7, + "learning_rate": 0.0002671841155234657, + "loss": 0.3951, + "step": 806 + }, + { + "epoch": 3.7, + "learning_rate": 0.0002670758122743682, + "loss": 0.2064, + "step": 807 + }, + { + "epoch": 3.71, + "learning_rate": 0.0002669675090252707, + "loss": 0.3735, + "step": 808 + }, + { + "epoch": 3.71, + "learning_rate": 0.00026685920577617327, + "loss": 0.2886, + "step": 809 + }, + { + "epoch": 3.72, + "learning_rate": 0.00026675090252707576, + "loss": 0.2482, + "step": 810 + }, + { + "epoch": 3.72, + "learning_rate": 0.0002666425992779783, + "loss": 0.2518, + "step": 811 + }, + { + "epoch": 3.72, + "learning_rate": 0.00026653429602888084, + "loss": 0.368, + "step": 812 + }, + { + "epoch": 3.73, + "learning_rate": 0.00026642599277978333, + "loss": 0.3422, + "step": 813 + }, + { + "epoch": 3.73, + "learning_rate": 0.0002663176895306859, + "loss": 0.339, + "step": 814 + }, + { + "epoch": 3.74, + "learning_rate": 0.0002662093862815884, + "loss": 0.4676, + "step": 815 + }, + { + "epoch": 3.74, + "learning_rate": 0.0002661010830324909, + "loss": 0.3939, + "step": 816 + }, + { + "epoch": 3.75, + "learning_rate": 0.0002659927797833935, + "loss": 0.4948, + "step": 817 + }, + { + "epoch": 3.75, + "learning_rate": 0.000265884476534296, + "loss": 0.2465, + "step": 818 + }, + { + "epoch": 3.76, + "learning_rate": 0.00026577617328519854, + "loss": 0.3428, + "step": 819 + }, + { + "epoch": 3.76, + "learning_rate": 0.0002656678700361011, + "loss": 0.2945, + "step": 820 + }, + { + "epoch": 3.77, + "learning_rate": 0.00026555956678700357, + "loss": 0.3127, + "step": 821 + }, + { + "epoch": 3.77, + "learning_rate": 0.0002654512635379061, + "loss": 0.3658, + "step": 822 + }, + { + "epoch": 3.78, + "learning_rate": 0.00026534296028880866, + "loss": 0.3139, + "step": 823 + }, + { + "epoch": 3.78, + "learning_rate": 0.00026523465703971115, + "loss": 0.4656, + "step": 824 + }, + { + "epoch": 3.78, + "learning_rate": 0.0002651263537906137, + "loss": 0.4426, + "step": 825 + }, + { + "epoch": 3.79, + "learning_rate": 0.00026501805054151623, + "loss": 0.3801, + "step": 826 + }, + { + "epoch": 3.79, + "learning_rate": 0.0002649097472924188, + "loss": 0.5255, + "step": 827 + }, + { + "epoch": 3.8, + "learning_rate": 0.00026480144404332127, + "loss": 0.4954, + "step": 828 + }, + { + "epoch": 3.8, + "learning_rate": 0.0002646931407942238, + "loss": 0.6328, + "step": 829 + }, + { + "epoch": 3.81, + "learning_rate": 0.00026458483754512635, + "loss": 0.2726, + "step": 830 + }, + { + "epoch": 3.81, + "learning_rate": 0.00026447653429602884, + "loss": 0.3547, + "step": 831 + }, + { + "epoch": 3.82, + "learning_rate": 0.0002643682310469314, + "loss": 0.3416, + "step": 832 + }, + { + "epoch": 3.82, + "learning_rate": 0.00026425992779783393, + "loss": 0.252, + "step": 833 + }, + { + "epoch": 3.83, + "learning_rate": 0.0002641516245487364, + "loss": 0.1793, + "step": 834 + }, + { + "epoch": 3.83, + "learning_rate": 0.00026404332129963896, + "loss": 0.2301, + "step": 835 + }, + { + "epoch": 3.83, + "learning_rate": 0.0002639350180505415, + "loss": 0.3576, + "step": 836 + }, + { + "epoch": 3.84, + "learning_rate": 0.000263826714801444, + "loss": 0.3177, + "step": 837 + }, + { + "epoch": 3.84, + "learning_rate": 0.00026371841155234654, + "loss": 0.305, + "step": 838 + }, + { + "epoch": 3.85, + "learning_rate": 0.0002636101083032491, + "loss": 0.3451, + "step": 839 + }, + { + "epoch": 3.85, + "learning_rate": 0.0002635018050541516, + "loss": 0.467, + "step": 840 + }, + { + "epoch": 3.86, + "learning_rate": 0.00026339350180505416, + "loss": 0.2991, + "step": 841 + }, + { + "epoch": 3.86, + "learning_rate": 0.00026328519855595665, + "loss": 0.5397, + "step": 842 + }, + { + "epoch": 3.87, + "learning_rate": 0.0002631768953068592, + "loss": 0.2436, + "step": 843 + }, + { + "epoch": 3.87, + "learning_rate": 0.00026306859205776174, + "loss": 0.2155, + "step": 844 + }, + { + "epoch": 3.88, + "learning_rate": 0.00026296028880866423, + "loss": 0.3429, + "step": 845 + }, + { + "epoch": 3.88, + "learning_rate": 0.00026285198555956677, + "loss": 0.4259, + "step": 846 + }, + { + "epoch": 3.89, + "learning_rate": 0.0002627436823104693, + "loss": 0.4325, + "step": 847 + }, + { + "epoch": 3.89, + "learning_rate": 0.0002626353790613718, + "loss": 0.3047, + "step": 848 + }, + { + "epoch": 3.89, + "learning_rate": 0.00026252707581227435, + "loss": 0.2883, + "step": 849 + }, + { + "epoch": 3.9, + "learning_rate": 0.0002624187725631769, + "loss": 0.2938, + "step": 850 + }, + { + "epoch": 3.9, + "learning_rate": 0.0002623104693140794, + "loss": 0.4563, + "step": 851 + }, + { + "epoch": 3.91, + "learning_rate": 0.0002622021660649819, + "loss": 0.3937, + "step": 852 + }, + { + "epoch": 3.91, + "learning_rate": 0.00026209386281588447, + "loss": 0.3691, + "step": 853 + }, + { + "epoch": 3.92, + "learning_rate": 0.00026198555956678696, + "loss": 0.3489, + "step": 854 + }, + { + "epoch": 3.92, + "learning_rate": 0.0002618772563176895, + "loss": 0.3404, + "step": 855 + }, + { + "epoch": 3.93, + "learning_rate": 0.00026176895306859204, + "loss": 0.3915, + "step": 856 + }, + { + "epoch": 3.93, + "learning_rate": 0.00026166064981949453, + "loss": 0.2927, + "step": 857 + }, + { + "epoch": 3.94, + "learning_rate": 0.0002615523465703971, + "loss": 0.1956, + "step": 858 + }, + { + "epoch": 3.94, + "learning_rate": 0.0002614440433212996, + "loss": 0.2184, + "step": 859 + }, + { + "epoch": 3.94, + "learning_rate": 0.0002613357400722021, + "loss": 0.2447, + "step": 860 + }, + { + "epoch": 3.95, + "learning_rate": 0.0002612274368231047, + "loss": 0.2648, + "step": 861 + }, + { + "epoch": 3.95, + "learning_rate": 0.0002611191335740072, + "loss": 0.4299, + "step": 862 + }, + { + "epoch": 3.96, + "learning_rate": 0.00026101083032490974, + "loss": 0.2794, + "step": 863 + }, + { + "epoch": 3.96, + "learning_rate": 0.0002609025270758123, + "loss": 0.3866, + "step": 864 + }, + { + "epoch": 3.97, + "learning_rate": 0.00026079422382671477, + "loss": 0.345, + "step": 865 + }, + { + "epoch": 3.97, + "learning_rate": 0.0002606859205776173, + "loss": 0.4033, + "step": 866 + }, + { + "epoch": 3.98, + "learning_rate": 0.00026057761732851986, + "loss": 0.2637, + "step": 867 + }, + { + "epoch": 3.98, + "learning_rate": 0.00026046931407942234, + "loss": 0.3641, + "step": 868 + }, + { + "epoch": 3.99, + "learning_rate": 0.0002603610108303249, + "loss": 0.3507, + "step": 869 + }, + { + "epoch": 3.99, + "learning_rate": 0.00026025270758122743, + "loss": 0.3651, + "step": 870 + }, + { + "epoch": 4.0, + "learning_rate": 0.0002601444043321299, + "loss": 0.2841, + "step": 871 + }, + { + "epoch": 4.0, + "learning_rate": 0.00026003610108303246, + "loss": 0.4099, + "step": 872 + }, + { + "epoch": 4.0, + "learning_rate": 0.000259927797833935, + "loss": 0.228, + "step": 873 + }, + { + "epoch": 4.01, + "learning_rate": 0.0002598194945848375, + "loss": 0.2568, + "step": 874 + }, + { + "epoch": 4.01, + "learning_rate": 0.00025971119133574004, + "loss": 0.1772, + "step": 875 + }, + { + "epoch": 4.02, + "learning_rate": 0.0002596028880866426, + "loss": 0.2884, + "step": 876 + }, + { + "epoch": 4.02, + "learning_rate": 0.00025949458483754507, + "loss": 0.2704, + "step": 877 + }, + { + "epoch": 4.03, + "learning_rate": 0.0002593862815884476, + "loss": 0.2617, + "step": 878 + }, + { + "epoch": 4.03, + "learning_rate": 0.00025927797833935016, + "loss": 0.2481, + "step": 879 + }, + { + "epoch": 4.04, + "learning_rate": 0.00025916967509025265, + "loss": 0.2272, + "step": 880 + }, + { + "epoch": 4.04, + "learning_rate": 0.0002590613718411552, + "loss": 0.25, + "step": 881 + }, + { + "epoch": 4.05, + "learning_rate": 0.00025895306859205773, + "loss": 0.4122, + "step": 882 + }, + { + "epoch": 4.05, + "learning_rate": 0.0002588447653429603, + "loss": 0.2489, + "step": 883 + }, + { + "epoch": 4.06, + "learning_rate": 0.0002587364620938628, + "loss": 0.3241, + "step": 884 + }, + { + "epoch": 4.06, + "learning_rate": 0.0002586281588447653, + "loss": 0.2703, + "step": 885 + }, + { + "epoch": 4.06, + "learning_rate": 0.00025851985559566785, + "loss": 0.3894, + "step": 886 + }, + { + "epoch": 4.07, + "learning_rate": 0.0002584115523465704, + "loss": 0.2275, + "step": 887 + }, + { + "epoch": 4.07, + "learning_rate": 0.0002583032490974729, + "loss": 0.209, + "step": 888 + }, + { + "epoch": 4.08, + "learning_rate": 0.0002581949458483754, + "loss": 0.2478, + "step": 889 + }, + { + "epoch": 4.08, + "learning_rate": 0.00025808664259927797, + "loss": 0.1824, + "step": 890 + }, + { + "epoch": 4.09, + "learning_rate": 0.00025797833935018046, + "loss": 0.2134, + "step": 891 + }, + { + "epoch": 4.09, + "learning_rate": 0.000257870036101083, + "loss": 0.2152, + "step": 892 + }, + { + "epoch": 4.1, + "learning_rate": 0.00025776173285198555, + "loss": 0.2231, + "step": 893 + }, + { + "epoch": 4.1, + "learning_rate": 0.0002576534296028881, + "loss": 0.182, + "step": 894 + }, + { + "epoch": 4.11, + "learning_rate": 0.0002575451263537906, + "loss": 0.2941, + "step": 895 + }, + { + "epoch": 4.11, + "learning_rate": 0.0002574368231046931, + "loss": 0.2608, + "step": 896 + }, + { + "epoch": 4.11, + "learning_rate": 0.00025732851985559566, + "loss": 0.6074, + "step": 897 + }, + { + "epoch": 4.12, + "learning_rate": 0.00025722021660649815, + "loss": 0.3406, + "step": 898 + }, + { + "epoch": 4.12, + "learning_rate": 0.0002571119133574007, + "loss": 0.1803, + "step": 899 + }, + { + "epoch": 4.13, + "learning_rate": 0.00025700361010830324, + "loss": 0.2756, + "step": 900 + }, + { + "epoch": 4.13, + "eval_loss": 0.44437775015830994, + "eval_runtime": 21.2824, + "eval_samples_per_second": 77.388, + "eval_steps_per_second": 2.443, + "eval_wer": 0.4681850679195179, + "step": 900 + }, + { + "epoch": 4.13, + "learning_rate": 0.00025689530685920573, + "loss": 0.2066, + "step": 901 + }, + { + "epoch": 4.14, + "learning_rate": 0.00025678700361010827, + "loss": 0.196, + "step": 902 + }, + { + "epoch": 4.14, + "learning_rate": 0.0002566787003610108, + "loss": 0.2003, + "step": 903 + }, + { + "epoch": 4.15, + "learning_rate": 0.00025657039711191336, + "loss": 0.23, + "step": 904 + }, + { + "epoch": 4.15, + "learning_rate": 0.0002564620938628159, + "loss": 0.3632, + "step": 905 + }, + { + "epoch": 4.16, + "learning_rate": 0.0002563537906137184, + "loss": 0.3123, + "step": 906 + }, + { + "epoch": 4.16, + "learning_rate": 0.00025624548736462093, + "loss": 0.335, + "step": 907 + }, + { + "epoch": 4.17, + "learning_rate": 0.0002561371841155235, + "loss": 0.3561, + "step": 908 + }, + { + "epoch": 4.17, + "learning_rate": 0.00025602888086642597, + "loss": 0.417, + "step": 909 + }, + { + "epoch": 4.17, + "learning_rate": 0.0002559205776173285, + "loss": 0.1828, + "step": 910 + }, + { + "epoch": 4.18, + "learning_rate": 0.00025581227436823105, + "loss": 0.2032, + "step": 911 + }, + { + "epoch": 4.18, + "learning_rate": 0.00025570397111913354, + "loss": 0.2922, + "step": 912 + }, + { + "epoch": 4.19, + "learning_rate": 0.0002555956678700361, + "loss": 0.2785, + "step": 913 + }, + { + "epoch": 4.19, + "learning_rate": 0.00025548736462093863, + "loss": 0.2055, + "step": 914 + }, + { + "epoch": 4.2, + "learning_rate": 0.0002553790613718411, + "loss": 0.2526, + "step": 915 + }, + { + "epoch": 4.2, + "learning_rate": 0.00025527075812274366, + "loss": 0.1948, + "step": 916 + }, + { + "epoch": 4.21, + "learning_rate": 0.0002551624548736462, + "loss": 0.2642, + "step": 917 + }, + { + "epoch": 4.21, + "learning_rate": 0.0002550541516245487, + "loss": 0.2267, + "step": 918 + }, + { + "epoch": 4.22, + "learning_rate": 0.00025494584837545124, + "loss": 0.2365, + "step": 919 + }, + { + "epoch": 4.22, + "learning_rate": 0.0002548375451263538, + "loss": 0.2628, + "step": 920 + }, + { + "epoch": 4.22, + "learning_rate": 0.00025472924187725627, + "loss": 0.2963, + "step": 921 + }, + { + "epoch": 4.23, + "learning_rate": 0.0002546209386281588, + "loss": 0.315, + "step": 922 + }, + { + "epoch": 4.23, + "learning_rate": 0.00025451263537906135, + "loss": 0.208, + "step": 923 + }, + { + "epoch": 4.24, + "learning_rate": 0.00025440433212996384, + "loss": 0.2674, + "step": 924 + }, + { + "epoch": 4.24, + "learning_rate": 0.00025429602888086644, + "loss": 0.2296, + "step": 925 + }, + { + "epoch": 4.25, + "learning_rate": 0.00025418772563176893, + "loss": 0.2882, + "step": 926 + }, + { + "epoch": 4.25, + "learning_rate": 0.0002540794223826715, + "loss": 0.2359, + "step": 927 + }, + { + "epoch": 4.26, + "learning_rate": 0.000253971119133574, + "loss": 0.2224, + "step": 928 + }, + { + "epoch": 4.26, + "learning_rate": 0.0002538628158844765, + "loss": 0.2908, + "step": 929 + }, + { + "epoch": 4.27, + "learning_rate": 0.00025375451263537905, + "loss": 0.2182, + "step": 930 + }, + { + "epoch": 4.27, + "learning_rate": 0.0002536462093862816, + "loss": 0.297, + "step": 931 + }, + { + "epoch": 4.28, + "learning_rate": 0.0002535379061371841, + "loss": 0.3345, + "step": 932 + }, + { + "epoch": 4.28, + "learning_rate": 0.0002534296028880866, + "loss": 0.2312, + "step": 933 + }, + { + "epoch": 4.28, + "learning_rate": 0.00025332129963898917, + "loss": 0.3107, + "step": 934 + }, + { + "epoch": 4.29, + "learning_rate": 0.00025321299638989166, + "loss": 0.2248, + "step": 935 + }, + { + "epoch": 4.29, + "learning_rate": 0.0002531046931407942, + "loss": 0.2035, + "step": 936 + }, + { + "epoch": 4.3, + "learning_rate": 0.00025299638989169674, + "loss": 0.1552, + "step": 937 + }, + { + "epoch": 4.3, + "learning_rate": 0.00025288808664259923, + "loss": 0.2033, + "step": 938 + }, + { + "epoch": 4.31, + "learning_rate": 0.0002527797833935018, + "loss": 0.156, + "step": 939 + }, + { + "epoch": 4.31, + "learning_rate": 0.0002526714801444043, + "loss": 0.2203, + "step": 940 + }, + { + "epoch": 4.32, + "learning_rate": 0.0002525631768953068, + "loss": 0.2946, + "step": 941 + }, + { + "epoch": 4.32, + "learning_rate": 0.00025245487364620935, + "loss": 0.1778, + "step": 942 + }, + { + "epoch": 4.33, + "learning_rate": 0.0002523465703971119, + "loss": 0.2763, + "step": 943 + }, + { + "epoch": 4.33, + "learning_rate": 0.0002522382671480144, + "loss": 0.2498, + "step": 944 + }, + { + "epoch": 4.33, + "learning_rate": 0.0002521299638989169, + "loss": 0.2089, + "step": 945 + }, + { + "epoch": 4.34, + "learning_rate": 0.00025202166064981947, + "loss": 0.2617, + "step": 946 + }, + { + "epoch": 4.34, + "learning_rate": 0.000251913357400722, + "loss": 0.3433, + "step": 947 + }, + { + "epoch": 4.35, + "learning_rate": 0.00025180505415162456, + "loss": 0.2043, + "step": 948 + }, + { + "epoch": 4.35, + "learning_rate": 0.00025169675090252704, + "loss": 0.1543, + "step": 949 + }, + { + "epoch": 4.36, + "learning_rate": 0.0002515884476534296, + "loss": 0.2208, + "step": 950 + }, + { + "epoch": 4.36, + "learning_rate": 0.00025148014440433213, + "loss": 0.1462, + "step": 951 + }, + { + "epoch": 4.37, + "learning_rate": 0.0002513718411552346, + "loss": 0.2778, + "step": 952 + }, + { + "epoch": 4.37, + "learning_rate": 0.00025126353790613716, + "loss": 0.2605, + "step": 953 + }, + { + "epoch": 4.38, + "learning_rate": 0.0002511552346570397, + "loss": 0.2026, + "step": 954 + }, + { + "epoch": 4.38, + "learning_rate": 0.0002510469314079422, + "loss": 0.2352, + "step": 955 + }, + { + "epoch": 4.39, + "learning_rate": 0.00025093862815884474, + "loss": 0.2214, + "step": 956 + }, + { + "epoch": 4.39, + "learning_rate": 0.0002508303249097473, + "loss": 0.3178, + "step": 957 + }, + { + "epoch": 4.39, + "learning_rate": 0.00025072202166064977, + "loss": 0.2221, + "step": 958 + }, + { + "epoch": 4.4, + "learning_rate": 0.0002506137184115523, + "loss": 0.2474, + "step": 959 + }, + { + "epoch": 4.4, + "learning_rate": 0.00025050541516245486, + "loss": 0.2611, + "step": 960 + }, + { + "epoch": 4.41, + "learning_rate": 0.00025039711191335735, + "loss": 0.255, + "step": 961 + }, + { + "epoch": 4.41, + "learning_rate": 0.0002502888086642599, + "loss": 0.3132, + "step": 962 + }, + { + "epoch": 4.42, + "learning_rate": 0.00025018050541516243, + "loss": 0.1714, + "step": 963 + }, + { + "epoch": 4.42, + "learning_rate": 0.000250072202166065, + "loss": 0.1702, + "step": 964 + }, + { + "epoch": 4.43, + "learning_rate": 0.00024996389891696747, + "loss": 0.2401, + "step": 965 + }, + { + "epoch": 4.43, + "learning_rate": 0.00024985559566787, + "loss": 0.1915, + "step": 966 + }, + { + "epoch": 4.44, + "learning_rate": 0.00024974729241877255, + "loss": 0.3365, + "step": 967 + }, + { + "epoch": 4.44, + "learning_rate": 0.00024963898916967504, + "loss": 0.3295, + "step": 968 + }, + { + "epoch": 4.44, + "learning_rate": 0.0002495306859205776, + "loss": 0.3081, + "step": 969 + }, + { + "epoch": 4.45, + "learning_rate": 0.00024942238267148013, + "loss": 0.3131, + "step": 970 + }, + { + "epoch": 4.45, + "learning_rate": 0.00024931407942238267, + "loss": 0.2646, + "step": 971 + }, + { + "epoch": 4.46, + "learning_rate": 0.0002492057761732852, + "loss": 0.3324, + "step": 972 + }, + { + "epoch": 4.46, + "learning_rate": 0.0002490974729241877, + "loss": 0.232, + "step": 973 + }, + { + "epoch": 4.47, + "learning_rate": 0.00024898916967509025, + "loss": 0.3071, + "step": 974 + }, + { + "epoch": 4.47, + "learning_rate": 0.0002488808664259928, + "loss": 0.2205, + "step": 975 + }, + { + "epoch": 4.48, + "learning_rate": 0.0002487725631768953, + "loss": 0.225, + "step": 976 + }, + { + "epoch": 4.48, + "learning_rate": 0.0002486642599277978, + "loss": 0.1916, + "step": 977 + }, + { + "epoch": 4.49, + "learning_rate": 0.00024855595667870036, + "loss": 0.2004, + "step": 978 + }, + { + "epoch": 4.49, + "learning_rate": 0.00024844765342960285, + "loss": 0.2448, + "step": 979 + }, + { + "epoch": 4.5, + "learning_rate": 0.0002483393501805054, + "loss": 0.3579, + "step": 980 + }, + { + "epoch": 4.5, + "learning_rate": 0.00024823104693140794, + "loss": 0.2404, + "step": 981 + }, + { + "epoch": 4.5, + "learning_rate": 0.00024812274368231043, + "loss": 0.2826, + "step": 982 + }, + { + "epoch": 4.51, + "learning_rate": 0.00024801444043321297, + "loss": 0.2404, + "step": 983 + }, + { + "epoch": 4.51, + "learning_rate": 0.0002479061371841155, + "loss": 0.1771, + "step": 984 + }, + { + "epoch": 4.52, + "learning_rate": 0.000247797833935018, + "loss": 0.4036, + "step": 985 + }, + { + "epoch": 4.52, + "learning_rate": 0.00024768953068592055, + "loss": 0.1809, + "step": 986 + }, + { + "epoch": 4.53, + "learning_rate": 0.0002475812274368231, + "loss": 0.2435, + "step": 987 + }, + { + "epoch": 4.53, + "learning_rate": 0.0002474729241877256, + "loss": 0.2398, + "step": 988 + }, + { + "epoch": 4.54, + "learning_rate": 0.0002473646209386281, + "loss": 0.136, + "step": 989 + }, + { + "epoch": 4.54, + "learning_rate": 0.00024725631768953067, + "loss": 0.227, + "step": 990 + }, + { + "epoch": 4.55, + "learning_rate": 0.0002471480144404332, + "loss": 0.2346, + "step": 991 + }, + { + "epoch": 4.55, + "learning_rate": 0.00024703971119133575, + "loss": 0.2635, + "step": 992 + }, + { + "epoch": 4.56, + "learning_rate": 0.00024693140794223824, + "loss": 0.1909, + "step": 993 + }, + { + "epoch": 4.56, + "learning_rate": 0.0002468231046931408, + "loss": 0.337, + "step": 994 + }, + { + "epoch": 4.56, + "learning_rate": 0.00024671480144404333, + "loss": 0.288, + "step": 995 + }, + { + "epoch": 4.57, + "learning_rate": 0.0002466064981949458, + "loss": 0.2903, + "step": 996 + }, + { + "epoch": 4.57, + "learning_rate": 0.00024649819494584836, + "loss": 0.1993, + "step": 997 + }, + { + "epoch": 4.58, + "learning_rate": 0.0002463898916967509, + "loss": 0.156, + "step": 998 + }, + { + "epoch": 4.58, + "learning_rate": 0.0002462815884476534, + "loss": 0.2833, + "step": 999 + }, + { + "epoch": 4.59, + "learning_rate": 0.00024617328519855594, + "loss": 0.2373, + "step": 1000 + }, + { + "epoch": 4.59, + "eval_loss": 0.41109123826026917, + "eval_runtime": 20.0855, + "eval_samples_per_second": 82.0, + "eval_steps_per_second": 2.589, + "eval_wer": 0.44316208763149834, + "step": 1000 + }, + { + "epoch": 4.59, + "learning_rate": 0.0002460649819494585, + "loss": 0.1667, + "step": 1001 + }, + { + "epoch": 4.6, + "learning_rate": 0.00024595667870036097, + "loss": 0.2066, + "step": 1002 + }, + { + "epoch": 4.6, + "learning_rate": 0.0002458483754512635, + "loss": 0.1946, + "step": 1003 + }, + { + "epoch": 4.61, + "learning_rate": 0.00024574007220216606, + "loss": 0.2566, + "step": 1004 + }, + { + "epoch": 4.61, + "learning_rate": 0.00024563176895306854, + "loss": 0.2578, + "step": 1005 + }, + { + "epoch": 4.61, + "learning_rate": 0.0002455234657039711, + "loss": 0.2445, + "step": 1006 + }, + { + "epoch": 4.62, + "learning_rate": 0.00024541516245487363, + "loss": 0.2997, + "step": 1007 + }, + { + "epoch": 4.62, + "learning_rate": 0.0002453068592057761, + "loss": 0.2255, + "step": 1008 + }, + { + "epoch": 4.63, + "learning_rate": 0.00024519855595667866, + "loss": 0.2007, + "step": 1009 + }, + { + "epoch": 4.63, + "learning_rate": 0.0002450902527075812, + "loss": 0.2465, + "step": 1010 + }, + { + "epoch": 4.64, + "learning_rate": 0.0002449819494584837, + "loss": 0.2142, + "step": 1011 + }, + { + "epoch": 4.64, + "learning_rate": 0.0002448736462093863, + "loss": 0.2324, + "step": 1012 + }, + { + "epoch": 4.65, + "learning_rate": 0.0002447653429602888, + "loss": 0.2295, + "step": 1013 + }, + { + "epoch": 4.65, + "learning_rate": 0.0002446570397111913, + "loss": 0.1672, + "step": 1014 + }, + { + "epoch": 4.66, + "learning_rate": 0.00024454873646209387, + "loss": 0.242, + "step": 1015 + }, + { + "epoch": 4.66, + "learning_rate": 0.00024444043321299636, + "loss": 0.2292, + "step": 1016 + }, + { + "epoch": 4.67, + "learning_rate": 0.0002443321299638989, + "loss": 0.2236, + "step": 1017 + }, + { + "epoch": 4.67, + "learning_rate": 0.00024422382671480144, + "loss": 0.2654, + "step": 1018 + }, + { + "epoch": 4.67, + "learning_rate": 0.00024411552346570396, + "loss": 0.3037, + "step": 1019 + }, + { + "epoch": 4.68, + "learning_rate": 0.00024400722021660648, + "loss": 0.2341, + "step": 1020 + }, + { + "epoch": 4.68, + "learning_rate": 0.00024389891696750902, + "loss": 0.4602, + "step": 1021 + }, + { + "epoch": 4.69, + "learning_rate": 0.00024379061371841154, + "loss": 0.4068, + "step": 1022 + }, + { + "epoch": 4.69, + "learning_rate": 0.00024368231046931405, + "loss": 0.2204, + "step": 1023 + }, + { + "epoch": 4.7, + "learning_rate": 0.0002435740072202166, + "loss": 0.2602, + "step": 1024 + }, + { + "epoch": 4.7, + "learning_rate": 0.0002434657039711191, + "loss": 0.1994, + "step": 1025 + }, + { + "epoch": 4.71, + "learning_rate": 0.00024335740072202163, + "loss": 0.1598, + "step": 1026 + }, + { + "epoch": 4.71, + "learning_rate": 0.00024324909747292417, + "loss": 0.1603, + "step": 1027 + }, + { + "epoch": 4.72, + "learning_rate": 0.00024314079422382669, + "loss": 0.2571, + "step": 1028 + }, + { + "epoch": 4.72, + "learning_rate": 0.0002430324909747292, + "loss": 0.2004, + "step": 1029 + }, + { + "epoch": 4.72, + "learning_rate": 0.00024292418772563175, + "loss": 0.2159, + "step": 1030 + }, + { + "epoch": 4.73, + "learning_rate": 0.00024281588447653426, + "loss": 0.2145, + "step": 1031 + }, + { + "epoch": 4.73, + "learning_rate": 0.00024270758122743678, + "loss": 0.3055, + "step": 1032 + }, + { + "epoch": 4.74, + "learning_rate": 0.00024259927797833932, + "loss": 0.3923, + "step": 1033 + }, + { + "epoch": 4.74, + "learning_rate": 0.00024249097472924186, + "loss": 0.4797, + "step": 1034 + }, + { + "epoch": 4.75, + "learning_rate": 0.0002423826714801444, + "loss": 0.3232, + "step": 1035 + }, + { + "epoch": 4.75, + "learning_rate": 0.00024227436823104692, + "loss": 0.1694, + "step": 1036 + }, + { + "epoch": 4.76, + "learning_rate": 0.00024216606498194944, + "loss": 0.2261, + "step": 1037 + }, + { + "epoch": 4.76, + "learning_rate": 0.00024205776173285198, + "loss": 0.2278, + "step": 1038 + }, + { + "epoch": 4.77, + "learning_rate": 0.0002419494584837545, + "loss": 0.195, + "step": 1039 + }, + { + "epoch": 4.77, + "learning_rate": 0.00024184115523465702, + "loss": 0.2873, + "step": 1040 + }, + { + "epoch": 4.78, + "learning_rate": 0.00024173285198555956, + "loss": 0.2304, + "step": 1041 + }, + { + "epoch": 4.78, + "learning_rate": 0.00024162454873646207, + "loss": 0.2621, + "step": 1042 + }, + { + "epoch": 4.78, + "learning_rate": 0.0002415162454873646, + "loss": 0.235, + "step": 1043 + }, + { + "epoch": 4.79, + "learning_rate": 0.00024140794223826713, + "loss": 0.2301, + "step": 1044 + }, + { + "epoch": 4.79, + "learning_rate": 0.00024129963898916965, + "loss": 0.3049, + "step": 1045 + }, + { + "epoch": 4.8, + "learning_rate": 0.00024119133574007217, + "loss": 0.2641, + "step": 1046 + }, + { + "epoch": 4.8, + "learning_rate": 0.0002410830324909747, + "loss": 0.2638, + "step": 1047 + }, + { + "epoch": 4.81, + "learning_rate": 0.00024097472924187723, + "loss": 0.249, + "step": 1048 + }, + { + "epoch": 4.81, + "learning_rate": 0.00024086642599277974, + "loss": 0.1635, + "step": 1049 + }, + { + "epoch": 4.82, + "learning_rate": 0.00024075812274368228, + "loss": 0.2095, + "step": 1050 + }, + { + "epoch": 4.82, + "learning_rate": 0.0002406498194945848, + "loss": 0.2339, + "step": 1051 + }, + { + "epoch": 4.83, + "learning_rate": 0.00024054151624548734, + "loss": 0.2968, + "step": 1052 + }, + { + "epoch": 4.83, + "learning_rate": 0.00024043321299638986, + "loss": 0.1763, + "step": 1053 + }, + { + "epoch": 4.83, + "learning_rate": 0.00024032490974729238, + "loss": 0.2671, + "step": 1054 + }, + { + "epoch": 4.84, + "learning_rate": 0.00024021660649819495, + "loss": 0.2591, + "step": 1055 + }, + { + "epoch": 4.84, + "learning_rate": 0.00024010830324909746, + "loss": 0.2433, + "step": 1056 + }, + { + "epoch": 4.85, + "learning_rate": 0.00023999999999999998, + "loss": 0.2445, + "step": 1057 + }, + { + "epoch": 4.85, + "learning_rate": 0.00023989169675090252, + "loss": 0.3433, + "step": 1058 + }, + { + "epoch": 4.86, + "learning_rate": 0.00023978339350180504, + "loss": 0.3004, + "step": 1059 + }, + { + "epoch": 4.86, + "learning_rate": 0.00023967509025270758, + "loss": 0.3585, + "step": 1060 + }, + { + "epoch": 4.87, + "learning_rate": 0.0002395667870036101, + "loss": 0.217, + "step": 1061 + }, + { + "epoch": 4.87, + "learning_rate": 0.00023945848375451261, + "loss": 0.2326, + "step": 1062 + }, + { + "epoch": 4.88, + "learning_rate": 0.00023935018050541516, + "loss": 0.2462, + "step": 1063 + }, + { + "epoch": 4.88, + "learning_rate": 0.00023924187725631767, + "loss": 0.2599, + "step": 1064 + }, + { + "epoch": 4.89, + "learning_rate": 0.0002391335740072202, + "loss": 0.2027, + "step": 1065 + }, + { + "epoch": 4.89, + "learning_rate": 0.00023902527075812273, + "loss": 0.3086, + "step": 1066 + }, + { + "epoch": 4.89, + "learning_rate": 0.00023891696750902525, + "loss": 0.2809, + "step": 1067 + }, + { + "epoch": 4.9, + "learning_rate": 0.00023880866425992776, + "loss": 0.2114, + "step": 1068 + }, + { + "epoch": 4.9, + "learning_rate": 0.0002387003610108303, + "loss": 0.2728, + "step": 1069 + }, + { + "epoch": 4.91, + "learning_rate": 0.00023859205776173282, + "loss": 0.2464, + "step": 1070 + }, + { + "epoch": 4.91, + "learning_rate": 0.00023848375451263534, + "loss": 0.2474, + "step": 1071 + }, + { + "epoch": 4.92, + "learning_rate": 0.00023837545126353788, + "loss": 0.294, + "step": 1072 + }, + { + "epoch": 4.92, + "learning_rate": 0.0002382671480144404, + "loss": 0.1369, + "step": 1073 + }, + { + "epoch": 4.93, + "learning_rate": 0.00023815884476534292, + "loss": 0.2261, + "step": 1074 + }, + { + "epoch": 4.93, + "learning_rate": 0.00023805054151624546, + "loss": 0.1408, + "step": 1075 + }, + { + "epoch": 4.94, + "learning_rate": 0.00023794223826714798, + "loss": 0.1385, + "step": 1076 + }, + { + "epoch": 4.94, + "learning_rate": 0.00023783393501805055, + "loss": 0.1971, + "step": 1077 + }, + { + "epoch": 4.94, + "learning_rate": 0.00023772563176895306, + "loss": 0.1703, + "step": 1078 + }, + { + "epoch": 4.95, + "learning_rate": 0.00023761732851985558, + "loss": 0.2339, + "step": 1079 + }, + { + "epoch": 4.95, + "learning_rate": 0.00023750902527075812, + "loss": 0.2402, + "step": 1080 + }, + { + "epoch": 4.96, + "learning_rate": 0.00023740072202166064, + "loss": 0.3772, + "step": 1081 + }, + { + "epoch": 4.96, + "learning_rate": 0.00023729241877256315, + "loss": 0.1826, + "step": 1082 + }, + { + "epoch": 4.97, + "learning_rate": 0.0002371841155234657, + "loss": 0.3, + "step": 1083 + }, + { + "epoch": 4.97, + "learning_rate": 0.0002370758122743682, + "loss": 0.4994, + "step": 1084 + }, + { + "epoch": 4.98, + "learning_rate": 0.00023696750902527073, + "loss": 0.3555, + "step": 1085 + }, + { + "epoch": 4.98, + "learning_rate": 0.00023685920577617327, + "loss": 0.1722, + "step": 1086 + }, + { + "epoch": 4.99, + "learning_rate": 0.0002367509025270758, + "loss": 0.2886, + "step": 1087 + }, + { + "epoch": 4.99, + "learning_rate": 0.0002366425992779783, + "loss": 0.2577, + "step": 1088 + }, + { + "epoch": 5.0, + "learning_rate": 0.00023653429602888085, + "loss": 0.2641, + "step": 1089 + }, + { + "epoch": 5.0, + "learning_rate": 0.00023642599277978336, + "loss": 0.2622, + "step": 1090 + }, + { + "epoch": 5.0, + "learning_rate": 0.0002363176895306859, + "loss": 0.2808, + "step": 1091 + }, + { + "epoch": 5.01, + "learning_rate": 0.00023620938628158842, + "loss": 0.1563, + "step": 1092 + }, + { + "epoch": 5.01, + "learning_rate": 0.00023610108303249094, + "loss": 0.1992, + "step": 1093 + }, + { + "epoch": 5.02, + "learning_rate": 0.00023599277978339348, + "loss": 0.1246, + "step": 1094 + }, + { + "epoch": 5.02, + "learning_rate": 0.000235884476534296, + "loss": 0.1378, + "step": 1095 + }, + { + "epoch": 5.03, + "learning_rate": 0.00023577617328519851, + "loss": 0.1803, + "step": 1096 + }, + { + "epoch": 5.03, + "learning_rate": 0.00023566787003610106, + "loss": 0.2305, + "step": 1097 + }, + { + "epoch": 5.04, + "learning_rate": 0.00023555956678700357, + "loss": 0.1751, + "step": 1098 + }, + { + "epoch": 5.04, + "learning_rate": 0.00023545126353790614, + "loss": 0.2478, + "step": 1099 + }, + { + "epoch": 5.05, + "learning_rate": 0.00023534296028880866, + "loss": 0.1831, + "step": 1100 + }, + { + "epoch": 5.05, + "eval_loss": 0.41777729988098145, + "eval_runtime": 19.8992, + "eval_samples_per_second": 82.767, + "eval_steps_per_second": 2.613, + "eval_wer": 0.44469410683280564, + "step": 1100 + }, + { + "epoch": 5.05, + "learning_rate": 0.00023523465703971118, + "loss": 0.2754, + "step": 1101 + }, + { + "epoch": 5.06, + "learning_rate": 0.00023512635379061372, + "loss": 0.3208, + "step": 1102 + }, + { + "epoch": 5.06, + "learning_rate": 0.00023501805054151624, + "loss": 0.2406, + "step": 1103 + }, + { + "epoch": 5.06, + "learning_rate": 0.00023490974729241875, + "loss": 0.146, + "step": 1104 + }, + { + "epoch": 5.07, + "learning_rate": 0.0002348014440433213, + "loss": 0.1875, + "step": 1105 + }, + { + "epoch": 5.07, + "learning_rate": 0.0002346931407942238, + "loss": 0.1207, + "step": 1106 + }, + { + "epoch": 5.08, + "learning_rate": 0.00023458483754512633, + "loss": 0.2032, + "step": 1107 + }, + { + "epoch": 5.08, + "learning_rate": 0.00023447653429602887, + "loss": 0.2078, + "step": 1108 + }, + { + "epoch": 5.09, + "learning_rate": 0.0002343682310469314, + "loss": 0.1551, + "step": 1109 + }, + { + "epoch": 5.09, + "learning_rate": 0.0002342599277978339, + "loss": 0.1566, + "step": 1110 + }, + { + "epoch": 5.1, + "learning_rate": 0.00023415162454873645, + "loss": 0.1389, + "step": 1111 + }, + { + "epoch": 5.1, + "learning_rate": 0.00023404332129963896, + "loss": 0.3133, + "step": 1112 + }, + { + "epoch": 5.11, + "learning_rate": 0.00023393501805054148, + "loss": 0.2773, + "step": 1113 + }, + { + "epoch": 5.11, + "learning_rate": 0.00023382671480144402, + "loss": 0.1836, + "step": 1114 + }, + { + "epoch": 5.11, + "learning_rate": 0.00023371841155234654, + "loss": 0.2566, + "step": 1115 + }, + { + "epoch": 5.12, + "learning_rate": 0.00023361010830324905, + "loss": 0.1017, + "step": 1116 + }, + { + "epoch": 5.12, + "learning_rate": 0.0002335018050541516, + "loss": 0.1495, + "step": 1117 + }, + { + "epoch": 5.13, + "learning_rate": 0.0002333935018050541, + "loss": 0.1402, + "step": 1118 + }, + { + "epoch": 5.13, + "learning_rate": 0.00023328519855595663, + "loss": 0.1454, + "step": 1119 + }, + { + "epoch": 5.14, + "learning_rate": 0.0002331768953068592, + "loss": 0.165, + "step": 1120 + }, + { + "epoch": 5.14, + "learning_rate": 0.00023306859205776172, + "loss": 0.2206, + "step": 1121 + }, + { + "epoch": 5.15, + "learning_rate": 0.00023296028880866426, + "loss": 0.2479, + "step": 1122 + }, + { + "epoch": 5.15, + "learning_rate": 0.00023285198555956678, + "loss": 0.2168, + "step": 1123 + }, + { + "epoch": 5.16, + "learning_rate": 0.0002327436823104693, + "loss": 0.115, + "step": 1124 + }, + { + "epoch": 5.16, + "learning_rate": 0.00023263537906137183, + "loss": 0.2707, + "step": 1125 + }, + { + "epoch": 5.17, + "learning_rate": 0.00023252707581227435, + "loss": 0.1416, + "step": 1126 + }, + { + "epoch": 5.17, + "learning_rate": 0.0002324187725631769, + "loss": 0.3826, + "step": 1127 + }, + { + "epoch": 5.17, + "learning_rate": 0.0002323104693140794, + "loss": 0.2214, + "step": 1128 + }, + { + "epoch": 5.18, + "learning_rate": 0.00023220216606498193, + "loss": 0.2007, + "step": 1129 + }, + { + "epoch": 5.18, + "learning_rate": 0.00023209386281588447, + "loss": 0.1162, + "step": 1130 + }, + { + "epoch": 5.19, + "learning_rate": 0.00023198555956678699, + "loss": 0.2067, + "step": 1131 + }, + { + "epoch": 5.19, + "learning_rate": 0.0002318772563176895, + "loss": 0.2043, + "step": 1132 + }, + { + "epoch": 5.2, + "learning_rate": 0.00023176895306859204, + "loss": 0.1798, + "step": 1133 + }, + { + "epoch": 5.2, + "learning_rate": 0.00023166064981949456, + "loss": 0.2487, + "step": 1134 + }, + { + "epoch": 5.21, + "learning_rate": 0.00023155234657039708, + "loss": 0.271, + "step": 1135 + }, + { + "epoch": 5.21, + "learning_rate": 0.00023144404332129962, + "loss": 0.1241, + "step": 1136 + }, + { + "epoch": 5.22, + "learning_rate": 0.00023133574007220214, + "loss": 0.2336, + "step": 1137 + }, + { + "epoch": 5.22, + "learning_rate": 0.00023122743682310465, + "loss": 0.2162, + "step": 1138 + }, + { + "epoch": 5.22, + "learning_rate": 0.0002311191335740072, + "loss": 0.2793, + "step": 1139 + }, + { + "epoch": 5.23, + "learning_rate": 0.0002310108303249097, + "loss": 0.3599, + "step": 1140 + }, + { + "epoch": 5.23, + "learning_rate": 0.00023090252707581223, + "loss": 0.1178, + "step": 1141 + }, + { + "epoch": 5.24, + "learning_rate": 0.0002307942238267148, + "loss": 0.1601, + "step": 1142 + }, + { + "epoch": 5.24, + "learning_rate": 0.00023068592057761731, + "loss": 0.1613, + "step": 1143 + }, + { + "epoch": 5.25, + "learning_rate": 0.00023057761732851986, + "loss": 0.3078, + "step": 1144 + }, + { + "epoch": 5.25, + "learning_rate": 0.00023046931407942237, + "loss": 0.171, + "step": 1145 + }, + { + "epoch": 5.26, + "learning_rate": 0.0002303610108303249, + "loss": 0.1525, + "step": 1146 + }, + { + "epoch": 5.26, + "learning_rate": 0.00023025270758122743, + "loss": 0.2043, + "step": 1147 + }, + { + "epoch": 5.27, + "learning_rate": 0.00023014440433212995, + "loss": 0.1863, + "step": 1148 + }, + { + "epoch": 5.27, + "learning_rate": 0.00023003610108303247, + "loss": 0.2313, + "step": 1149 + }, + { + "epoch": 5.28, + "learning_rate": 0.000229927797833935, + "loss": 0.1705, + "step": 1150 + }, + { + "epoch": 5.28, + "learning_rate": 0.00022981949458483752, + "loss": 0.3569, + "step": 1151 + }, + { + "epoch": 5.28, + "learning_rate": 0.00022971119133574004, + "loss": 0.1316, + "step": 1152 + }, + { + "epoch": 5.29, + "learning_rate": 0.00022960288808664258, + "loss": 0.1573, + "step": 1153 + }, + { + "epoch": 5.29, + "learning_rate": 0.0002294945848375451, + "loss": 0.2185, + "step": 1154 + }, + { + "epoch": 5.3, + "learning_rate": 0.00022938628158844762, + "loss": 0.1423, + "step": 1155 + }, + { + "epoch": 5.3, + "learning_rate": 0.00022927797833935016, + "loss": 0.1913, + "step": 1156 + }, + { + "epoch": 5.31, + "learning_rate": 0.00022916967509025268, + "loss": 0.1621, + "step": 1157 + }, + { + "epoch": 5.31, + "learning_rate": 0.00022906137184115522, + "loss": 0.1644, + "step": 1158 + }, + { + "epoch": 5.32, + "learning_rate": 0.00022895306859205774, + "loss": 0.146, + "step": 1159 + }, + { + "epoch": 5.32, + "learning_rate": 0.00022884476534296025, + "loss": 0.1998, + "step": 1160 + }, + { + "epoch": 5.33, + "learning_rate": 0.0002287364620938628, + "loss": 0.3611, + "step": 1161 + }, + { + "epoch": 5.33, + "learning_rate": 0.0002286281588447653, + "loss": 0.1423, + "step": 1162 + }, + { + "epoch": 5.33, + "learning_rate": 0.00022851985559566783, + "loss": 0.205, + "step": 1163 + }, + { + "epoch": 5.34, + "learning_rate": 0.0002284115523465704, + "loss": 0.1973, + "step": 1164 + }, + { + "epoch": 5.34, + "learning_rate": 0.0002283032490974729, + "loss": 0.2984, + "step": 1165 + }, + { + "epoch": 5.35, + "learning_rate": 0.00022819494584837546, + "loss": 0.1513, + "step": 1166 + }, + { + "epoch": 5.35, + "learning_rate": 0.00022808664259927797, + "loss": 0.1103, + "step": 1167 + }, + { + "epoch": 5.36, + "learning_rate": 0.0002279783393501805, + "loss": 0.1515, + "step": 1168 + }, + { + "epoch": 5.36, + "learning_rate": 0.00022787003610108303, + "loss": 0.2209, + "step": 1169 + }, + { + "epoch": 5.37, + "learning_rate": 0.00022776173285198555, + "loss": 0.0977, + "step": 1170 + }, + { + "epoch": 5.37, + "learning_rate": 0.00022765342960288806, + "loss": 0.1932, + "step": 1171 + }, + { + "epoch": 5.38, + "learning_rate": 0.0002275451263537906, + "loss": 0.2129, + "step": 1172 + }, + { + "epoch": 5.38, + "learning_rate": 0.00022743682310469312, + "loss": 0.2417, + "step": 1173 + }, + { + "epoch": 5.39, + "learning_rate": 0.00022732851985559564, + "loss": 0.2463, + "step": 1174 + }, + { + "epoch": 5.39, + "learning_rate": 0.00022722021660649818, + "loss": 0.2607, + "step": 1175 + }, + { + "epoch": 5.39, + "learning_rate": 0.0002271119133574007, + "loss": 0.2566, + "step": 1176 + }, + { + "epoch": 5.4, + "learning_rate": 0.00022700361010830322, + "loss": 0.3394, + "step": 1177 + }, + { + "epoch": 5.4, + "learning_rate": 0.00022689530685920576, + "loss": 0.2264, + "step": 1178 + }, + { + "epoch": 5.41, + "learning_rate": 0.00022678700361010827, + "loss": 0.107, + "step": 1179 + }, + { + "epoch": 5.41, + "learning_rate": 0.0002266787003610108, + "loss": 0.1893, + "step": 1180 + }, + { + "epoch": 5.42, + "learning_rate": 0.00022657039711191333, + "loss": 0.1821, + "step": 1181 + }, + { + "epoch": 5.42, + "learning_rate": 0.00022646209386281585, + "loss": 0.1597, + "step": 1182 + }, + { + "epoch": 5.43, + "learning_rate": 0.00022635379061371837, + "loss": 0.1591, + "step": 1183 + }, + { + "epoch": 5.43, + "learning_rate": 0.0002262454873646209, + "loss": 0.0853, + "step": 1184 + }, + { + "epoch": 5.44, + "learning_rate": 0.00022613718411552345, + "loss": 0.2411, + "step": 1185 + }, + { + "epoch": 5.44, + "learning_rate": 0.000226028880866426, + "loss": 0.2792, + "step": 1186 + }, + { + "epoch": 5.44, + "learning_rate": 0.0002259205776173285, + "loss": 0.2546, + "step": 1187 + }, + { + "epoch": 5.45, + "learning_rate": 0.00022581227436823103, + "loss": 0.162, + "step": 1188 + }, + { + "epoch": 5.45, + "learning_rate": 0.00022570397111913357, + "loss": 0.2334, + "step": 1189 + }, + { + "epoch": 5.46, + "learning_rate": 0.0002255956678700361, + "loss": 0.2384, + "step": 1190 + }, + { + "epoch": 5.46, + "learning_rate": 0.0002254873646209386, + "loss": 0.1221, + "step": 1191 + }, + { + "epoch": 5.47, + "learning_rate": 0.00022537906137184115, + "loss": 0.1899, + "step": 1192 + }, + { + "epoch": 5.47, + "learning_rate": 0.00022527075812274366, + "loss": 0.1476, + "step": 1193 + }, + { + "epoch": 5.48, + "learning_rate": 0.00022516245487364618, + "loss": 0.187, + "step": 1194 + }, + { + "epoch": 5.48, + "learning_rate": 0.00022505415162454872, + "loss": 0.1151, + "step": 1195 + }, + { + "epoch": 5.49, + "learning_rate": 0.00022494584837545124, + "loss": 0.2515, + "step": 1196 + }, + { + "epoch": 5.49, + "learning_rate": 0.00022483754512635378, + "loss": 0.188, + "step": 1197 + }, + { + "epoch": 5.5, + "learning_rate": 0.0002247292418772563, + "loss": 0.2445, + "step": 1198 + }, + { + "epoch": 5.5, + "learning_rate": 0.00022462093862815881, + "loss": 0.172, + "step": 1199 + }, + { + "epoch": 5.5, + "learning_rate": 0.00022451263537906136, + "loss": 0.2423, + "step": 1200 + }, + { + "epoch": 5.5, + "eval_loss": 0.38813942670822144, + "eval_runtime": 19.8433, + "eval_samples_per_second": 83.0, + "eval_steps_per_second": 2.621, + "eval_wer": 0.4277397610050046, + "step": 1200 + }, + { + "epoch": 5.51, + "learning_rate": 0.00022440433212996387, + "loss": 0.2354, + "step": 1201 + }, + { + "epoch": 5.51, + "learning_rate": 0.0002242960288808664, + "loss": 0.2321, + "step": 1202 + }, + { + "epoch": 5.52, + "learning_rate": 0.00022418772563176893, + "loss": 0.353, + "step": 1203 + }, + { + "epoch": 5.52, + "learning_rate": 0.00022407942238267145, + "loss": 0.2038, + "step": 1204 + }, + { + "epoch": 5.53, + "learning_rate": 0.00022397111913357396, + "loss": 0.1946, + "step": 1205 + }, + { + "epoch": 5.53, + "learning_rate": 0.0002238628158844765, + "loss": 0.1662, + "step": 1206 + }, + { + "epoch": 5.54, + "learning_rate": 0.00022375451263537905, + "loss": 0.1314, + "step": 1207 + }, + { + "epoch": 5.54, + "learning_rate": 0.0002236462093862816, + "loss": 0.1783, + "step": 1208 + }, + { + "epoch": 5.55, + "learning_rate": 0.0002235379061371841, + "loss": 0.1773, + "step": 1209 + }, + { + "epoch": 5.55, + "learning_rate": 0.00022342960288808663, + "loss": 0.241, + "step": 1210 + }, + { + "epoch": 5.56, + "learning_rate": 0.00022332129963898917, + "loss": 0.2135, + "step": 1211 + }, + { + "epoch": 5.56, + "learning_rate": 0.00022321299638989169, + "loss": 0.2318, + "step": 1212 + }, + { + "epoch": 5.56, + "learning_rate": 0.0002231046931407942, + "loss": 0.3598, + "step": 1213 + }, + { + "epoch": 5.57, + "learning_rate": 0.00022299638989169675, + "loss": 0.197, + "step": 1214 + }, + { + "epoch": 5.57, + "learning_rate": 0.00022288808664259926, + "loss": 0.2159, + "step": 1215 + }, + { + "epoch": 5.58, + "learning_rate": 0.00022277978339350178, + "loss": 0.2361, + "step": 1216 + }, + { + "epoch": 5.58, + "learning_rate": 0.00022267148014440432, + "loss": 0.203, + "step": 1217 + }, + { + "epoch": 5.59, + "learning_rate": 0.00022256317689530684, + "loss": 0.2127, + "step": 1218 + }, + { + "epoch": 5.59, + "learning_rate": 0.00022245487364620935, + "loss": 0.2306, + "step": 1219 + }, + { + "epoch": 5.6, + "learning_rate": 0.0002223465703971119, + "loss": 0.1997, + "step": 1220 + }, + { + "epoch": 5.6, + "learning_rate": 0.0002222382671480144, + "loss": 0.1338, + "step": 1221 + }, + { + "epoch": 5.61, + "learning_rate": 0.00022212996389891693, + "loss": 0.3236, + "step": 1222 + }, + { + "epoch": 5.61, + "learning_rate": 0.00022202166064981947, + "loss": 0.2417, + "step": 1223 + }, + { + "epoch": 5.61, + "learning_rate": 0.000221913357400722, + "loss": 0.1575, + "step": 1224 + }, + { + "epoch": 5.62, + "learning_rate": 0.0002218050541516245, + "loss": 0.272, + "step": 1225 + }, + { + "epoch": 5.62, + "learning_rate": 0.00022169675090252705, + "loss": 0.2462, + "step": 1226 + }, + { + "epoch": 5.63, + "learning_rate": 0.00022158844765342956, + "loss": 0.1837, + "step": 1227 + }, + { + "epoch": 5.63, + "learning_rate": 0.00022148014440433213, + "loss": 0.1778, + "step": 1228 + }, + { + "epoch": 5.64, + "learning_rate": 0.00022137184115523465, + "loss": 0.1878, + "step": 1229 + }, + { + "epoch": 5.64, + "learning_rate": 0.00022126353790613717, + "loss": 0.1989, + "step": 1230 + }, + { + "epoch": 5.65, + "learning_rate": 0.0002211552346570397, + "loss": 0.2962, + "step": 1231 + }, + { + "epoch": 5.65, + "learning_rate": 0.00022104693140794223, + "loss": 0.2261, + "step": 1232 + }, + { + "epoch": 5.66, + "learning_rate": 0.00022093862815884474, + "loss": 0.1771, + "step": 1233 + }, + { + "epoch": 5.66, + "learning_rate": 0.00022083032490974728, + "loss": 0.2048, + "step": 1234 + }, + { + "epoch": 5.67, + "learning_rate": 0.0002207220216606498, + "loss": 0.2239, + "step": 1235 + }, + { + "epoch": 5.67, + "learning_rate": 0.00022061371841155234, + "loss": 0.2512, + "step": 1236 + }, + { + "epoch": 5.67, + "learning_rate": 0.00022050541516245486, + "loss": 0.191, + "step": 1237 + }, + { + "epoch": 5.68, + "learning_rate": 0.00022039711191335738, + "loss": 0.2085, + "step": 1238 + }, + { + "epoch": 5.68, + "learning_rate": 0.00022028880866425992, + "loss": 0.3696, + "step": 1239 + }, + { + "epoch": 5.69, + "learning_rate": 0.00022018050541516244, + "loss": 0.3534, + "step": 1240 + }, + { + "epoch": 5.69, + "learning_rate": 0.00022007220216606495, + "loss": 0.1225, + "step": 1241 + }, + { + "epoch": 5.7, + "learning_rate": 0.0002199638989169675, + "loss": 0.2156, + "step": 1242 + }, + { + "epoch": 5.7, + "learning_rate": 0.00021985559566787, + "loss": 0.1559, + "step": 1243 + }, + { + "epoch": 5.71, + "learning_rate": 0.00021974729241877253, + "loss": 0.1919, + "step": 1244 + }, + { + "epoch": 5.71, + "learning_rate": 0.00021963898916967507, + "loss": 0.1196, + "step": 1245 + }, + { + "epoch": 5.72, + "learning_rate": 0.0002195306859205776, + "loss": 0.162, + "step": 1246 + }, + { + "epoch": 5.72, + "learning_rate": 0.0002194223826714801, + "loss": 0.1318, + "step": 1247 + }, + { + "epoch": 5.72, + "learning_rate": 0.00021931407942238265, + "loss": 0.2366, + "step": 1248 + }, + { + "epoch": 5.73, + "learning_rate": 0.00021920577617328516, + "loss": 0.2059, + "step": 1249 + }, + { + "epoch": 5.73, + "learning_rate": 0.00021909747292418773, + "loss": 0.2213, + "step": 1250 + }, + { + "epoch": 5.74, + "learning_rate": 0.00021898916967509025, + "loss": 0.1907, + "step": 1251 + }, + { + "epoch": 5.74, + "learning_rate": 0.00021888086642599276, + "loss": 0.1908, + "step": 1252 + }, + { + "epoch": 5.75, + "learning_rate": 0.0002187725631768953, + "loss": 0.2247, + "step": 1253 + }, + { + "epoch": 5.75, + "learning_rate": 0.00021866425992779782, + "loss": 0.141, + "step": 1254 + }, + { + "epoch": 5.76, + "learning_rate": 0.00021855595667870034, + "loss": 0.2175, + "step": 1255 + }, + { + "epoch": 5.76, + "learning_rate": 0.00021844765342960288, + "loss": 0.1326, + "step": 1256 + }, + { + "epoch": 5.77, + "learning_rate": 0.0002183393501805054, + "loss": 0.1466, + "step": 1257 + }, + { + "epoch": 5.77, + "learning_rate": 0.00021823104693140792, + "loss": 0.0946, + "step": 1258 + }, + { + "epoch": 5.78, + "learning_rate": 0.00021812274368231046, + "loss": 0.0954, + "step": 1259 + }, + { + "epoch": 5.78, + "learning_rate": 0.00021801444043321298, + "loss": 0.1888, + "step": 1260 + }, + { + "epoch": 5.78, + "learning_rate": 0.0002179061371841155, + "loss": 0.2012, + "step": 1261 + }, + { + "epoch": 5.79, + "learning_rate": 0.00021779783393501803, + "loss": 0.1289, + "step": 1262 + }, + { + "epoch": 5.79, + "learning_rate": 0.00021768953068592055, + "loss": 0.1268, + "step": 1263 + }, + { + "epoch": 5.8, + "learning_rate": 0.00021758122743682307, + "loss": 0.2936, + "step": 1264 + }, + { + "epoch": 5.8, + "learning_rate": 0.0002174729241877256, + "loss": 0.2829, + "step": 1265 + }, + { + "epoch": 5.81, + "learning_rate": 0.00021736462093862813, + "loss": 0.1403, + "step": 1266 + }, + { + "epoch": 5.81, + "learning_rate": 0.00021725631768953067, + "loss": 0.1658, + "step": 1267 + }, + { + "epoch": 5.82, + "learning_rate": 0.00021714801444043319, + "loss": 0.2335, + "step": 1268 + }, + { + "epoch": 5.82, + "learning_rate": 0.0002170397111913357, + "loss": 0.1508, + "step": 1269 + }, + { + "epoch": 5.83, + "learning_rate": 0.00021693140794223824, + "loss": 0.1781, + "step": 1270 + }, + { + "epoch": 5.83, + "learning_rate": 0.00021682310469314076, + "loss": 0.172, + "step": 1271 + }, + { + "epoch": 5.83, + "learning_rate": 0.00021671480144404333, + "loss": 0.155, + "step": 1272 + }, + { + "epoch": 5.84, + "learning_rate": 0.00021660649819494585, + "loss": 0.174, + "step": 1273 + }, + { + "epoch": 5.84, + "learning_rate": 0.00021649819494584836, + "loss": 0.2811, + "step": 1274 + }, + { + "epoch": 5.85, + "learning_rate": 0.0002163898916967509, + "loss": 0.169, + "step": 1275 + }, + { + "epoch": 5.85, + "learning_rate": 0.00021628158844765342, + "loss": 0.201, + "step": 1276 + }, + { + "epoch": 5.86, + "learning_rate": 0.00021617328519855594, + "loss": 0.2011, + "step": 1277 + }, + { + "epoch": 5.86, + "learning_rate": 0.00021606498194945848, + "loss": 0.2349, + "step": 1278 + }, + { + "epoch": 5.87, + "learning_rate": 0.000215956678700361, + "loss": 0.2835, + "step": 1279 + }, + { + "epoch": 5.87, + "learning_rate": 0.00021584837545126351, + "loss": 0.1376, + "step": 1280 + }, + { + "epoch": 5.88, + "learning_rate": 0.00021574007220216606, + "loss": 0.146, + "step": 1281 + }, + { + "epoch": 5.88, + "learning_rate": 0.00021563176895306857, + "loss": 0.1425, + "step": 1282 + }, + { + "epoch": 5.89, + "learning_rate": 0.0002155234657039711, + "loss": 0.1523, + "step": 1283 + }, + { + "epoch": 5.89, + "learning_rate": 0.00021541516245487363, + "loss": 0.146, + "step": 1284 + }, + { + "epoch": 5.89, + "learning_rate": 0.00021530685920577615, + "loss": 0.2041, + "step": 1285 + }, + { + "epoch": 5.9, + "learning_rate": 0.00021519855595667867, + "loss": 0.1294, + "step": 1286 + }, + { + "epoch": 5.9, + "learning_rate": 0.0002150902527075812, + "loss": 0.2164, + "step": 1287 + }, + { + "epoch": 5.91, + "learning_rate": 0.00021498194945848372, + "loss": 0.2182, + "step": 1288 + }, + { + "epoch": 5.91, + "learning_rate": 0.00021487364620938624, + "loss": 0.1592, + "step": 1289 + }, + { + "epoch": 5.92, + "learning_rate": 0.00021476534296028878, + "loss": 0.4319, + "step": 1290 + }, + { + "epoch": 5.92, + "learning_rate": 0.0002146570397111913, + "loss": 0.1391, + "step": 1291 + }, + { + "epoch": 5.93, + "learning_rate": 0.00021454873646209382, + "loss": 0.2933, + "step": 1292 + }, + { + "epoch": 5.93, + "learning_rate": 0.0002144404332129964, + "loss": 0.1441, + "step": 1293 + }, + { + "epoch": 5.94, + "learning_rate": 0.0002143321299638989, + "loss": 0.1183, + "step": 1294 + }, + { + "epoch": 5.94, + "learning_rate": 0.00021422382671480145, + "loss": 0.2034, + "step": 1295 + }, + { + "epoch": 5.94, + "learning_rate": 0.00021411552346570396, + "loss": 0.1792, + "step": 1296 + }, + { + "epoch": 5.95, + "learning_rate": 0.00021400722021660648, + "loss": 0.1781, + "step": 1297 + }, + { + "epoch": 5.95, + "learning_rate": 0.00021389891696750902, + "loss": 0.2367, + "step": 1298 + }, + { + "epoch": 5.96, + "learning_rate": 0.00021379061371841154, + "loss": 0.2563, + "step": 1299 + }, + { + "epoch": 5.96, + "learning_rate": 0.00021368231046931405, + "loss": 0.2128, + "step": 1300 + }, + { + "epoch": 5.96, + "eval_loss": 0.3865381181240082, + "eval_runtime": 20.4752, + "eval_samples_per_second": 80.439, + "eval_steps_per_second": 2.54, + "eval_wer": 0.4017975691962006, + "step": 1300 + }, + { + "epoch": 5.97, + "learning_rate": 0.0002135740072202166, + "loss": 0.11, + "step": 1301 + }, + { + "epoch": 5.97, + "learning_rate": 0.0002134657039711191, + "loss": 0.247, + "step": 1302 + }, + { + "epoch": 5.98, + "learning_rate": 0.00021335740072202166, + "loss": 0.2803, + "step": 1303 + }, + { + "epoch": 5.98, + "learning_rate": 0.00021324909747292417, + "loss": 0.1233, + "step": 1304 + }, + { + "epoch": 5.99, + "learning_rate": 0.0002131407942238267, + "loss": 0.1677, + "step": 1305 + }, + { + "epoch": 5.99, + "learning_rate": 0.00021303249097472923, + "loss": 0.1944, + "step": 1306 + }, + { + "epoch": 6.0, + "learning_rate": 0.00021292418772563175, + "loss": 0.1649, + "step": 1307 + }, + { + "epoch": 6.0, + "learning_rate": 0.00021281588447653426, + "loss": 0.4195, + "step": 1308 + }, + { + "epoch": 6.0, + "learning_rate": 0.0002127075812274368, + "loss": 0.123, + "step": 1309 + }, + { + "epoch": 6.01, + "learning_rate": 0.00021259927797833932, + "loss": 0.1455, + "step": 1310 + }, + { + "epoch": 6.01, + "learning_rate": 0.00021249097472924184, + "loss": 0.1475, + "step": 1311 + }, + { + "epoch": 6.02, + "learning_rate": 0.00021238267148014438, + "loss": 0.1317, + "step": 1312 + }, + { + "epoch": 6.02, + "learning_rate": 0.0002122743682310469, + "loss": 0.1032, + "step": 1313 + }, + { + "epoch": 6.03, + "learning_rate": 0.00021216606498194942, + "loss": 0.1525, + "step": 1314 + }, + { + "epoch": 6.03, + "learning_rate": 0.00021205776173285199, + "loss": 0.1142, + "step": 1315 + }, + { + "epoch": 6.04, + "learning_rate": 0.0002119494584837545, + "loss": 0.1174, + "step": 1316 + }, + { + "epoch": 6.04, + "learning_rate": 0.00021184115523465704, + "loss": 0.1639, + "step": 1317 + }, + { + "epoch": 6.05, + "learning_rate": 0.00021173285198555956, + "loss": 0.2727, + "step": 1318 + }, + { + "epoch": 6.05, + "learning_rate": 0.00021162454873646208, + "loss": 0.2804, + "step": 1319 + }, + { + "epoch": 6.06, + "learning_rate": 0.00021151624548736462, + "loss": 0.3224, + "step": 1320 + }, + { + "epoch": 6.06, + "learning_rate": 0.00021140794223826714, + "loss": 0.1565, + "step": 1321 + }, + { + "epoch": 6.06, + "learning_rate": 0.00021129963898916965, + "loss": 0.0901, + "step": 1322 + }, + { + "epoch": 6.07, + "learning_rate": 0.0002111913357400722, + "loss": 0.1136, + "step": 1323 + }, + { + "epoch": 6.07, + "learning_rate": 0.0002110830324909747, + "loss": 0.0821, + "step": 1324 + }, + { + "epoch": 6.08, + "learning_rate": 0.00021097472924187723, + "loss": 0.1113, + "step": 1325 + }, + { + "epoch": 6.08, + "learning_rate": 0.00021086642599277977, + "loss": 0.144, + "step": 1326 + }, + { + "epoch": 6.09, + "learning_rate": 0.0002107581227436823, + "loss": 0.181, + "step": 1327 + }, + { + "epoch": 6.09, + "learning_rate": 0.0002106498194945848, + "loss": 0.0939, + "step": 1328 + }, + { + "epoch": 6.1, + "learning_rate": 0.00021054151624548735, + "loss": 0.1741, + "step": 1329 + }, + { + "epoch": 6.1, + "learning_rate": 0.00021043321299638986, + "loss": 0.1686, + "step": 1330 + }, + { + "epoch": 6.11, + "learning_rate": 0.00021032490974729238, + "loss": 0.1158, + "step": 1331 + }, + { + "epoch": 6.11, + "learning_rate": 0.00021021660649819492, + "loss": 0.1743, + "step": 1332 + }, + { + "epoch": 6.11, + "learning_rate": 0.00021010830324909744, + "loss": 0.1655, + "step": 1333 + }, + { + "epoch": 6.12, + "learning_rate": 0.00020999999999999998, + "loss": 0.1451, + "step": 1334 + }, + { + "epoch": 6.12, + "learning_rate": 0.0002098916967509025, + "loss": 0.1956, + "step": 1335 + }, + { + "epoch": 6.13, + "learning_rate": 0.00020978339350180501, + "loss": 0.1882, + "step": 1336 + }, + { + "epoch": 6.13, + "learning_rate": 0.00020967509025270758, + "loss": 0.0884, + "step": 1337 + }, + { + "epoch": 6.14, + "learning_rate": 0.0002095667870036101, + "loss": 0.109, + "step": 1338 + }, + { + "epoch": 6.14, + "learning_rate": 0.00020945848375451262, + "loss": 0.0998, + "step": 1339 + }, + { + "epoch": 6.15, + "learning_rate": 0.00020935018050541516, + "loss": 0.1597, + "step": 1340 + }, + { + "epoch": 6.15, + "learning_rate": 0.00020924187725631768, + "loss": 0.0983, + "step": 1341 + }, + { + "epoch": 6.16, + "learning_rate": 0.00020913357400722022, + "loss": 0.1591, + "step": 1342 + }, + { + "epoch": 6.16, + "learning_rate": 0.00020902527075812274, + "loss": 0.2107, + "step": 1343 + }, + { + "epoch": 6.17, + "learning_rate": 0.00020891696750902525, + "loss": 0.1885, + "step": 1344 + }, + { + "epoch": 6.17, + "learning_rate": 0.0002088086642599278, + "loss": 0.1606, + "step": 1345 + }, + { + "epoch": 6.17, + "learning_rate": 0.0002087003610108303, + "loss": 0.1658, + "step": 1346 + }, + { + "epoch": 6.18, + "learning_rate": 0.00020859205776173283, + "loss": 0.1062, + "step": 1347 + }, + { + "epoch": 6.18, + "learning_rate": 0.00020848375451263537, + "loss": 0.1019, + "step": 1348 + }, + { + "epoch": 6.19, + "learning_rate": 0.00020837545126353789, + "loss": 0.0899, + "step": 1349 + }, + { + "epoch": 6.19, + "learning_rate": 0.0002082671480144404, + "loss": 0.1026, + "step": 1350 + }, + { + "epoch": 6.2, + "learning_rate": 0.00020815884476534295, + "loss": 0.0673, + "step": 1351 + }, + { + "epoch": 6.2, + "learning_rate": 0.00020805054151624546, + "loss": 0.1993, + "step": 1352 + }, + { + "epoch": 6.21, + "learning_rate": 0.00020794223826714798, + "loss": 0.1392, + "step": 1353 + }, + { + "epoch": 6.21, + "learning_rate": 0.00020783393501805052, + "loss": 0.3194, + "step": 1354 + }, + { + "epoch": 6.22, + "learning_rate": 0.00020772563176895304, + "loss": 0.1094, + "step": 1355 + }, + { + "epoch": 6.22, + "learning_rate": 0.00020761732851985555, + "loss": 0.1906, + "step": 1356 + }, + { + "epoch": 6.22, + "learning_rate": 0.0002075090252707581, + "loss": 0.1134, + "step": 1357 + }, + { + "epoch": 6.23, + "learning_rate": 0.00020740072202166064, + "loss": 0.3591, + "step": 1358 + }, + { + "epoch": 6.23, + "learning_rate": 0.00020729241877256318, + "loss": 0.1466, + "step": 1359 + }, + { + "epoch": 6.24, + "learning_rate": 0.0002071841155234657, + "loss": 0.1813, + "step": 1360 + }, + { + "epoch": 6.24, + "learning_rate": 0.00020707581227436822, + "loss": 0.1362, + "step": 1361 + }, + { + "epoch": 6.25, + "learning_rate": 0.00020696750902527076, + "loss": 0.1613, + "step": 1362 + }, + { + "epoch": 6.25, + "learning_rate": 0.00020685920577617327, + "loss": 0.1225, + "step": 1363 + }, + { + "epoch": 6.26, + "learning_rate": 0.0002067509025270758, + "loss": 0.0967, + "step": 1364 + }, + { + "epoch": 6.26, + "learning_rate": 0.00020664259927797833, + "loss": 0.2137, + "step": 1365 + }, + { + "epoch": 6.27, + "learning_rate": 0.00020653429602888085, + "loss": 0.2358, + "step": 1366 + }, + { + "epoch": 6.27, + "learning_rate": 0.00020642599277978337, + "loss": 0.2252, + "step": 1367 + }, + { + "epoch": 6.28, + "learning_rate": 0.0002063176895306859, + "loss": 0.2165, + "step": 1368 + }, + { + "epoch": 6.28, + "learning_rate": 0.00020620938628158843, + "loss": 0.134, + "step": 1369 + }, + { + "epoch": 6.28, + "learning_rate": 0.00020610108303249094, + "loss": 0.1801, + "step": 1370 + }, + { + "epoch": 6.29, + "learning_rate": 0.00020599277978339348, + "loss": 0.241, + "step": 1371 + }, + { + "epoch": 6.29, + "learning_rate": 0.000205884476534296, + "loss": 0.1193, + "step": 1372 + }, + { + "epoch": 6.3, + "learning_rate": 0.00020577617328519854, + "loss": 0.1802, + "step": 1373 + }, + { + "epoch": 6.3, + "learning_rate": 0.00020566787003610106, + "loss": 0.2307, + "step": 1374 + }, + { + "epoch": 6.31, + "learning_rate": 0.00020555956678700358, + "loss": 0.1151, + "step": 1375 + }, + { + "epoch": 6.31, + "learning_rate": 0.00020545126353790612, + "loss": 0.168, + "step": 1376 + }, + { + "epoch": 6.32, + "learning_rate": 0.00020534296028880864, + "loss": 0.1838, + "step": 1377 + }, + { + "epoch": 6.32, + "learning_rate": 0.00020523465703971115, + "loss": 0.2097, + "step": 1378 + }, + { + "epoch": 6.33, + "learning_rate": 0.0002051263537906137, + "loss": 0.2204, + "step": 1379 + }, + { + "epoch": 6.33, + "learning_rate": 0.00020501805054151624, + "loss": 0.214, + "step": 1380 + }, + { + "epoch": 6.33, + "learning_rate": 0.00020490974729241878, + "loss": 0.1566, + "step": 1381 + }, + { + "epoch": 6.34, + "learning_rate": 0.0002048014440433213, + "loss": 0.1281, + "step": 1382 + }, + { + "epoch": 6.34, + "learning_rate": 0.00020469314079422381, + "loss": 0.3929, + "step": 1383 + }, + { + "epoch": 6.35, + "learning_rate": 0.00020458483754512636, + "loss": 0.1058, + "step": 1384 + }, + { + "epoch": 6.35, + "learning_rate": 0.00020447653429602887, + "loss": 0.134, + "step": 1385 + }, + { + "epoch": 6.36, + "learning_rate": 0.0002043682310469314, + "loss": 0.0722, + "step": 1386 + }, + { + "epoch": 6.36, + "learning_rate": 0.00020425992779783393, + "loss": 0.152, + "step": 1387 + }, + { + "epoch": 6.37, + "learning_rate": 0.00020415162454873645, + "loss": 0.1169, + "step": 1388 + }, + { + "epoch": 6.37, + "learning_rate": 0.00020404332129963896, + "loss": 0.1897, + "step": 1389 + }, + { + "epoch": 6.38, + "learning_rate": 0.0002039350180505415, + "loss": 0.129, + "step": 1390 + }, + { + "epoch": 6.38, + "learning_rate": 0.00020382671480144402, + "loss": 0.1899, + "step": 1391 + }, + { + "epoch": 6.39, + "learning_rate": 0.00020371841155234654, + "loss": 0.2229, + "step": 1392 + }, + { + "epoch": 6.39, + "learning_rate": 0.00020361010830324908, + "loss": 0.1588, + "step": 1393 + }, + { + "epoch": 6.39, + "learning_rate": 0.0002035018050541516, + "loss": 0.2426, + "step": 1394 + }, + { + "epoch": 6.4, + "learning_rate": 0.00020339350180505412, + "loss": 0.2498, + "step": 1395 + }, + { + "epoch": 6.4, + "learning_rate": 0.00020328519855595666, + "loss": 0.1119, + "step": 1396 + }, + { + "epoch": 6.41, + "learning_rate": 0.00020317689530685918, + "loss": 0.1899, + "step": 1397 + }, + { + "epoch": 6.41, + "learning_rate": 0.0002030685920577617, + "loss": 0.1157, + "step": 1398 + }, + { + "epoch": 6.42, + "learning_rate": 0.00020296028880866423, + "loss": 0.1567, + "step": 1399 + }, + { + "epoch": 6.42, + "learning_rate": 0.00020285198555956675, + "loss": 0.1256, + "step": 1400 + }, + { + "epoch": 6.42, + "eval_loss": 0.3817655146121979, + "eval_runtime": 19.9754, + "eval_samples_per_second": 82.451, + "eval_steps_per_second": 2.603, + "eval_wer": 0.4137473189663977, + "step": 1400 + }, + { + "epoch": 6.43, + "learning_rate": 0.00020274368231046927, + "loss": 0.2155, + "step": 1401 + }, + { + "epoch": 6.43, + "learning_rate": 0.00020263537906137184, + "loss": 0.1445, + "step": 1402 + }, + { + "epoch": 6.44, + "learning_rate": 0.00020252707581227435, + "loss": 0.2376, + "step": 1403 + }, + { + "epoch": 6.44, + "learning_rate": 0.0002024187725631769, + "loss": 0.1816, + "step": 1404 + }, + { + "epoch": 6.44, + "learning_rate": 0.0002023104693140794, + "loss": 0.1584, + "step": 1405 + }, + { + "epoch": 6.45, + "learning_rate": 0.00020220216606498193, + "loss": 0.1913, + "step": 1406 + }, + { + "epoch": 6.45, + "learning_rate": 0.00020209386281588447, + "loss": 0.1162, + "step": 1407 + }, + { + "epoch": 6.46, + "learning_rate": 0.000201985559566787, + "loss": 0.2196, + "step": 1408 + }, + { + "epoch": 6.46, + "learning_rate": 0.0002018772563176895, + "loss": 0.1558, + "step": 1409 + }, + { + "epoch": 6.47, + "learning_rate": 0.00020176895306859205, + "loss": 0.118, + "step": 1410 + }, + { + "epoch": 6.47, + "learning_rate": 0.00020166064981949456, + "loss": 0.1222, + "step": 1411 + }, + { + "epoch": 6.48, + "learning_rate": 0.0002015523465703971, + "loss": 0.1749, + "step": 1412 + }, + { + "epoch": 6.48, + "learning_rate": 0.00020144404332129962, + "loss": 0.1776, + "step": 1413 + }, + { + "epoch": 6.49, + "learning_rate": 0.00020133574007220214, + "loss": 0.1671, + "step": 1414 + }, + { + "epoch": 6.49, + "learning_rate": 0.00020122743682310468, + "loss": 0.18, + "step": 1415 + }, + { + "epoch": 6.5, + "learning_rate": 0.0002011191335740072, + "loss": 0.1713, + "step": 1416 + }, + { + "epoch": 6.5, + "learning_rate": 0.00020101083032490971, + "loss": 0.1969, + "step": 1417 + }, + { + "epoch": 6.5, + "learning_rate": 0.00020090252707581226, + "loss": 0.1587, + "step": 1418 + }, + { + "epoch": 6.51, + "learning_rate": 0.00020079422382671477, + "loss": 0.2131, + "step": 1419 + }, + { + "epoch": 6.51, + "learning_rate": 0.0002006859205776173, + "loss": 0.3623, + "step": 1420 + }, + { + "epoch": 6.52, + "learning_rate": 0.00020057761732851983, + "loss": 0.1985, + "step": 1421 + }, + { + "epoch": 6.52, + "learning_rate": 0.00020046931407942235, + "loss": 0.1989, + "step": 1422 + }, + { + "epoch": 6.53, + "learning_rate": 0.00020036101083032492, + "loss": 0.1593, + "step": 1423 + }, + { + "epoch": 6.53, + "learning_rate": 0.00020025270758122744, + "loss": 0.1496, + "step": 1424 + }, + { + "epoch": 6.54, + "learning_rate": 0.00020014440433212995, + "loss": 0.1605, + "step": 1425 + }, + { + "epoch": 6.54, + "learning_rate": 0.0002000361010830325, + "loss": 0.1693, + "step": 1426 + }, + { + "epoch": 6.55, + "learning_rate": 0.000199927797833935, + "loss": 0.0998, + "step": 1427 + }, + { + "epoch": 6.55, + "learning_rate": 0.00019981949458483753, + "loss": 0.0933, + "step": 1428 + }, + { + "epoch": 6.56, + "learning_rate": 0.00019971119133574007, + "loss": 0.1625, + "step": 1429 + }, + { + "epoch": 6.56, + "learning_rate": 0.0001996028880866426, + "loss": 0.1831, + "step": 1430 + }, + { + "epoch": 6.56, + "learning_rate": 0.0001994945848375451, + "loss": 0.0762, + "step": 1431 + }, + { + "epoch": 6.57, + "learning_rate": 0.00019938628158844765, + "loss": 0.2332, + "step": 1432 + }, + { + "epoch": 6.57, + "learning_rate": 0.00019927797833935016, + "loss": 0.1687, + "step": 1433 + }, + { + "epoch": 6.58, + "learning_rate": 0.00019916967509025268, + "loss": 0.1118, + "step": 1434 + }, + { + "epoch": 6.58, + "learning_rate": 0.00019906137184115522, + "loss": 0.141, + "step": 1435 + }, + { + "epoch": 6.59, + "learning_rate": 0.00019895306859205774, + "loss": 0.1015, + "step": 1436 + }, + { + "epoch": 6.59, + "learning_rate": 0.00019884476534296025, + "loss": 0.1005, + "step": 1437 + }, + { + "epoch": 6.6, + "learning_rate": 0.0001987364620938628, + "loss": 0.1779, + "step": 1438 + }, + { + "epoch": 6.6, + "learning_rate": 0.0001986281588447653, + "loss": 0.0821, + "step": 1439 + }, + { + "epoch": 6.61, + "learning_rate": 0.00019851985559566783, + "loss": 0.1171, + "step": 1440 + }, + { + "epoch": 6.61, + "learning_rate": 0.00019841155234657037, + "loss": 0.1969, + "step": 1441 + }, + { + "epoch": 6.61, + "learning_rate": 0.0001983032490974729, + "loss": 0.1662, + "step": 1442 + }, + { + "epoch": 6.62, + "learning_rate": 0.00019819494584837543, + "loss": 0.1993, + "step": 1443 + }, + { + "epoch": 6.62, + "learning_rate": 0.00019808664259927795, + "loss": 0.1474, + "step": 1444 + }, + { + "epoch": 6.63, + "learning_rate": 0.0001979783393501805, + "loss": 0.1644, + "step": 1445 + }, + { + "epoch": 6.63, + "learning_rate": 0.00019787003610108303, + "loss": 0.1841, + "step": 1446 + }, + { + "epoch": 6.64, + "learning_rate": 0.00019776173285198555, + "loss": 0.1609, + "step": 1447 + }, + { + "epoch": 6.64, + "learning_rate": 0.0001976534296028881, + "loss": 0.153, + "step": 1448 + }, + { + "epoch": 6.65, + "learning_rate": 0.0001975451263537906, + "loss": 0.2223, + "step": 1449 + }, + { + "epoch": 6.65, + "learning_rate": 0.00019743682310469313, + "loss": 0.1288, + "step": 1450 + }, + { + "epoch": 6.66, + "learning_rate": 0.00019732851985559567, + "loss": 0.1053, + "step": 1451 + }, + { + "epoch": 6.66, + "learning_rate": 0.00019722021660649819, + "loss": 0.2425, + "step": 1452 + }, + { + "epoch": 6.67, + "learning_rate": 0.0001971119133574007, + "loss": 0.1485, + "step": 1453 + }, + { + "epoch": 6.67, + "learning_rate": 0.00019700361010830324, + "loss": 0.2, + "step": 1454 + }, + { + "epoch": 6.67, + "learning_rate": 0.00019689530685920576, + "loss": 0.1658, + "step": 1455 + }, + { + "epoch": 6.68, + "learning_rate": 0.00019678700361010828, + "loss": 0.2347, + "step": 1456 + }, + { + "epoch": 6.68, + "learning_rate": 0.00019667870036101082, + "loss": 0.3169, + "step": 1457 + }, + { + "epoch": 6.69, + "learning_rate": 0.00019657039711191334, + "loss": 0.1934, + "step": 1458 + }, + { + "epoch": 6.69, + "learning_rate": 0.00019646209386281585, + "loss": 0.0863, + "step": 1459 + }, + { + "epoch": 6.7, + "learning_rate": 0.0001963537906137184, + "loss": 0.1368, + "step": 1460 + }, + { + "epoch": 6.7, + "learning_rate": 0.0001962454873646209, + "loss": 0.1648, + "step": 1461 + }, + { + "epoch": 6.71, + "learning_rate": 0.00019613718411552343, + "loss": 0.0968, + "step": 1462 + }, + { + "epoch": 6.71, + "learning_rate": 0.00019602888086642597, + "loss": 0.1282, + "step": 1463 + }, + { + "epoch": 6.72, + "learning_rate": 0.0001959205776173285, + "loss": 0.1491, + "step": 1464 + }, + { + "epoch": 6.72, + "learning_rate": 0.000195812274368231, + "loss": 0.1154, + "step": 1465 + }, + { + "epoch": 6.72, + "learning_rate": 0.00019570397111913355, + "loss": 0.1908, + "step": 1466 + }, + { + "epoch": 6.73, + "learning_rate": 0.0001955956678700361, + "loss": 0.2541, + "step": 1467 + }, + { + "epoch": 6.73, + "learning_rate": 0.00019548736462093863, + "loss": 0.1666, + "step": 1468 + }, + { + "epoch": 6.74, + "learning_rate": 0.00019537906137184115, + "loss": 0.2337, + "step": 1469 + }, + { + "epoch": 6.74, + "learning_rate": 0.00019527075812274367, + "loss": 0.1449, + "step": 1470 + }, + { + "epoch": 6.75, + "learning_rate": 0.0001951624548736462, + "loss": 0.3607, + "step": 1471 + }, + { + "epoch": 6.75, + "learning_rate": 0.00019505415162454872, + "loss": 0.1426, + "step": 1472 + }, + { + "epoch": 6.76, + "learning_rate": 0.00019494584837545124, + "loss": 0.1715, + "step": 1473 + }, + { + "epoch": 6.76, + "learning_rate": 0.00019483754512635378, + "loss": 0.118, + "step": 1474 + }, + { + "epoch": 6.77, + "learning_rate": 0.0001947292418772563, + "loss": 0.1772, + "step": 1475 + }, + { + "epoch": 6.77, + "learning_rate": 0.00019462093862815882, + "loss": 0.134, + "step": 1476 + }, + { + "epoch": 6.78, + "learning_rate": 0.00019451263537906136, + "loss": 0.0912, + "step": 1477 + }, + { + "epoch": 6.78, + "learning_rate": 0.00019440433212996388, + "loss": 0.2249, + "step": 1478 + }, + { + "epoch": 6.78, + "learning_rate": 0.00019429602888086642, + "loss": 0.1481, + "step": 1479 + }, + { + "epoch": 6.79, + "learning_rate": 0.00019418772563176894, + "loss": 0.1112, + "step": 1480 + }, + { + "epoch": 6.79, + "learning_rate": 0.00019407942238267145, + "loss": 0.0972, + "step": 1481 + }, + { + "epoch": 6.8, + "learning_rate": 0.000193971119133574, + "loss": 0.1437, + "step": 1482 + }, + { + "epoch": 6.8, + "learning_rate": 0.0001938628158844765, + "loss": 0.2131, + "step": 1483 + }, + { + "epoch": 6.81, + "learning_rate": 0.00019375451263537903, + "loss": 0.1831, + "step": 1484 + }, + { + "epoch": 6.81, + "learning_rate": 0.00019364620938628157, + "loss": 0.112, + "step": 1485 + }, + { + "epoch": 6.82, + "learning_rate": 0.00019353790613718409, + "loss": 0.1393, + "step": 1486 + }, + { + "epoch": 6.82, + "learning_rate": 0.0001934296028880866, + "loss": 0.1138, + "step": 1487 + }, + { + "epoch": 6.83, + "learning_rate": 0.00019332129963898917, + "loss": 0.1312, + "step": 1488 + }, + { + "epoch": 6.83, + "learning_rate": 0.0001932129963898917, + "loss": 0.153, + "step": 1489 + }, + { + "epoch": 6.83, + "learning_rate": 0.00019310469314079423, + "loss": 0.1514, + "step": 1490 + }, + { + "epoch": 6.84, + "learning_rate": 0.00019299638989169675, + "loss": 0.1666, + "step": 1491 + }, + { + "epoch": 6.84, + "learning_rate": 0.00019288808664259926, + "loss": 0.1957, + "step": 1492 + }, + { + "epoch": 6.85, + "learning_rate": 0.0001927797833935018, + "loss": 0.2354, + "step": 1493 + }, + { + "epoch": 6.85, + "learning_rate": 0.00019267148014440432, + "loss": 0.1944, + "step": 1494 + }, + { + "epoch": 6.86, + "learning_rate": 0.00019256317689530684, + "loss": 0.1818, + "step": 1495 + }, + { + "epoch": 6.86, + "learning_rate": 0.00019245487364620938, + "loss": 0.2112, + "step": 1496 + }, + { + "epoch": 6.87, + "learning_rate": 0.0001923465703971119, + "loss": 0.0983, + "step": 1497 + }, + { + "epoch": 6.87, + "learning_rate": 0.00019223826714801442, + "loss": 0.1496, + "step": 1498 + }, + { + "epoch": 6.88, + "learning_rate": 0.00019212996389891696, + "loss": 0.1497, + "step": 1499 + }, + { + "epoch": 6.88, + "learning_rate": 0.00019202166064981947, + "loss": 0.1038, + "step": 1500 + }, + { + "epoch": 6.88, + "eval_loss": 0.37394917011260986, + "eval_runtime": 20.0558, + "eval_samples_per_second": 82.121, + "eval_steps_per_second": 2.593, + "eval_wer": 0.3942396078030845, + "step": 1500 + }, + { + "epoch": 6.89, + "learning_rate": 0.000191913357400722, + "loss": 0.1395, + "step": 1501 + }, + { + "epoch": 6.89, + "learning_rate": 0.00019180505415162453, + "loss": 0.1639, + "step": 1502 + }, + { + "epoch": 6.89, + "learning_rate": 0.00019169675090252705, + "loss": 0.1156, + "step": 1503 + }, + { + "epoch": 6.9, + "learning_rate": 0.00019158844765342957, + "loss": 0.1503, + "step": 1504 + }, + { + "epoch": 6.9, + "learning_rate": 0.0001914801444043321, + "loss": 0.1053, + "step": 1505 + }, + { + "epoch": 6.91, + "learning_rate": 0.00019137184115523463, + "loss": 0.1792, + "step": 1506 + }, + { + "epoch": 6.91, + "learning_rate": 0.00019126353790613714, + "loss": 0.2367, + "step": 1507 + }, + { + "epoch": 6.92, + "learning_rate": 0.00019115523465703968, + "loss": 0.2082, + "step": 1508 + }, + { + "epoch": 6.92, + "learning_rate": 0.0001910469314079422, + "loss": 0.1143, + "step": 1509 + }, + { + "epoch": 6.93, + "learning_rate": 0.00019093862815884477, + "loss": 0.1492, + "step": 1510 + }, + { + "epoch": 6.93, + "learning_rate": 0.0001908303249097473, + "loss": 0.1378, + "step": 1511 + }, + { + "epoch": 6.94, + "learning_rate": 0.0001907220216606498, + "loss": 0.1617, + "step": 1512 + }, + { + "epoch": 6.94, + "learning_rate": 0.00019061371841155235, + "loss": 0.0842, + "step": 1513 + }, + { + "epoch": 6.94, + "learning_rate": 0.00019050541516245486, + "loss": 0.1164, + "step": 1514 + }, + { + "epoch": 6.95, + "learning_rate": 0.00019039711191335738, + "loss": 0.2314, + "step": 1515 + }, + { + "epoch": 6.95, + "learning_rate": 0.00019028880866425992, + "loss": 0.1775, + "step": 1516 + }, + { + "epoch": 6.96, + "learning_rate": 0.00019018050541516244, + "loss": 0.0684, + "step": 1517 + }, + { + "epoch": 6.96, + "learning_rate": 0.00019007220216606498, + "loss": 0.1661, + "step": 1518 + }, + { + "epoch": 6.97, + "learning_rate": 0.0001899638989169675, + "loss": 0.169, + "step": 1519 + }, + { + "epoch": 6.97, + "learning_rate": 0.00018985559566787001, + "loss": 0.343, + "step": 1520 + }, + { + "epoch": 6.98, + "learning_rate": 0.00018974729241877256, + "loss": 0.1817, + "step": 1521 + }, + { + "epoch": 6.98, + "learning_rate": 0.00018963898916967507, + "loss": 0.103, + "step": 1522 + }, + { + "epoch": 6.99, + "learning_rate": 0.0001895306859205776, + "loss": 0.1601, + "step": 1523 + }, + { + "epoch": 6.99, + "learning_rate": 0.00018942238267148013, + "loss": 0.1836, + "step": 1524 + }, + { + "epoch": 7.0, + "learning_rate": 0.00018931407942238265, + "loss": 0.2109, + "step": 1525 + }, + { + "epoch": 7.0, + "learning_rate": 0.00018920577617328516, + "loss": 0.1351, + "step": 1526 + }, + { + "epoch": 7.0, + "learning_rate": 0.0001890974729241877, + "loss": 0.112, + "step": 1527 + }, + { + "epoch": 7.01, + "learning_rate": 0.00018898916967509022, + "loss": 0.1405, + "step": 1528 + }, + { + "epoch": 7.01, + "learning_rate": 0.00018888086642599274, + "loss": 0.0643, + "step": 1529 + }, + { + "epoch": 7.02, + "learning_rate": 0.00018877256317689528, + "loss": 0.1651, + "step": 1530 + }, + { + "epoch": 7.02, + "learning_rate": 0.00018866425992779783, + "loss": 0.1226, + "step": 1531 + }, + { + "epoch": 7.03, + "learning_rate": 0.00018855595667870037, + "loss": 0.1107, + "step": 1532 + }, + { + "epoch": 7.03, + "learning_rate": 0.00018844765342960289, + "loss": 0.1547, + "step": 1533 + }, + { + "epoch": 7.04, + "learning_rate": 0.0001883393501805054, + "loss": 0.1232, + "step": 1534 + }, + { + "epoch": 7.04, + "learning_rate": 0.00018823104693140795, + "loss": 0.2184, + "step": 1535 + }, + { + "epoch": 7.05, + "learning_rate": 0.00018812274368231046, + "loss": 0.0938, + "step": 1536 + }, + { + "epoch": 7.05, + "learning_rate": 0.00018801444043321298, + "loss": 0.1627, + "step": 1537 + }, + { + "epoch": 7.06, + "learning_rate": 0.00018790613718411552, + "loss": 0.2463, + "step": 1538 + }, + { + "epoch": 7.06, + "learning_rate": 0.00018779783393501804, + "loss": 0.1229, + "step": 1539 + }, + { + "epoch": 7.06, + "learning_rate": 0.00018768953068592055, + "loss": 0.103, + "step": 1540 + }, + { + "epoch": 7.07, + "learning_rate": 0.0001875812274368231, + "loss": 0.0998, + "step": 1541 + }, + { + "epoch": 7.07, + "learning_rate": 0.0001874729241877256, + "loss": 0.1033, + "step": 1542 + }, + { + "epoch": 7.08, + "learning_rate": 0.00018736462093862813, + "loss": 0.1231, + "step": 1543 + }, + { + "epoch": 7.08, + "learning_rate": 0.00018725631768953067, + "loss": 0.1186, + "step": 1544 + }, + { + "epoch": 7.09, + "learning_rate": 0.0001871480144404332, + "loss": 0.1845, + "step": 1545 + }, + { + "epoch": 7.09, + "learning_rate": 0.0001870397111913357, + "loss": 0.105, + "step": 1546 + }, + { + "epoch": 7.1, + "learning_rate": 0.00018693140794223825, + "loss": 0.1032, + "step": 1547 + }, + { + "epoch": 7.1, + "learning_rate": 0.00018682310469314076, + "loss": 0.2022, + "step": 1548 + }, + { + "epoch": 7.11, + "learning_rate": 0.0001867148014440433, + "loss": 0.2588, + "step": 1549 + }, + { + "epoch": 7.11, + "learning_rate": 0.00018660649819494582, + "loss": 0.1651, + "step": 1550 + }, + { + "epoch": 7.11, + "learning_rate": 0.00018649819494584834, + "loss": 0.1859, + "step": 1551 + }, + { + "epoch": 7.12, + "learning_rate": 0.00018638989169675088, + "loss": 0.0638, + "step": 1552 + }, + { + "epoch": 7.12, + "learning_rate": 0.00018628158844765343, + "loss": 0.1225, + "step": 1553 + }, + { + "epoch": 7.13, + "learning_rate": 0.00018617328519855594, + "loss": 0.0881, + "step": 1554 + }, + { + "epoch": 7.13, + "learning_rate": 0.00018606498194945848, + "loss": 0.1554, + "step": 1555 + }, + { + "epoch": 7.14, + "learning_rate": 0.000185956678700361, + "loss": 0.1536, + "step": 1556 + }, + { + "epoch": 7.14, + "learning_rate": 0.00018584837545126354, + "loss": 0.1009, + "step": 1557 + }, + { + "epoch": 7.15, + "learning_rate": 0.00018574007220216606, + "loss": 0.1331, + "step": 1558 + }, + { + "epoch": 7.15, + "learning_rate": 0.00018563176895306858, + "loss": 0.0944, + "step": 1559 + }, + { + "epoch": 7.16, + "learning_rate": 0.00018552346570397112, + "loss": 0.0721, + "step": 1560 + }, + { + "epoch": 7.16, + "learning_rate": 0.00018541516245487364, + "loss": 0.179, + "step": 1561 + }, + { + "epoch": 7.17, + "learning_rate": 0.00018530685920577615, + "loss": 0.1626, + "step": 1562 + }, + { + "epoch": 7.17, + "learning_rate": 0.0001851985559566787, + "loss": 0.1863, + "step": 1563 + }, + { + "epoch": 7.17, + "learning_rate": 0.0001850902527075812, + "loss": 0.108, + "step": 1564 + }, + { + "epoch": 7.18, + "learning_rate": 0.00018498194945848373, + "loss": 0.0929, + "step": 1565 + }, + { + "epoch": 7.18, + "learning_rate": 0.00018487364620938627, + "loss": 0.1528, + "step": 1566 + }, + { + "epoch": 7.19, + "learning_rate": 0.0001847653429602888, + "loss": 0.0673, + "step": 1567 + }, + { + "epoch": 7.19, + "learning_rate": 0.0001846570397111913, + "loss": 0.0347, + "step": 1568 + }, + { + "epoch": 7.2, + "learning_rate": 0.00018454873646209385, + "loss": 0.1961, + "step": 1569 + }, + { + "epoch": 7.2, + "learning_rate": 0.00018444043321299636, + "loss": 0.1578, + "step": 1570 + }, + { + "epoch": 7.21, + "learning_rate": 0.00018433212996389888, + "loss": 0.0905, + "step": 1571 + }, + { + "epoch": 7.21, + "learning_rate": 0.00018422382671480142, + "loss": 0.0979, + "step": 1572 + }, + { + "epoch": 7.22, + "learning_rate": 0.00018411552346570394, + "loss": 0.0843, + "step": 1573 + }, + { + "epoch": 7.22, + "learning_rate": 0.00018400722021660645, + "loss": 0.1123, + "step": 1574 + }, + { + "epoch": 7.22, + "learning_rate": 0.00018389891696750902, + "loss": 0.1716, + "step": 1575 + }, + { + "epoch": 7.23, + "learning_rate": 0.00018379061371841154, + "loss": 0.3042, + "step": 1576 + }, + { + "epoch": 7.23, + "learning_rate": 0.00018368231046931408, + "loss": 0.1179, + "step": 1577 + }, + { + "epoch": 7.24, + "learning_rate": 0.0001835740072202166, + "loss": 0.0814, + "step": 1578 + }, + { + "epoch": 7.24, + "learning_rate": 0.00018346570397111912, + "loss": 0.1725, + "step": 1579 + }, + { + "epoch": 7.25, + "learning_rate": 0.00018335740072202166, + "loss": 0.0515, + "step": 1580 + }, + { + "epoch": 7.25, + "learning_rate": 0.00018324909747292418, + "loss": 0.0973, + "step": 1581 + }, + { + "epoch": 7.26, + "learning_rate": 0.0001831407942238267, + "loss": 0.1306, + "step": 1582 + }, + { + "epoch": 7.26, + "learning_rate": 0.00018303249097472923, + "loss": 0.1247, + "step": 1583 + }, + { + "epoch": 7.27, + "learning_rate": 0.00018292418772563175, + "loss": 0.139, + "step": 1584 + }, + { + "epoch": 7.27, + "learning_rate": 0.00018281588447653427, + "loss": 0.0923, + "step": 1585 + }, + { + "epoch": 7.28, + "learning_rate": 0.0001827075812274368, + "loss": 0.1803, + "step": 1586 + }, + { + "epoch": 7.28, + "learning_rate": 0.00018259927797833933, + "loss": 0.18, + "step": 1587 + }, + { + "epoch": 7.28, + "learning_rate": 0.00018249097472924187, + "loss": 0.1447, + "step": 1588 + }, + { + "epoch": 7.29, + "learning_rate": 0.00018238267148014439, + "loss": 0.1949, + "step": 1589 + }, + { + "epoch": 7.29, + "learning_rate": 0.0001822743682310469, + "loss": 0.0895, + "step": 1590 + }, + { + "epoch": 7.3, + "learning_rate": 0.00018216606498194944, + "loss": 0.1031, + "step": 1591 + }, + { + "epoch": 7.3, + "learning_rate": 0.00018205776173285196, + "loss": 0.119, + "step": 1592 + }, + { + "epoch": 7.31, + "learning_rate": 0.00018194945848375448, + "loss": 0.1236, + "step": 1593 + }, + { + "epoch": 7.31, + "learning_rate": 0.00018184115523465702, + "loss": 0.1004, + "step": 1594 + }, + { + "epoch": 7.32, + "learning_rate": 0.00018173285198555954, + "loss": 0.1797, + "step": 1595 + }, + { + "epoch": 7.32, + "learning_rate": 0.0001816245487364621, + "loss": 0.1496, + "step": 1596 + }, + { + "epoch": 7.33, + "learning_rate": 0.00018151624548736462, + "loss": 0.1699, + "step": 1597 + }, + { + "epoch": 7.33, + "learning_rate": 0.00018140794223826714, + "loss": 0.1567, + "step": 1598 + }, + { + "epoch": 7.33, + "learning_rate": 0.00018129963898916968, + "loss": 0.1888, + "step": 1599 + }, + { + "epoch": 7.34, + "learning_rate": 0.0001811913357400722, + "loss": 0.1662, + "step": 1600 + }, + { + "epoch": 7.34, + "eval_loss": 0.39384403824806213, + "eval_runtime": 20.6906, + "eval_samples_per_second": 79.601, + "eval_steps_per_second": 2.513, + "eval_wer": 0.3929118578286181, + "step": 1600 + }, + { + "epoch": 7.34, + "learning_rate": 0.00018108303249097471, + "loss": 0.1986, + "step": 1601 + }, + { + "epoch": 7.35, + "learning_rate": 0.00018097472924187726, + "loss": 0.1106, + "step": 1602 + }, + { + "epoch": 7.35, + "learning_rate": 0.00018086642599277977, + "loss": 0.0882, + "step": 1603 + }, + { + "epoch": 7.36, + "learning_rate": 0.0001807581227436823, + "loss": 0.1474, + "step": 1604 + }, + { + "epoch": 7.36, + "learning_rate": 0.00018064981949458483, + "loss": 0.118, + "step": 1605 + }, + { + "epoch": 7.37, + "learning_rate": 0.00018054151624548735, + "loss": 0.1638, + "step": 1606 + }, + { + "epoch": 7.37, + "learning_rate": 0.00018043321299638987, + "loss": 0.115, + "step": 1607 + }, + { + "epoch": 7.38, + "learning_rate": 0.0001803249097472924, + "loss": 0.1041, + "step": 1608 + }, + { + "epoch": 7.38, + "learning_rate": 0.00018021660649819492, + "loss": 0.1516, + "step": 1609 + }, + { + "epoch": 7.39, + "learning_rate": 0.00018010830324909744, + "loss": 0.1976, + "step": 1610 + }, + { + "epoch": 7.39, + "learning_rate": 0.00017999999999999998, + "loss": 0.2617, + "step": 1611 + }, + { + "epoch": 7.39, + "learning_rate": 0.0001798916967509025, + "loss": 0.2021, + "step": 1612 + }, + { + "epoch": 7.4, + "learning_rate": 0.00017978339350180502, + "loss": 0.1454, + "step": 1613 + }, + { + "epoch": 7.4, + "learning_rate": 0.00017967509025270756, + "loss": 0.2009, + "step": 1614 + }, + { + "epoch": 7.41, + "learning_rate": 0.00017956678700361008, + "loss": 0.1255, + "step": 1615 + }, + { + "epoch": 7.41, + "learning_rate": 0.0001794584837545126, + "loss": 0.1593, + "step": 1616 + }, + { + "epoch": 7.42, + "learning_rate": 0.00017935018050541514, + "loss": 0.1463, + "step": 1617 + }, + { + "epoch": 7.42, + "learning_rate": 0.00017924187725631768, + "loss": 0.064, + "step": 1618 + }, + { + "epoch": 7.43, + "learning_rate": 0.00017913357400722022, + "loss": 0.1131, + "step": 1619 + }, + { + "epoch": 7.43, + "learning_rate": 0.00017902527075812274, + "loss": 0.1788, + "step": 1620 + }, + { + "epoch": 7.44, + "learning_rate": 0.00017891696750902525, + "loss": 0.1853, + "step": 1621 + }, + { + "epoch": 7.44, + "learning_rate": 0.0001788086642599278, + "loss": 0.117, + "step": 1622 + }, + { + "epoch": 7.44, + "learning_rate": 0.0001787003610108303, + "loss": 0.1682, + "step": 1623 + }, + { + "epoch": 7.45, + "learning_rate": 0.00017859205776173286, + "loss": 0.1287, + "step": 1624 + }, + { + "epoch": 7.45, + "learning_rate": 0.00017848375451263537, + "loss": 0.2824, + "step": 1625 + }, + { + "epoch": 7.46, + "learning_rate": 0.0001783754512635379, + "loss": 0.2284, + "step": 1626 + }, + { + "epoch": 7.46, + "learning_rate": 0.00017826714801444043, + "loss": 0.0958, + "step": 1627 + }, + { + "epoch": 7.47, + "learning_rate": 0.00017815884476534295, + "loss": 0.1209, + "step": 1628 + }, + { + "epoch": 7.47, + "learning_rate": 0.00017805054151624546, + "loss": 0.0881, + "step": 1629 + }, + { + "epoch": 7.48, + "learning_rate": 0.000177942238267148, + "loss": 0.1284, + "step": 1630 + }, + { + "epoch": 7.48, + "learning_rate": 0.00017783393501805052, + "loss": 0.0862, + "step": 1631 + }, + { + "epoch": 7.49, + "learning_rate": 0.00017772563176895304, + "loss": 0.0815, + "step": 1632 + }, + { + "epoch": 7.49, + "learning_rate": 0.00017761732851985558, + "loss": 0.1508, + "step": 1633 + }, + { + "epoch": 7.5, + "learning_rate": 0.0001775090252707581, + "loss": 0.1986, + "step": 1634 + }, + { + "epoch": 7.5, + "learning_rate": 0.00017740072202166062, + "loss": 0.1475, + "step": 1635 + }, + { + "epoch": 7.5, + "learning_rate": 0.00017729241877256316, + "loss": 0.1969, + "step": 1636 + }, + { + "epoch": 7.51, + "learning_rate": 0.00017718411552346567, + "loss": 0.1962, + "step": 1637 + }, + { + "epoch": 7.51, + "learning_rate": 0.0001770758122743682, + "loss": 0.1576, + "step": 1638 + }, + { + "epoch": 7.52, + "learning_rate": 0.00017696750902527073, + "loss": 0.1486, + "step": 1639 + }, + { + "epoch": 7.52, + "learning_rate": 0.00017685920577617328, + "loss": 0.0708, + "step": 1640 + }, + { + "epoch": 7.53, + "learning_rate": 0.00017675090252707582, + "loss": 0.1319, + "step": 1641 + }, + { + "epoch": 7.53, + "learning_rate": 0.00017664259927797834, + "loss": 0.1068, + "step": 1642 + }, + { + "epoch": 7.54, + "learning_rate": 0.00017653429602888085, + "loss": 0.1189, + "step": 1643 + }, + { + "epoch": 7.54, + "learning_rate": 0.0001764259927797834, + "loss": 0.1046, + "step": 1644 + }, + { + "epoch": 7.55, + "learning_rate": 0.0001763176895306859, + "loss": 0.157, + "step": 1645 + }, + { + "epoch": 7.55, + "learning_rate": 0.00017620938628158843, + "loss": 0.1931, + "step": 1646 + }, + { + "epoch": 7.56, + "learning_rate": 0.00017610108303249097, + "loss": 0.1027, + "step": 1647 + }, + { + "epoch": 7.56, + "learning_rate": 0.0001759927797833935, + "loss": 0.1732, + "step": 1648 + }, + { + "epoch": 7.56, + "learning_rate": 0.000175884476534296, + "loss": 0.113, + "step": 1649 + }, + { + "epoch": 7.57, + "learning_rate": 0.00017577617328519855, + "loss": 0.2927, + "step": 1650 + }, + { + "epoch": 7.57, + "learning_rate": 0.00017566787003610106, + "loss": 0.2615, + "step": 1651 + }, + { + "epoch": 7.58, + "learning_rate": 0.00017555956678700358, + "loss": 0.0847, + "step": 1652 + }, + { + "epoch": 7.58, + "learning_rate": 0.00017545126353790612, + "loss": 0.1258, + "step": 1653 + }, + { + "epoch": 7.59, + "learning_rate": 0.00017534296028880864, + "loss": 0.1056, + "step": 1654 + }, + { + "epoch": 7.59, + "learning_rate": 0.00017523465703971118, + "loss": 0.1223, + "step": 1655 + }, + { + "epoch": 7.6, + "learning_rate": 0.0001751263537906137, + "loss": 0.1075, + "step": 1656 + }, + { + "epoch": 7.6, + "learning_rate": 0.00017501805054151621, + "loss": 0.0866, + "step": 1657 + }, + { + "epoch": 7.61, + "learning_rate": 0.00017490974729241876, + "loss": 0.1755, + "step": 1658 + }, + { + "epoch": 7.61, + "learning_rate": 0.00017480144404332127, + "loss": 0.1039, + "step": 1659 + }, + { + "epoch": 7.61, + "learning_rate": 0.0001746931407942238, + "loss": 0.3223, + "step": 1660 + }, + { + "epoch": 7.62, + "learning_rate": 0.00017458483754512636, + "loss": 0.1085, + "step": 1661 + }, + { + "epoch": 7.62, + "learning_rate": 0.00017447653429602888, + "loss": 0.2045, + "step": 1662 + }, + { + "epoch": 7.63, + "learning_rate": 0.00017436823104693142, + "loss": 0.249, + "step": 1663 + }, + { + "epoch": 7.63, + "learning_rate": 0.00017425992779783394, + "loss": 0.207, + "step": 1664 + }, + { + "epoch": 7.64, + "learning_rate": 0.00017415162454873645, + "loss": 0.0827, + "step": 1665 + }, + { + "epoch": 7.64, + "learning_rate": 0.000174043321299639, + "loss": 0.1086, + "step": 1666 + }, + { + "epoch": 7.65, + "learning_rate": 0.0001739350180505415, + "loss": 0.1792, + "step": 1667 + }, + { + "epoch": 7.65, + "learning_rate": 0.00017382671480144403, + "loss": 0.0806, + "step": 1668 + }, + { + "epoch": 7.66, + "learning_rate": 0.00017371841155234657, + "loss": 0.1475, + "step": 1669 + }, + { + "epoch": 7.66, + "learning_rate": 0.00017361010830324909, + "loss": 0.1333, + "step": 1670 + }, + { + "epoch": 7.67, + "learning_rate": 0.0001735018050541516, + "loss": 0.1051, + "step": 1671 + }, + { + "epoch": 7.67, + "learning_rate": 0.00017339350180505415, + "loss": 0.1355, + "step": 1672 + }, + { + "epoch": 7.67, + "learning_rate": 0.00017328519855595666, + "loss": 0.1767, + "step": 1673 + }, + { + "epoch": 7.68, + "learning_rate": 0.00017317689530685918, + "loss": 0.1798, + "step": 1674 + }, + { + "epoch": 7.68, + "learning_rate": 0.00017306859205776172, + "loss": 0.1352, + "step": 1675 + }, + { + "epoch": 7.69, + "learning_rate": 0.00017296028880866424, + "loss": 0.1205, + "step": 1676 + }, + { + "epoch": 7.69, + "learning_rate": 0.00017285198555956675, + "loss": 0.0936, + "step": 1677 + }, + { + "epoch": 7.7, + "learning_rate": 0.0001727436823104693, + "loss": 0.1879, + "step": 1678 + }, + { + "epoch": 7.7, + "learning_rate": 0.0001726353790613718, + "loss": 0.1412, + "step": 1679 + }, + { + "epoch": 7.71, + "learning_rate": 0.00017252707581227433, + "loss": 0.0788, + "step": 1680 + }, + { + "epoch": 7.71, + "learning_rate": 0.00017241877256317687, + "loss": 0.1069, + "step": 1681 + }, + { + "epoch": 7.72, + "learning_rate": 0.0001723104693140794, + "loss": 0.0561, + "step": 1682 + }, + { + "epoch": 7.72, + "learning_rate": 0.00017220216606498196, + "loss": 0.1374, + "step": 1683 + }, + { + "epoch": 7.72, + "learning_rate": 0.00017209386281588447, + "loss": 0.1231, + "step": 1684 + }, + { + "epoch": 7.73, + "learning_rate": 0.000171985559566787, + "loss": 0.2252, + "step": 1685 + }, + { + "epoch": 7.73, + "learning_rate": 0.00017187725631768953, + "loss": 0.2004, + "step": 1686 + }, + { + "epoch": 7.74, + "learning_rate": 0.00017176895306859205, + "loss": 0.2023, + "step": 1687 + }, + { + "epoch": 7.74, + "learning_rate": 0.00017166064981949457, + "loss": 0.2211, + "step": 1688 + }, + { + "epoch": 7.75, + "learning_rate": 0.0001715523465703971, + "loss": 0.1052, + "step": 1689 + }, + { + "epoch": 7.75, + "learning_rate": 0.00017144404332129963, + "loss": 0.1383, + "step": 1690 + }, + { + "epoch": 7.76, + "learning_rate": 0.00017133574007220214, + "loss": 0.0932, + "step": 1691 + }, + { + "epoch": 7.76, + "learning_rate": 0.00017122743682310468, + "loss": 0.1229, + "step": 1692 + }, + { + "epoch": 7.77, + "learning_rate": 0.0001711191335740072, + "loss": 0.1067, + "step": 1693 + }, + { + "epoch": 7.77, + "learning_rate": 0.00017101083032490974, + "loss": 0.1519, + "step": 1694 + }, + { + "epoch": 7.78, + "learning_rate": 0.00017090252707581226, + "loss": 0.1008, + "step": 1695 + }, + { + "epoch": 7.78, + "learning_rate": 0.00017079422382671478, + "loss": 0.0556, + "step": 1696 + }, + { + "epoch": 7.78, + "learning_rate": 0.00017068592057761732, + "loss": 0.1521, + "step": 1697 + }, + { + "epoch": 7.79, + "learning_rate": 0.00017057761732851984, + "loss": 0.1807, + "step": 1698 + }, + { + "epoch": 7.79, + "learning_rate": 0.00017046931407942235, + "loss": 0.1872, + "step": 1699 + }, + { + "epoch": 7.8, + "learning_rate": 0.0001703610108303249, + "loss": 0.198, + "step": 1700 + }, + { + "epoch": 7.8, + "eval_loss": 0.3831448256969452, + "eval_runtime": 20.6512, + "eval_samples_per_second": 79.753, + "eval_steps_per_second": 2.518, + "eval_wer": 0.3837197426207742, + "step": 1700 + }, + { + "epoch": 7.8, + "learning_rate": 0.0001702527075812274, + "loss": 0.1819, + "step": 1701 + }, + { + "epoch": 7.81, + "learning_rate": 0.00017014440433212993, + "loss": 0.0572, + "step": 1702 + }, + { + "epoch": 7.81, + "learning_rate": 0.00017003610108303247, + "loss": 0.0968, + "step": 1703 + }, + { + "epoch": 7.82, + "learning_rate": 0.000169927797833935, + "loss": 0.1559, + "step": 1704 + }, + { + "epoch": 7.82, + "learning_rate": 0.00016981949458483756, + "loss": 0.0864, + "step": 1705 + }, + { + "epoch": 7.83, + "learning_rate": 0.00016971119133574007, + "loss": 0.0865, + "step": 1706 + }, + { + "epoch": 7.83, + "learning_rate": 0.0001696028880866426, + "loss": 0.1441, + "step": 1707 + }, + { + "epoch": 7.83, + "learning_rate": 0.00016949458483754513, + "loss": 0.1375, + "step": 1708 + }, + { + "epoch": 7.84, + "learning_rate": 0.00016938628158844765, + "loss": 0.1595, + "step": 1709 + }, + { + "epoch": 7.84, + "learning_rate": 0.00016927797833935016, + "loss": 0.2625, + "step": 1710 + }, + { + "epoch": 7.85, + "learning_rate": 0.0001691696750902527, + "loss": 0.1011, + "step": 1711 + }, + { + "epoch": 7.85, + "learning_rate": 0.00016906137184115522, + "loss": 0.1693, + "step": 1712 + }, + { + "epoch": 7.86, + "learning_rate": 0.00016895306859205774, + "loss": 0.1653, + "step": 1713 + }, + { + "epoch": 7.86, + "learning_rate": 0.00016884476534296028, + "loss": 0.2386, + "step": 1714 + }, + { + "epoch": 7.87, + "learning_rate": 0.0001687364620938628, + "loss": 0.2255, + "step": 1715 + }, + { + "epoch": 7.87, + "learning_rate": 0.00016862815884476532, + "loss": 0.1801, + "step": 1716 + }, + { + "epoch": 7.88, + "learning_rate": 0.00016851985559566786, + "loss": 0.1043, + "step": 1717 + }, + { + "epoch": 7.88, + "learning_rate": 0.00016841155234657038, + "loss": 0.13, + "step": 1718 + }, + { + "epoch": 7.89, + "learning_rate": 0.0001683032490974729, + "loss": 0.1365, + "step": 1719 + }, + { + "epoch": 7.89, + "learning_rate": 0.00016819494584837543, + "loss": 0.1314, + "step": 1720 + }, + { + "epoch": 7.89, + "learning_rate": 0.00016808664259927795, + "loss": 0.1558, + "step": 1721 + }, + { + "epoch": 7.9, + "learning_rate": 0.00016797833935018047, + "loss": 0.1485, + "step": 1722 + }, + { + "epoch": 7.9, + "learning_rate": 0.000167870036101083, + "loss": 0.162, + "step": 1723 + }, + { + "epoch": 7.91, + "learning_rate": 0.00016776173285198553, + "loss": 0.2153, + "step": 1724 + }, + { + "epoch": 7.91, + "learning_rate": 0.00016765342960288807, + "loss": 0.1568, + "step": 1725 + }, + { + "epoch": 7.92, + "learning_rate": 0.0001675451263537906, + "loss": 0.2517, + "step": 1726 + }, + { + "epoch": 7.92, + "learning_rate": 0.00016743682310469313, + "loss": 0.1677, + "step": 1727 + }, + { + "epoch": 7.93, + "learning_rate": 0.00016732851985559567, + "loss": 0.1601, + "step": 1728 + }, + { + "epoch": 7.93, + "learning_rate": 0.0001672202166064982, + "loss": 0.1155, + "step": 1729 + }, + { + "epoch": 7.94, + "learning_rate": 0.0001671119133574007, + "loss": 0.1506, + "step": 1730 + }, + { + "epoch": 7.94, + "learning_rate": 0.00016700361010830325, + "loss": 0.0911, + "step": 1731 + }, + { + "epoch": 7.94, + "learning_rate": 0.00016689530685920576, + "loss": 0.1504, + "step": 1732 + }, + { + "epoch": 7.95, + "learning_rate": 0.0001667870036101083, + "loss": 0.0983, + "step": 1733 + }, + { + "epoch": 7.95, + "learning_rate": 0.00016667870036101082, + "loss": 0.0978, + "step": 1734 + }, + { + "epoch": 7.96, + "learning_rate": 0.00016657039711191334, + "loss": 0.1257, + "step": 1735 + }, + { + "epoch": 7.96, + "learning_rate": 0.00016646209386281588, + "loss": 0.1808, + "step": 1736 + }, + { + "epoch": 7.97, + "learning_rate": 0.0001663537906137184, + "loss": 0.2144, + "step": 1737 + }, + { + "epoch": 7.97, + "learning_rate": 0.00016624548736462091, + "loss": 0.1202, + "step": 1738 + }, + { + "epoch": 7.98, + "learning_rate": 0.00016613718411552346, + "loss": 0.1663, + "step": 1739 + }, + { + "epoch": 7.98, + "learning_rate": 0.00016602888086642597, + "loss": 0.1085, + "step": 1740 + }, + { + "epoch": 7.99, + "learning_rate": 0.0001659205776173285, + "loss": 0.1601, + "step": 1741 + }, + { + "epoch": 7.99, + "learning_rate": 0.00016581227436823103, + "loss": 0.1876, + "step": 1742 + }, + { + "epoch": 8.0, + "learning_rate": 0.00016570397111913355, + "loss": 0.1968, + "step": 1743 + }, + { + "epoch": 8.0, + "learning_rate": 0.00016559566787003607, + "loss": 0.1273, + "step": 1744 + }, + { + "epoch": 8.0, + "learning_rate": 0.0001654873646209386, + "loss": 0.0946, + "step": 1745 + }, + { + "epoch": 8.01, + "learning_rate": 0.00016537906137184112, + "loss": 0.0771, + "step": 1746 + }, + { + "epoch": 8.01, + "learning_rate": 0.00016527075812274364, + "loss": 0.0927, + "step": 1747 + }, + { + "epoch": 8.02, + "learning_rate": 0.0001651624548736462, + "loss": 0.1208, + "step": 1748 + }, + { + "epoch": 8.02, + "learning_rate": 0.00016505415162454873, + "loss": 0.082, + "step": 1749 + }, + { + "epoch": 8.03, + "learning_rate": 0.00016494584837545127, + "loss": 0.1702, + "step": 1750 + }, + { + "epoch": 8.03, + "learning_rate": 0.0001648375451263538, + "loss": 0.1187, + "step": 1751 + }, + { + "epoch": 8.04, + "learning_rate": 0.0001647292418772563, + "loss": 0.1498, + "step": 1752 + }, + { + "epoch": 8.04, + "learning_rate": 0.00016462093862815885, + "loss": 0.1683, + "step": 1753 + }, + { + "epoch": 8.05, + "learning_rate": 0.00016451263537906136, + "loss": 0.13, + "step": 1754 + }, + { + "epoch": 8.05, + "learning_rate": 0.00016440433212996388, + "loss": 0.1652, + "step": 1755 + }, + { + "epoch": 8.06, + "learning_rate": 0.00016429602888086642, + "loss": 0.1887, + "step": 1756 + }, + { + "epoch": 8.06, + "learning_rate": 0.00016418772563176894, + "loss": 0.0797, + "step": 1757 + }, + { + "epoch": 8.06, + "learning_rate": 0.00016407942238267145, + "loss": 0.123, + "step": 1758 + }, + { + "epoch": 8.07, + "learning_rate": 0.000163971119133574, + "loss": 0.1056, + "step": 1759 + }, + { + "epoch": 8.07, + "learning_rate": 0.0001638628158844765, + "loss": 0.0715, + "step": 1760 + }, + { + "epoch": 8.08, + "learning_rate": 0.00016375451263537903, + "loss": 0.1123, + "step": 1761 + }, + { + "epoch": 8.08, + "learning_rate": 0.00016364620938628157, + "loss": 0.1135, + "step": 1762 + }, + { + "epoch": 8.09, + "learning_rate": 0.0001635379061371841, + "loss": 0.0627, + "step": 1763 + }, + { + "epoch": 8.09, + "learning_rate": 0.00016342960288808663, + "loss": 0.1227, + "step": 1764 + }, + { + "epoch": 8.1, + "learning_rate": 0.00016332129963898915, + "loss": 0.1702, + "step": 1765 + }, + { + "epoch": 8.1, + "learning_rate": 0.00016321299638989166, + "loss": 0.1214, + "step": 1766 + }, + { + "epoch": 8.11, + "learning_rate": 0.0001631046931407942, + "loss": 0.1745, + "step": 1767 + }, + { + "epoch": 8.11, + "learning_rate": 0.00016299638989169672, + "loss": 0.227, + "step": 1768 + }, + { + "epoch": 8.11, + "learning_rate": 0.00016288808664259927, + "loss": 0.1874, + "step": 1769 + }, + { + "epoch": 8.12, + "learning_rate": 0.0001627797833935018, + "loss": 0.046, + "step": 1770 + }, + { + "epoch": 8.12, + "learning_rate": 0.00016267148014440433, + "loss": 0.0788, + "step": 1771 + }, + { + "epoch": 8.13, + "learning_rate": 0.00016256317689530687, + "loss": 0.1288, + "step": 1772 + }, + { + "epoch": 8.13, + "learning_rate": 0.00016245487364620939, + "loss": 0.0794, + "step": 1773 + }, + { + "epoch": 8.14, + "learning_rate": 0.0001623465703971119, + "loss": 0.0512, + "step": 1774 + }, + { + "epoch": 8.14, + "learning_rate": 0.00016223826714801444, + "loss": 0.1106, + "step": 1775 + }, + { + "epoch": 8.15, + "learning_rate": 0.00016212996389891696, + "loss": 0.1262, + "step": 1776 + }, + { + "epoch": 8.15, + "learning_rate": 0.00016202166064981948, + "loss": 0.1816, + "step": 1777 + }, + { + "epoch": 8.16, + "learning_rate": 0.00016191335740072202, + "loss": 0.127, + "step": 1778 + }, + { + "epoch": 8.16, + "learning_rate": 0.00016180505415162454, + "loss": 0.2061, + "step": 1779 + }, + { + "epoch": 8.17, + "learning_rate": 0.00016169675090252705, + "loss": 0.1933, + "step": 1780 + }, + { + "epoch": 8.17, + "learning_rate": 0.0001615884476534296, + "loss": 0.2388, + "step": 1781 + }, + { + "epoch": 8.17, + "learning_rate": 0.0001614801444043321, + "loss": 0.0929, + "step": 1782 + }, + { + "epoch": 8.18, + "learning_rate": 0.00016137184115523463, + "loss": 0.1151, + "step": 1783 + }, + { + "epoch": 8.18, + "learning_rate": 0.00016126353790613717, + "loss": 0.0565, + "step": 1784 + }, + { + "epoch": 8.19, + "learning_rate": 0.0001611552346570397, + "loss": 0.1354, + "step": 1785 + }, + { + "epoch": 8.19, + "learning_rate": 0.0001610469314079422, + "loss": 0.1155, + "step": 1786 + }, + { + "epoch": 8.2, + "learning_rate": 0.00016093862815884475, + "loss": 0.0798, + "step": 1787 + }, + { + "epoch": 8.2, + "learning_rate": 0.00016083032490974726, + "loss": 0.1083, + "step": 1788 + }, + { + "epoch": 8.21, + "learning_rate": 0.00016072202166064978, + "loss": 0.1912, + "step": 1789 + }, + { + "epoch": 8.21, + "learning_rate": 0.00016061371841155232, + "loss": 0.1365, + "step": 1790 + }, + { + "epoch": 8.22, + "learning_rate": 0.00016050541516245487, + "loss": 0.1171, + "step": 1791 + }, + { + "epoch": 8.22, + "learning_rate": 0.0001603971119133574, + "loss": 0.1853, + "step": 1792 + }, + { + "epoch": 8.22, + "learning_rate": 0.00016028880866425992, + "loss": 0.1297, + "step": 1793 + }, + { + "epoch": 8.23, + "learning_rate": 0.00016018050541516244, + "loss": 0.2399, + "step": 1794 + }, + { + "epoch": 8.23, + "learning_rate": 0.00016007220216606498, + "loss": 0.0798, + "step": 1795 + }, + { + "epoch": 8.24, + "learning_rate": 0.0001599638989169675, + "loss": 0.0816, + "step": 1796 + }, + { + "epoch": 8.24, + "learning_rate": 0.00015985559566787002, + "loss": 0.1499, + "step": 1797 + }, + { + "epoch": 8.25, + "learning_rate": 0.00015974729241877256, + "loss": 0.0484, + "step": 1798 + }, + { + "epoch": 8.25, + "learning_rate": 0.00015963898916967508, + "loss": 0.0588, + "step": 1799 + }, + { + "epoch": 8.26, + "learning_rate": 0.00015953068592057762, + "loss": 0.0728, + "step": 1800 + }, + { + "epoch": 8.26, + "eval_loss": 0.3910059332847595, + "eval_runtime": 20.9844, + "eval_samples_per_second": 78.487, + "eval_steps_per_second": 2.478, + "eval_wer": 0.3866816464099683, + "step": 1800 + }, + { + "epoch": 8.26, + "learning_rate": 0.00015942238267148014, + "loss": 0.1435, + "step": 1801 + }, + { + "epoch": 8.27, + "learning_rate": 0.00015931407942238265, + "loss": 0.0704, + "step": 1802 + }, + { + "epoch": 8.27, + "learning_rate": 0.0001592057761732852, + "loss": 0.078, + "step": 1803 + }, + { + "epoch": 8.28, + "learning_rate": 0.0001590974729241877, + "loss": 0.1847, + "step": 1804 + }, + { + "epoch": 8.28, + "learning_rate": 0.00015898916967509023, + "loss": 0.1201, + "step": 1805 + }, + { + "epoch": 8.28, + "learning_rate": 0.00015888086642599277, + "loss": 0.1877, + "step": 1806 + }, + { + "epoch": 8.29, + "learning_rate": 0.00015877256317689529, + "loss": 0.1017, + "step": 1807 + }, + { + "epoch": 8.29, + "learning_rate": 0.0001586642599277978, + "loss": 0.0667, + "step": 1808 + }, + { + "epoch": 8.3, + "learning_rate": 0.00015855595667870035, + "loss": 0.0572, + "step": 1809 + }, + { + "epoch": 8.3, + "learning_rate": 0.00015844765342960286, + "loss": 0.0826, + "step": 1810 + }, + { + "epoch": 8.31, + "learning_rate": 0.00015833935018050538, + "loss": 0.1066, + "step": 1811 + }, + { + "epoch": 8.31, + "learning_rate": 0.00015823104693140792, + "loss": 0.1097, + "step": 1812 + }, + { + "epoch": 8.32, + "learning_rate": 0.00015812274368231046, + "loss": 0.1257, + "step": 1813 + }, + { + "epoch": 8.32, + "learning_rate": 0.000158014440433213, + "loss": 0.1535, + "step": 1814 + }, + { + "epoch": 8.33, + "learning_rate": 0.00015790613718411552, + "loss": 0.1065, + "step": 1815 + }, + { + "epoch": 8.33, + "learning_rate": 0.00015779783393501804, + "loss": 0.096, + "step": 1816 + }, + { + "epoch": 8.33, + "learning_rate": 0.00015768953068592058, + "loss": 0.1646, + "step": 1817 + }, + { + "epoch": 8.34, + "learning_rate": 0.0001575812274368231, + "loss": 0.2015, + "step": 1818 + }, + { + "epoch": 8.34, + "learning_rate": 0.00015747292418772562, + "loss": 0.2249, + "step": 1819 + }, + { + "epoch": 8.35, + "learning_rate": 0.00015736462093862816, + "loss": 0.0866, + "step": 1820 + }, + { + "epoch": 8.35, + "learning_rate": 0.00015725631768953067, + "loss": 0.0851, + "step": 1821 + }, + { + "epoch": 8.36, + "learning_rate": 0.0001571480144404332, + "loss": 0.0939, + "step": 1822 + }, + { + "epoch": 8.36, + "learning_rate": 0.00015703971119133573, + "loss": 0.0571, + "step": 1823 + }, + { + "epoch": 8.37, + "learning_rate": 0.00015693140794223825, + "loss": 0.0737, + "step": 1824 + }, + { + "epoch": 8.37, + "learning_rate": 0.00015682310469314077, + "loss": 0.1184, + "step": 1825 + }, + { + "epoch": 8.38, + "learning_rate": 0.0001567148014440433, + "loss": 0.1005, + "step": 1826 + }, + { + "epoch": 8.38, + "learning_rate": 0.00015660649819494583, + "loss": 0.086, + "step": 1827 + }, + { + "epoch": 8.39, + "learning_rate": 0.00015649819494584834, + "loss": 0.1681, + "step": 1828 + }, + { + "epoch": 8.39, + "learning_rate": 0.00015638989169675088, + "loss": 0.1329, + "step": 1829 + }, + { + "epoch": 8.39, + "learning_rate": 0.0001562815884476534, + "loss": 0.1466, + "step": 1830 + }, + { + "epoch": 8.4, + "learning_rate": 0.00015617328519855594, + "loss": 0.1419, + "step": 1831 + }, + { + "epoch": 8.4, + "learning_rate": 0.00015606498194945846, + "loss": 0.1462, + "step": 1832 + }, + { + "epoch": 8.41, + "learning_rate": 0.00015595667870036098, + "loss": 0.1228, + "step": 1833 + }, + { + "epoch": 8.41, + "learning_rate": 0.00015584837545126355, + "loss": 0.0469, + "step": 1834 + }, + { + "epoch": 8.42, + "learning_rate": 0.00015574007220216606, + "loss": 0.1045, + "step": 1835 + }, + { + "epoch": 8.42, + "learning_rate": 0.00015563176895306858, + "loss": 0.043, + "step": 1836 + }, + { + "epoch": 8.43, + "learning_rate": 0.00015552346570397112, + "loss": 0.1375, + "step": 1837 + }, + { + "epoch": 8.43, + "learning_rate": 0.00015541516245487364, + "loss": 0.0903, + "step": 1838 + }, + { + "epoch": 8.44, + "learning_rate": 0.00015530685920577618, + "loss": 0.1352, + "step": 1839 + }, + { + "epoch": 8.44, + "learning_rate": 0.0001551985559566787, + "loss": 0.1706, + "step": 1840 + }, + { + "epoch": 8.44, + "learning_rate": 0.00015509025270758121, + "loss": 0.1722, + "step": 1841 + }, + { + "epoch": 8.45, + "learning_rate": 0.00015498194945848376, + "loss": 0.1846, + "step": 1842 + }, + { + "epoch": 8.45, + "learning_rate": 0.00015487364620938627, + "loss": 0.1378, + "step": 1843 + }, + { + "epoch": 8.46, + "learning_rate": 0.0001547653429602888, + "loss": 0.046, + "step": 1844 + }, + { + "epoch": 8.46, + "learning_rate": 0.00015465703971119133, + "loss": 0.0609, + "step": 1845 + }, + { + "epoch": 8.47, + "learning_rate": 0.00015454873646209385, + "loss": 0.1025, + "step": 1846 + }, + { + "epoch": 8.47, + "learning_rate": 0.00015444043321299636, + "loss": 0.0957, + "step": 1847 + }, + { + "epoch": 8.48, + "learning_rate": 0.0001543321299638989, + "loss": 0.1022, + "step": 1848 + }, + { + "epoch": 8.48, + "learning_rate": 0.00015422382671480142, + "loss": 0.0748, + "step": 1849 + }, + { + "epoch": 8.49, + "learning_rate": 0.00015411552346570394, + "loss": 0.1439, + "step": 1850 + }, + { + "epoch": 8.49, + "learning_rate": 0.00015400722021660648, + "loss": 0.134, + "step": 1851 + }, + { + "epoch": 8.5, + "learning_rate": 0.000153898916967509, + "loss": 0.1946, + "step": 1852 + }, + { + "epoch": 8.5, + "learning_rate": 0.00015379061371841152, + "loss": 0.132, + "step": 1853 + }, + { + "epoch": 8.5, + "learning_rate": 0.00015368231046931406, + "loss": 0.1606, + "step": 1854 + }, + { + "epoch": 8.51, + "learning_rate": 0.00015357400722021658, + "loss": 0.148, + "step": 1855 + }, + { + "epoch": 8.51, + "learning_rate": 0.00015346570397111915, + "loss": 0.1816, + "step": 1856 + }, + { + "epoch": 8.52, + "learning_rate": 0.00015335740072202166, + "loss": 0.1013, + "step": 1857 + }, + { + "epoch": 8.52, + "learning_rate": 0.00015324909747292418, + "loss": 0.0986, + "step": 1858 + }, + { + "epoch": 8.53, + "learning_rate": 0.00015314079422382672, + "loss": 0.0998, + "step": 1859 + }, + { + "epoch": 8.53, + "learning_rate": 0.00015303249097472924, + "loss": 0.0473, + "step": 1860 + }, + { + "epoch": 8.54, + "learning_rate": 0.00015292418772563175, + "loss": 0.1311, + "step": 1861 + }, + { + "epoch": 8.54, + "learning_rate": 0.0001528158844765343, + "loss": 0.1033, + "step": 1862 + }, + { + "epoch": 8.55, + "learning_rate": 0.0001527075812274368, + "loss": 0.1128, + "step": 1863 + }, + { + "epoch": 8.55, + "learning_rate": 0.00015259927797833933, + "loss": 0.1252, + "step": 1864 + }, + { + "epoch": 8.56, + "learning_rate": 0.00015249097472924187, + "loss": 0.0973, + "step": 1865 + }, + { + "epoch": 8.56, + "learning_rate": 0.0001523826714801444, + "loss": 0.1431, + "step": 1866 + }, + { + "epoch": 8.56, + "learning_rate": 0.0001522743682310469, + "loss": 0.1164, + "step": 1867 + }, + { + "epoch": 8.57, + "learning_rate": 0.00015216606498194945, + "loss": 0.1775, + "step": 1868 + }, + { + "epoch": 8.57, + "learning_rate": 0.00015205776173285196, + "loss": 0.1641, + "step": 1869 + }, + { + "epoch": 8.58, + "learning_rate": 0.0001519494584837545, + "loss": 0.0824, + "step": 1870 + }, + { + "epoch": 8.58, + "learning_rate": 0.00015184115523465702, + "loss": 0.0608, + "step": 1871 + }, + { + "epoch": 8.59, + "learning_rate": 0.00015173285198555954, + "loss": 0.0685, + "step": 1872 + }, + { + "epoch": 8.59, + "learning_rate": 0.00015162454873646208, + "loss": 0.071, + "step": 1873 + }, + { + "epoch": 8.6, + "learning_rate": 0.0001515162454873646, + "loss": 0.0997, + "step": 1874 + }, + { + "epoch": 8.6, + "learning_rate": 0.00015140794223826711, + "loss": 0.0941, + "step": 1875 + }, + { + "epoch": 8.61, + "learning_rate": 0.00015129963898916966, + "loss": 0.11, + "step": 1876 + }, + { + "epoch": 8.61, + "learning_rate": 0.00015119133574007217, + "loss": 0.1453, + "step": 1877 + }, + { + "epoch": 8.61, + "learning_rate": 0.00015108303249097474, + "loss": 0.1048, + "step": 1878 + }, + { + "epoch": 8.62, + "learning_rate": 0.00015097472924187726, + "loss": 0.0773, + "step": 1879 + }, + { + "epoch": 8.62, + "learning_rate": 0.00015086642599277978, + "loss": 0.1035, + "step": 1880 + }, + { + "epoch": 8.63, + "learning_rate": 0.00015075812274368232, + "loss": 0.1178, + "step": 1881 + }, + { + "epoch": 8.63, + "learning_rate": 0.00015064981949458484, + "loss": 0.0608, + "step": 1882 + }, + { + "epoch": 8.64, + "learning_rate": 0.00015054151624548735, + "loss": 0.0761, + "step": 1883 + }, + { + "epoch": 8.64, + "learning_rate": 0.0001504332129963899, + "loss": 0.0751, + "step": 1884 + }, + { + "epoch": 8.65, + "learning_rate": 0.0001503249097472924, + "loss": 0.0682, + "step": 1885 + }, + { + "epoch": 8.65, + "learning_rate": 0.00015021660649819493, + "loss": 0.1539, + "step": 1886 + }, + { + "epoch": 8.66, + "learning_rate": 0.00015010830324909747, + "loss": 0.1198, + "step": 1887 + }, + { + "epoch": 8.66, + "learning_rate": 0.00015, + "loss": 0.0759, + "step": 1888 + }, + { + "epoch": 8.67, + "learning_rate": 0.0001498916967509025, + "loss": 0.1024, + "step": 1889 + }, + { + "epoch": 8.67, + "learning_rate": 0.00014978339350180505, + "loss": 0.1709, + "step": 1890 + }, + { + "epoch": 8.67, + "learning_rate": 0.00014967509025270756, + "loss": 0.1404, + "step": 1891 + }, + { + "epoch": 8.68, + "learning_rate": 0.00014956678700361008, + "loss": 0.178, + "step": 1892 + }, + { + "epoch": 8.68, + "learning_rate": 0.00014945848375451262, + "loss": 0.1701, + "step": 1893 + }, + { + "epoch": 8.69, + "learning_rate": 0.00014935018050541516, + "loss": 0.2917, + "step": 1894 + }, + { + "epoch": 8.69, + "learning_rate": 0.00014924187725631768, + "loss": 0.0788, + "step": 1895 + }, + { + "epoch": 8.7, + "learning_rate": 0.0001491335740072202, + "loss": 0.0995, + "step": 1896 + }, + { + "epoch": 8.7, + "learning_rate": 0.00014902527075812274, + "loss": 0.0731, + "step": 1897 + }, + { + "epoch": 8.71, + "learning_rate": 0.00014891696750902526, + "loss": 0.1188, + "step": 1898 + }, + { + "epoch": 8.71, + "learning_rate": 0.00014880866425992777, + "loss": 0.0794, + "step": 1899 + }, + { + "epoch": 8.72, + "learning_rate": 0.00014870036101083032, + "loss": 0.123, + "step": 1900 + }, + { + "epoch": 8.72, + "eval_loss": 0.3722236156463623, + "eval_runtime": 19.5626, + "eval_samples_per_second": 84.191, + "eval_steps_per_second": 2.658, + "eval_wer": 0.37350628127872537, + "step": 1900 + }, + { + "epoch": 8.72, + "learning_rate": 0.00014859205776173283, + "loss": 0.1113, + "step": 1901 + }, + { + "epoch": 8.72, + "learning_rate": 0.00014848375451263535, + "loss": 0.1132, + "step": 1902 + }, + { + "epoch": 8.73, + "learning_rate": 0.0001483754512635379, + "loss": 0.1364, + "step": 1903 + }, + { + "epoch": 8.73, + "learning_rate": 0.0001482671480144404, + "loss": 0.1471, + "step": 1904 + }, + { + "epoch": 8.74, + "learning_rate": 0.00014815884476534295, + "loss": 0.1147, + "step": 1905 + }, + { + "epoch": 8.74, + "learning_rate": 0.00014805054151624547, + "loss": 0.1539, + "step": 1906 + }, + { + "epoch": 8.75, + "learning_rate": 0.000147942238267148, + "loss": 0.1706, + "step": 1907 + }, + { + "epoch": 8.75, + "learning_rate": 0.00014783393501805053, + "loss": 0.0924, + "step": 1908 + }, + { + "epoch": 8.76, + "learning_rate": 0.00014772563176895307, + "loss": 0.1973, + "step": 1909 + }, + { + "epoch": 8.76, + "learning_rate": 0.00014761732851985559, + "loss": 0.0781, + "step": 1910 + }, + { + "epoch": 8.77, + "learning_rate": 0.0001475090252707581, + "loss": 0.058, + "step": 1911 + }, + { + "epoch": 8.77, + "learning_rate": 0.00014740072202166064, + "loss": 0.0899, + "step": 1912 + }, + { + "epoch": 8.78, + "learning_rate": 0.00014729241877256316, + "loss": 0.1407, + "step": 1913 + }, + { + "epoch": 8.78, + "learning_rate": 0.00014718411552346568, + "loss": 0.0846, + "step": 1914 + }, + { + "epoch": 8.78, + "learning_rate": 0.00014707581227436822, + "loss": 0.1576, + "step": 1915 + }, + { + "epoch": 8.79, + "learning_rate": 0.00014696750902527076, + "loss": 0.1453, + "step": 1916 + }, + { + "epoch": 8.79, + "learning_rate": 0.00014685920577617328, + "loss": 0.225, + "step": 1917 + }, + { + "epoch": 8.8, + "learning_rate": 0.0001467509025270758, + "loss": 0.2225, + "step": 1918 + }, + { + "epoch": 8.8, + "learning_rate": 0.00014664259927797834, + "loss": 0.1085, + "step": 1919 + }, + { + "epoch": 8.81, + "learning_rate": 0.00014653429602888086, + "loss": 0.1517, + "step": 1920 + }, + { + "epoch": 8.81, + "learning_rate": 0.00014642599277978337, + "loss": 0.1254, + "step": 1921 + }, + { + "epoch": 8.82, + "learning_rate": 0.00014631768953068591, + "loss": 0.0774, + "step": 1922 + }, + { + "epoch": 8.82, + "learning_rate": 0.00014620938628158843, + "loss": 0.1011, + "step": 1923 + }, + { + "epoch": 8.83, + "learning_rate": 0.00014610108303249095, + "loss": 0.1006, + "step": 1924 + }, + { + "epoch": 8.83, + "learning_rate": 0.0001459927797833935, + "loss": 0.0882, + "step": 1925 + }, + { + "epoch": 8.83, + "learning_rate": 0.00014588447653429603, + "loss": 0.1327, + "step": 1926 + }, + { + "epoch": 8.84, + "learning_rate": 0.00014577617328519855, + "loss": 0.1432, + "step": 1927 + }, + { + "epoch": 8.84, + "learning_rate": 0.00014566787003610107, + "loss": 0.176, + "step": 1928 + }, + { + "epoch": 8.85, + "learning_rate": 0.0001455595667870036, + "loss": 0.1059, + "step": 1929 + }, + { + "epoch": 8.85, + "learning_rate": 0.00014545126353790612, + "loss": 0.1798, + "step": 1930 + }, + { + "epoch": 8.86, + "learning_rate": 0.00014534296028880864, + "loss": 0.2902, + "step": 1931 + }, + { + "epoch": 8.86, + "learning_rate": 0.00014523465703971118, + "loss": 0.1217, + "step": 1932 + }, + { + "epoch": 8.87, + "learning_rate": 0.0001451263537906137, + "loss": 0.1069, + "step": 1933 + }, + { + "epoch": 8.87, + "learning_rate": 0.00014501805054151622, + "loss": 0.0902, + "step": 1934 + }, + { + "epoch": 8.88, + "learning_rate": 0.00014490974729241876, + "loss": 0.1265, + "step": 1935 + }, + { + "epoch": 8.88, + "learning_rate": 0.00014480144404332128, + "loss": 0.0595, + "step": 1936 + }, + { + "epoch": 8.89, + "learning_rate": 0.00014469314079422382, + "loss": 0.1499, + "step": 1937 + }, + { + "epoch": 8.89, + "learning_rate": 0.00014458483754512634, + "loss": 0.0561, + "step": 1938 + }, + { + "epoch": 8.89, + "learning_rate": 0.00014447653429602888, + "loss": 0.0896, + "step": 1939 + }, + { + "epoch": 8.9, + "learning_rate": 0.0001443682310469314, + "loss": 0.1576, + "step": 1940 + }, + { + "epoch": 8.9, + "learning_rate": 0.0001442599277978339, + "loss": 0.1554, + "step": 1941 + }, + { + "epoch": 8.91, + "learning_rate": 0.00014415162454873645, + "loss": 0.2377, + "step": 1942 + }, + { + "epoch": 8.91, + "learning_rate": 0.00014404332129963897, + "loss": 0.1331, + "step": 1943 + }, + { + "epoch": 8.92, + "learning_rate": 0.0001439350180505415, + "loss": 0.3323, + "step": 1944 + }, + { + "epoch": 8.92, + "learning_rate": 0.00014382671480144403, + "loss": 0.0813, + "step": 1945 + }, + { + "epoch": 8.93, + "learning_rate": 0.00014371841155234655, + "loss": 0.085, + "step": 1946 + }, + { + "epoch": 8.93, + "learning_rate": 0.0001436101083032491, + "loss": 0.0721, + "step": 1947 + }, + { + "epoch": 8.94, + "learning_rate": 0.00014350180505415163, + "loss": 0.1001, + "step": 1948 + }, + { + "epoch": 8.94, + "learning_rate": 0.00014339350180505415, + "loss": 0.1109, + "step": 1949 + }, + { + "epoch": 8.94, + "learning_rate": 0.00014328519855595666, + "loss": 0.1127, + "step": 1950 + }, + { + "epoch": 8.95, + "learning_rate": 0.0001431768953068592, + "loss": 0.0854, + "step": 1951 + }, + { + "epoch": 8.95, + "learning_rate": 0.00014306859205776172, + "loss": 0.133, + "step": 1952 + }, + { + "epoch": 8.96, + "learning_rate": 0.00014296028880866424, + "loss": 0.1342, + "step": 1953 + }, + { + "epoch": 8.96, + "learning_rate": 0.00014285198555956678, + "loss": 0.1933, + "step": 1954 + }, + { + "epoch": 8.97, + "learning_rate": 0.0001427436823104693, + "loss": 0.1994, + "step": 1955 + }, + { + "epoch": 8.97, + "learning_rate": 0.00014263537906137182, + "loss": 0.2885, + "step": 1956 + }, + { + "epoch": 8.98, + "learning_rate": 0.00014252707581227436, + "loss": 0.0872, + "step": 1957 + }, + { + "epoch": 8.98, + "learning_rate": 0.00014241877256317687, + "loss": 0.0788, + "step": 1958 + }, + { + "epoch": 8.99, + "learning_rate": 0.00014231046931407942, + "loss": 0.1109, + "step": 1959 + }, + { + "epoch": 8.99, + "learning_rate": 0.00014220216606498193, + "loss": 0.1486, + "step": 1960 + }, + { + "epoch": 9.0, + "learning_rate": 0.00014209386281588448, + "loss": 0.1556, + "step": 1961 + }, + { + "epoch": 9.0, + "learning_rate": 0.000141985559566787, + "loss": 0.295, + "step": 1962 + }, + { + "epoch": 9.0, + "learning_rate": 0.0001418772563176895, + "loss": 0.0908, + "step": 1963 + }, + { + "epoch": 9.01, + "learning_rate": 0.00014176895306859205, + "loss": 0.1133, + "step": 1964 + }, + { + "epoch": 9.01, + "learning_rate": 0.00014166064981949457, + "loss": 0.1048, + "step": 1965 + }, + { + "epoch": 9.02, + "learning_rate": 0.00014155234657039708, + "loss": 0.0782, + "step": 1966 + }, + { + "epoch": 9.02, + "learning_rate": 0.00014144404332129963, + "loss": 0.046, + "step": 1967 + }, + { + "epoch": 9.03, + "learning_rate": 0.00014133574007220214, + "loss": 0.0861, + "step": 1968 + }, + { + "epoch": 9.03, + "learning_rate": 0.00014122743682310466, + "loss": 0.1312, + "step": 1969 + }, + { + "epoch": 9.04, + "learning_rate": 0.0001411191335740072, + "loss": 0.1358, + "step": 1970 + }, + { + "epoch": 9.04, + "learning_rate": 0.00014101083032490975, + "loss": 0.0724, + "step": 1971 + }, + { + "epoch": 9.05, + "learning_rate": 0.00014090252707581226, + "loss": 0.1268, + "step": 1972 + }, + { + "epoch": 9.05, + "learning_rate": 0.00014079422382671478, + "loss": 0.1165, + "step": 1973 + }, + { + "epoch": 9.06, + "learning_rate": 0.00014068592057761732, + "loss": 0.1124, + "step": 1974 + }, + { + "epoch": 9.06, + "learning_rate": 0.00014057761732851984, + "loss": 0.1289, + "step": 1975 + }, + { + "epoch": 9.06, + "learning_rate": 0.00014046931407942235, + "loss": 0.1102, + "step": 1976 + }, + { + "epoch": 9.07, + "learning_rate": 0.0001403610108303249, + "loss": 0.1261, + "step": 1977 + }, + { + "epoch": 9.07, + "learning_rate": 0.00014025270758122741, + "loss": 0.1359, + "step": 1978 + }, + { + "epoch": 9.08, + "learning_rate": 0.00014014440433212996, + "loss": 0.0812, + "step": 1979 + }, + { + "epoch": 9.08, + "learning_rate": 0.0001400361010830325, + "loss": 0.0896, + "step": 1980 + }, + { + "epoch": 9.09, + "learning_rate": 0.00013992779783393502, + "loss": 0.0916, + "step": 1981 + }, + { + "epoch": 9.09, + "learning_rate": 0.00013981949458483753, + "loss": 0.1195, + "step": 1982 + }, + { + "epoch": 9.1, + "learning_rate": 0.00013971119133574008, + "loss": 0.1709, + "step": 1983 + }, + { + "epoch": 9.1, + "learning_rate": 0.0001396028880866426, + "loss": 0.0958, + "step": 1984 + }, + { + "epoch": 9.11, + "learning_rate": 0.0001394945848375451, + "loss": 0.1774, + "step": 1985 + }, + { + "epoch": 9.11, + "learning_rate": 0.00013938628158844765, + "loss": 0.1745, + "step": 1986 + }, + { + "epoch": 9.11, + "learning_rate": 0.00013927797833935017, + "loss": 0.1398, + "step": 1987 + }, + { + "epoch": 9.12, + "learning_rate": 0.00013916967509025268, + "loss": 0.06, + "step": 1988 + }, + { + "epoch": 9.12, + "learning_rate": 0.00013906137184115523, + "loss": 0.0421, + "step": 1989 + }, + { + "epoch": 9.13, + "learning_rate": 0.00013895306859205774, + "loss": 0.0613, + "step": 1990 + }, + { + "epoch": 9.13, + "learning_rate": 0.00013884476534296029, + "loss": 0.0522, + "step": 1991 + }, + { + "epoch": 9.14, + "learning_rate": 0.0001387364620938628, + "loss": 0.0659, + "step": 1992 + }, + { + "epoch": 9.14, + "learning_rate": 0.00013862815884476535, + "loss": 0.063, + "step": 1993 + }, + { + "epoch": 9.15, + "learning_rate": 0.00013851985559566786, + "loss": 0.1107, + "step": 1994 + }, + { + "epoch": 9.15, + "learning_rate": 0.00013841155234657038, + "loss": 0.2154, + "step": 1995 + }, + { + "epoch": 9.16, + "learning_rate": 0.00013830324909747292, + "loss": 0.149, + "step": 1996 + }, + { + "epoch": 9.16, + "learning_rate": 0.00013819494584837544, + "loss": 0.1239, + "step": 1997 + }, + { + "epoch": 9.17, + "learning_rate": 0.00013808664259927795, + "loss": 0.0885, + "step": 1998 + }, + { + "epoch": 9.17, + "learning_rate": 0.0001379783393501805, + "loss": 0.1094, + "step": 1999 + }, + { + "epoch": 9.17, + "learning_rate": 0.000137870036101083, + "loss": 0.0776, + "step": 2000 + }, + { + "epoch": 9.17, + "eval_loss": 0.3937987983226776, + "eval_runtime": 19.713, + "eval_samples_per_second": 83.549, + "eval_steps_per_second": 2.638, + "eval_wer": 0.37248493514452047, + "step": 2000 + }, + { + "epoch": 9.18, + "learning_rate": 0.00013776173285198553, + "loss": 0.0358, + "step": 2001 + }, + { + "epoch": 9.18, + "learning_rate": 0.00013765342960288807, + "loss": 0.0864, + "step": 2002 + }, + { + "epoch": 9.19, + "learning_rate": 0.00013754512635379062, + "loss": 0.0879, + "step": 2003 + }, + { + "epoch": 9.19, + "learning_rate": 0.00013743682310469313, + "loss": 0.1096, + "step": 2004 + }, + { + "epoch": 9.2, + "learning_rate": 0.00013732851985559565, + "loss": 0.1502, + "step": 2005 + }, + { + "epoch": 9.2, + "learning_rate": 0.0001372202166064982, + "loss": 0.1286, + "step": 2006 + }, + { + "epoch": 9.21, + "learning_rate": 0.0001371119133574007, + "loss": 0.0963, + "step": 2007 + }, + { + "epoch": 9.21, + "learning_rate": 0.00013700361010830322, + "loss": 0.1371, + "step": 2008 + }, + { + "epoch": 9.22, + "learning_rate": 0.00013689530685920577, + "loss": 0.0718, + "step": 2009 + }, + { + "epoch": 9.22, + "learning_rate": 0.00013678700361010828, + "loss": 0.1477, + "step": 2010 + }, + { + "epoch": 9.22, + "learning_rate": 0.00013667870036101083, + "loss": 0.1169, + "step": 2011 + }, + { + "epoch": 9.23, + "learning_rate": 0.00013657039711191334, + "loss": 0.0876, + "step": 2012 + }, + { + "epoch": 9.23, + "learning_rate": 0.00013646209386281588, + "loss": 0.1322, + "step": 2013 + }, + { + "epoch": 9.24, + "learning_rate": 0.0001363537906137184, + "loss": 0.0786, + "step": 2014 + }, + { + "epoch": 9.24, + "learning_rate": 0.00013624548736462094, + "loss": 0.1005, + "step": 2015 + }, + { + "epoch": 9.25, + "learning_rate": 0.00013613718411552346, + "loss": 0.1235, + "step": 2016 + }, + { + "epoch": 9.25, + "learning_rate": 0.00013602888086642598, + "loss": 0.1004, + "step": 2017 + }, + { + "epoch": 9.26, + "learning_rate": 0.00013592057761732852, + "loss": 0.0836, + "step": 2018 + }, + { + "epoch": 9.26, + "learning_rate": 0.00013581227436823104, + "loss": 0.0911, + "step": 2019 + }, + { + "epoch": 9.27, + "learning_rate": 0.00013570397111913355, + "loss": 0.1423, + "step": 2020 + }, + { + "epoch": 9.27, + "learning_rate": 0.0001355956678700361, + "loss": 0.1467, + "step": 2021 + }, + { + "epoch": 9.28, + "learning_rate": 0.0001354873646209386, + "loss": 0.1069, + "step": 2022 + }, + { + "epoch": 9.28, + "learning_rate": 0.00013537906137184113, + "loss": 0.0971, + "step": 2023 + }, + { + "epoch": 9.28, + "learning_rate": 0.00013527075812274367, + "loss": 0.2705, + "step": 2024 + }, + { + "epoch": 9.29, + "learning_rate": 0.00013516245487364621, + "loss": 0.0601, + "step": 2025 + }, + { + "epoch": 9.29, + "learning_rate": 0.00013505415162454873, + "loss": 0.1134, + "step": 2026 + }, + { + "epoch": 9.3, + "learning_rate": 0.00013494584837545125, + "loss": 0.0958, + "step": 2027 + }, + { + "epoch": 9.3, + "learning_rate": 0.0001348375451263538, + "loss": 0.0763, + "step": 2028 + }, + { + "epoch": 9.31, + "learning_rate": 0.0001347292418772563, + "loss": 0.1233, + "step": 2029 + }, + { + "epoch": 9.31, + "learning_rate": 0.00013462093862815882, + "loss": 0.0613, + "step": 2030 + }, + { + "epoch": 9.32, + "learning_rate": 0.00013451263537906136, + "loss": 0.0873, + "step": 2031 + }, + { + "epoch": 9.32, + "learning_rate": 0.00013440433212996388, + "loss": 0.0624, + "step": 2032 + }, + { + "epoch": 9.33, + "learning_rate": 0.0001342960288808664, + "loss": 0.0854, + "step": 2033 + }, + { + "epoch": 9.33, + "learning_rate": 0.00013418772563176894, + "loss": 0.174, + "step": 2034 + }, + { + "epoch": 9.33, + "learning_rate": 0.00013407942238267148, + "loss": 0.1406, + "step": 2035 + }, + { + "epoch": 9.34, + "learning_rate": 0.000133971119133574, + "loss": 0.1801, + "step": 2036 + }, + { + "epoch": 9.34, + "learning_rate": 0.00013386281588447652, + "loss": 0.1922, + "step": 2037 + }, + { + "epoch": 9.35, + "learning_rate": 0.00013375451263537906, + "loss": 0.084, + "step": 2038 + }, + { + "epoch": 9.35, + "learning_rate": 0.00013364620938628158, + "loss": 0.1225, + "step": 2039 + }, + { + "epoch": 9.36, + "learning_rate": 0.0001335379061371841, + "loss": 0.0642, + "step": 2040 + }, + { + "epoch": 9.36, + "learning_rate": 0.00013342960288808663, + "loss": 0.0665, + "step": 2041 + }, + { + "epoch": 9.37, + "learning_rate": 0.00013332129963898915, + "loss": 0.0654, + "step": 2042 + }, + { + "epoch": 9.37, + "learning_rate": 0.00013321299638989167, + "loss": 0.1147, + "step": 2043 + }, + { + "epoch": 9.38, + "learning_rate": 0.0001331046931407942, + "loss": 0.0926, + "step": 2044 + }, + { + "epoch": 9.38, + "learning_rate": 0.00013299638989169675, + "loss": 0.0562, + "step": 2045 + }, + { + "epoch": 9.39, + "learning_rate": 0.00013288808664259927, + "loss": 0.1468, + "step": 2046 + }, + { + "epoch": 9.39, + "learning_rate": 0.00013277978339350179, + "loss": 0.1001, + "step": 2047 + }, + { + "epoch": 9.39, + "learning_rate": 0.00013267148014440433, + "loss": 0.2049, + "step": 2048 + }, + { + "epoch": 9.4, + "learning_rate": 0.00013256317689530684, + "loss": 0.157, + "step": 2049 + }, + { + "epoch": 9.4, + "learning_rate": 0.0001324548736462094, + "loss": 0.1591, + "step": 2050 + }, + { + "epoch": 9.41, + "learning_rate": 0.0001323465703971119, + "loss": 0.0682, + "step": 2051 + }, + { + "epoch": 9.41, + "learning_rate": 0.00013223826714801442, + "loss": 0.0679, + "step": 2052 + }, + { + "epoch": 9.42, + "learning_rate": 0.00013212996389891696, + "loss": 0.1037, + "step": 2053 + }, + { + "epoch": 9.42, + "learning_rate": 0.00013202166064981948, + "loss": 0.0619, + "step": 2054 + }, + { + "epoch": 9.43, + "learning_rate": 0.000131913357400722, + "loss": 0.0519, + "step": 2055 + }, + { + "epoch": 9.43, + "learning_rate": 0.00013180505415162454, + "loss": 0.1106, + "step": 2056 + }, + { + "epoch": 9.44, + "learning_rate": 0.00013169675090252708, + "loss": 0.1044, + "step": 2057 + }, + { + "epoch": 9.44, + "learning_rate": 0.0001315884476534296, + "loss": 0.0946, + "step": 2058 + }, + { + "epoch": 9.44, + "learning_rate": 0.00013148014440433211, + "loss": 0.1685, + "step": 2059 + }, + { + "epoch": 9.45, + "learning_rate": 0.00013137184115523466, + "loss": 0.1182, + "step": 2060 + }, + { + "epoch": 9.45, + "learning_rate": 0.00013126353790613717, + "loss": 0.1409, + "step": 2061 + }, + { + "epoch": 9.46, + "learning_rate": 0.0001311552346570397, + "loss": 0.2284, + "step": 2062 + }, + { + "epoch": 9.46, + "learning_rate": 0.00013104693140794223, + "loss": 0.0784, + "step": 2063 + }, + { + "epoch": 9.47, + "learning_rate": 0.00013093862815884475, + "loss": 0.0748, + "step": 2064 + }, + { + "epoch": 9.47, + "learning_rate": 0.00013083032490974727, + "loss": 0.0527, + "step": 2065 + }, + { + "epoch": 9.48, + "learning_rate": 0.0001307220216606498, + "loss": 0.0809, + "step": 2066 + }, + { + "epoch": 9.48, + "learning_rate": 0.00013061371841155235, + "loss": 0.1259, + "step": 2067 + }, + { + "epoch": 9.49, + "learning_rate": 0.00013050541516245487, + "loss": 0.1211, + "step": 2068 + }, + { + "epoch": 9.49, + "learning_rate": 0.00013039711191335738, + "loss": 0.1026, + "step": 2069 + }, + { + "epoch": 9.5, + "learning_rate": 0.00013028880866425993, + "loss": 0.0507, + "step": 2070 + }, + { + "epoch": 9.5, + "learning_rate": 0.00013018050541516244, + "loss": 0.1937, + "step": 2071 + }, + { + "epoch": 9.5, + "learning_rate": 0.00013007220216606496, + "loss": 0.1457, + "step": 2072 + }, + { + "epoch": 9.51, + "learning_rate": 0.0001299638989169675, + "loss": 0.2218, + "step": 2073 + }, + { + "epoch": 9.51, + "learning_rate": 0.00012985559566787002, + "loss": 0.0698, + "step": 2074 + }, + { + "epoch": 9.52, + "learning_rate": 0.00012974729241877254, + "loss": 0.1696, + "step": 2075 + }, + { + "epoch": 9.52, + "learning_rate": 0.00012963898916967508, + "loss": 0.1135, + "step": 2076 + }, + { + "epoch": 9.53, + "learning_rate": 0.0001295306859205776, + "loss": 0.0678, + "step": 2077 + }, + { + "epoch": 9.53, + "learning_rate": 0.00012942238267148014, + "loss": 0.1025, + "step": 2078 + }, + { + "epoch": 9.54, + "learning_rate": 0.00012931407942238265, + "loss": 0.0524, + "step": 2079 + }, + { + "epoch": 9.54, + "learning_rate": 0.0001292057761732852, + "loss": 0.0664, + "step": 2080 + }, + { + "epoch": 9.55, + "learning_rate": 0.0001290974729241877, + "loss": 0.0816, + "step": 2081 + }, + { + "epoch": 9.55, + "learning_rate": 0.00012898916967509023, + "loss": 0.0767, + "step": 2082 + }, + { + "epoch": 9.56, + "learning_rate": 0.00012888086642599277, + "loss": 0.1257, + "step": 2083 + }, + { + "epoch": 9.56, + "learning_rate": 0.0001287725631768953, + "loss": 0.0981, + "step": 2084 + }, + { + "epoch": 9.56, + "learning_rate": 0.00012866425992779783, + "loss": 0.0636, + "step": 2085 + }, + { + "epoch": 9.57, + "learning_rate": 0.00012855595667870035, + "loss": 0.1168, + "step": 2086 + }, + { + "epoch": 9.57, + "learning_rate": 0.00012844765342960286, + "loss": 0.3165, + "step": 2087 + }, + { + "epoch": 9.58, + "learning_rate": 0.0001283393501805054, + "loss": 0.0873, + "step": 2088 + }, + { + "epoch": 9.58, + "learning_rate": 0.00012823104693140795, + "loss": 0.0384, + "step": 2089 + }, + { + "epoch": 9.59, + "learning_rate": 0.00012812274368231047, + "loss": 0.1116, + "step": 2090 + }, + { + "epoch": 9.59, + "learning_rate": 0.00012801444043321298, + "loss": 0.0723, + "step": 2091 + }, + { + "epoch": 9.6, + "learning_rate": 0.00012790613718411553, + "loss": 0.0929, + "step": 2092 + }, + { + "epoch": 9.6, + "learning_rate": 0.00012779783393501804, + "loss": 0.089, + "step": 2093 + }, + { + "epoch": 9.61, + "learning_rate": 0.00012768953068592056, + "loss": 0.0723, + "step": 2094 + }, + { + "epoch": 9.61, + "learning_rate": 0.0001275812274368231, + "loss": 0.1179, + "step": 2095 + }, + { + "epoch": 9.61, + "learning_rate": 0.00012747292418772562, + "loss": 0.1956, + "step": 2096 + }, + { + "epoch": 9.62, + "learning_rate": 0.00012736462093862813, + "loss": 0.0582, + "step": 2097 + }, + { + "epoch": 9.62, + "learning_rate": 0.00012725631768953068, + "loss": 0.1803, + "step": 2098 + }, + { + "epoch": 9.63, + "learning_rate": 0.00012714801444043322, + "loss": 0.0975, + "step": 2099 + }, + { + "epoch": 9.63, + "learning_rate": 0.00012703971119133574, + "loss": 0.1597, + "step": 2100 + }, + { + "epoch": 9.63, + "eval_loss": 0.37861549854278564, + "eval_runtime": 19.9945, + "eval_samples_per_second": 82.373, + "eval_steps_per_second": 2.601, + "eval_wer": 0.3697273005821673, + "step": 2100 + }, + { + "epoch": 9.64, + "learning_rate": 0.00012693140794223825, + "loss": 0.133, + "step": 2101 + }, + { + "epoch": 9.64, + "learning_rate": 0.0001268231046931408, + "loss": 0.062, + "step": 2102 + }, + { + "epoch": 9.65, + "learning_rate": 0.0001267148014440433, + "loss": 0.2063, + "step": 2103 + }, + { + "epoch": 9.65, + "learning_rate": 0.00012660649819494583, + "loss": 0.0507, + "step": 2104 + }, + { + "epoch": 9.66, + "learning_rate": 0.00012649819494584837, + "loss": 0.0607, + "step": 2105 + }, + { + "epoch": 9.66, + "learning_rate": 0.0001263898916967509, + "loss": 0.083, + "step": 2106 + }, + { + "epoch": 9.67, + "learning_rate": 0.0001262815884476534, + "loss": 0.1307, + "step": 2107 + }, + { + "epoch": 9.67, + "learning_rate": 0.00012617328519855595, + "loss": 0.1252, + "step": 2108 + }, + { + "epoch": 9.67, + "learning_rate": 0.00012606498194945846, + "loss": 0.0807, + "step": 2109 + }, + { + "epoch": 9.68, + "learning_rate": 0.000125956678700361, + "loss": 0.1, + "step": 2110 + }, + { + "epoch": 9.68, + "learning_rate": 0.00012584837545126352, + "loss": 0.106, + "step": 2111 + }, + { + "epoch": 9.69, + "learning_rate": 0.00012574007220216607, + "loss": 0.2213, + "step": 2112 + }, + { + "epoch": 9.69, + "learning_rate": 0.00012563176895306858, + "loss": 0.148, + "step": 2113 + }, + { + "epoch": 9.7, + "learning_rate": 0.0001255234657039711, + "loss": 0.1197, + "step": 2114 + }, + { + "epoch": 9.7, + "learning_rate": 0.00012541516245487364, + "loss": 0.1234, + "step": 2115 + }, + { + "epoch": 9.71, + "learning_rate": 0.00012530685920577616, + "loss": 0.0666, + "step": 2116 + }, + { + "epoch": 9.71, + "learning_rate": 0.00012519855595667867, + "loss": 0.105, + "step": 2117 + }, + { + "epoch": 9.72, + "learning_rate": 0.00012509025270758122, + "loss": 0.1323, + "step": 2118 + }, + { + "epoch": 9.72, + "learning_rate": 0.00012498194945848373, + "loss": 0.1098, + "step": 2119 + }, + { + "epoch": 9.72, + "learning_rate": 0.00012487364620938628, + "loss": 0.0925, + "step": 2120 + }, + { + "epoch": 9.73, + "learning_rate": 0.0001247653429602888, + "loss": 0.1414, + "step": 2121 + }, + { + "epoch": 9.73, + "learning_rate": 0.00012465703971119134, + "loss": 0.1529, + "step": 2122 + }, + { + "epoch": 9.74, + "learning_rate": 0.00012454873646209385, + "loss": 0.15, + "step": 2123 + }, + { + "epoch": 9.74, + "learning_rate": 0.0001244404332129964, + "loss": 0.2713, + "step": 2124 + }, + { + "epoch": 9.75, + "learning_rate": 0.0001243321299638989, + "loss": 0.1291, + "step": 2125 + }, + { + "epoch": 9.75, + "learning_rate": 0.00012422382671480143, + "loss": 0.0976, + "step": 2126 + }, + { + "epoch": 9.76, + "learning_rate": 0.00012411552346570397, + "loss": 0.0487, + "step": 2127 + }, + { + "epoch": 9.76, + "learning_rate": 0.00012400722021660649, + "loss": 0.0502, + "step": 2128 + }, + { + "epoch": 9.77, + "learning_rate": 0.000123898916967509, + "loss": 0.0817, + "step": 2129 + }, + { + "epoch": 9.77, + "learning_rate": 0.00012379061371841155, + "loss": 0.1108, + "step": 2130 + }, + { + "epoch": 9.78, + "learning_rate": 0.00012368231046931406, + "loss": 0.066, + "step": 2131 + }, + { + "epoch": 9.78, + "learning_rate": 0.0001235740072202166, + "loss": 0.1073, + "step": 2132 + }, + { + "epoch": 9.78, + "learning_rate": 0.00012346570397111912, + "loss": 0.0812, + "step": 2133 + }, + { + "epoch": 9.79, + "learning_rate": 0.00012335740072202166, + "loss": 0.1527, + "step": 2134 + }, + { + "epoch": 9.79, + "learning_rate": 0.00012324909747292418, + "loss": 0.0896, + "step": 2135 + }, + { + "epoch": 9.8, + "learning_rate": 0.0001231407942238267, + "loss": 0.1823, + "step": 2136 + }, + { + "epoch": 9.8, + "learning_rate": 0.00012303249097472924, + "loss": 0.2149, + "step": 2137 + }, + { + "epoch": 9.81, + "learning_rate": 0.00012292418772563176, + "loss": 0.0734, + "step": 2138 + }, + { + "epoch": 9.81, + "learning_rate": 0.00012281588447653427, + "loss": 0.0538, + "step": 2139 + }, + { + "epoch": 9.82, + "learning_rate": 0.00012270758122743682, + "loss": 0.0436, + "step": 2140 + }, + { + "epoch": 9.82, + "learning_rate": 0.00012259927797833933, + "loss": 0.0755, + "step": 2141 + }, + { + "epoch": 9.83, + "learning_rate": 0.00012249097472924185, + "loss": 0.0882, + "step": 2142 + }, + { + "epoch": 9.83, + "learning_rate": 0.0001223826714801444, + "loss": 0.0641, + "step": 2143 + }, + { + "epoch": 9.83, + "learning_rate": 0.00012227436823104693, + "loss": 0.0987, + "step": 2144 + }, + { + "epoch": 9.84, + "learning_rate": 0.00012216606498194945, + "loss": 0.1883, + "step": 2145 + }, + { + "epoch": 9.84, + "learning_rate": 0.00012205776173285198, + "loss": 0.069, + "step": 2146 + }, + { + "epoch": 9.85, + "learning_rate": 0.00012194945848375451, + "loss": 0.0865, + "step": 2147 + }, + { + "epoch": 9.85, + "learning_rate": 0.00012184115523465703, + "loss": 0.1181, + "step": 2148 + }, + { + "epoch": 9.86, + "learning_rate": 0.00012173285198555956, + "loss": 0.1281, + "step": 2149 + }, + { + "epoch": 9.86, + "learning_rate": 0.00012162454873646208, + "loss": 0.2035, + "step": 2150 + }, + { + "epoch": 9.87, + "learning_rate": 0.0001215162454873646, + "loss": 0.0739, + "step": 2151 + }, + { + "epoch": 9.87, + "learning_rate": 0.00012140794223826713, + "loss": 0.0884, + "step": 2152 + }, + { + "epoch": 9.88, + "learning_rate": 0.00012129963898916966, + "loss": 0.1112, + "step": 2153 + }, + { + "epoch": 9.88, + "learning_rate": 0.0001211913357400722, + "loss": 0.0658, + "step": 2154 + }, + { + "epoch": 9.89, + "learning_rate": 0.00012108303249097472, + "loss": 0.0793, + "step": 2155 + }, + { + "epoch": 9.89, + "learning_rate": 0.00012097472924187725, + "loss": 0.0695, + "step": 2156 + }, + { + "epoch": 9.89, + "learning_rate": 0.00012086642599277978, + "loss": 0.1032, + "step": 2157 + }, + { + "epoch": 9.9, + "learning_rate": 0.0001207581227436823, + "loss": 0.1636, + "step": 2158 + }, + { + "epoch": 9.9, + "learning_rate": 0.00012064981949458482, + "loss": 0.1069, + "step": 2159 + }, + { + "epoch": 9.91, + "learning_rate": 0.00012054151624548735, + "loss": 0.1016, + "step": 2160 + }, + { + "epoch": 9.91, + "learning_rate": 0.00012043321299638987, + "loss": 0.1466, + "step": 2161 + }, + { + "epoch": 9.92, + "learning_rate": 0.0001203249097472924, + "loss": 0.152, + "step": 2162 + }, + { + "epoch": 9.92, + "learning_rate": 0.00012021660649819493, + "loss": 0.0996, + "step": 2163 + }, + { + "epoch": 9.93, + "learning_rate": 0.00012010830324909747, + "loss": 0.0886, + "step": 2164 + }, + { + "epoch": 9.93, + "learning_rate": 0.00011999999999999999, + "loss": 0.0676, + "step": 2165 + }, + { + "epoch": 9.94, + "learning_rate": 0.00011989169675090252, + "loss": 0.1048, + "step": 2166 + }, + { + "epoch": 9.94, + "learning_rate": 0.00011978339350180505, + "loss": 0.0768, + "step": 2167 + }, + { + "epoch": 9.94, + "learning_rate": 0.00011967509025270758, + "loss": 0.0554, + "step": 2168 + }, + { + "epoch": 9.95, + "learning_rate": 0.0001195667870036101, + "loss": 0.0643, + "step": 2169 + }, + { + "epoch": 9.95, + "learning_rate": 0.00011945848375451262, + "loss": 0.0451, + "step": 2170 + }, + { + "epoch": 9.96, + "learning_rate": 0.00011935018050541515, + "loss": 0.1358, + "step": 2171 + }, + { + "epoch": 9.96, + "learning_rate": 0.00011924187725631767, + "loss": 0.1142, + "step": 2172 + }, + { + "epoch": 9.97, + "learning_rate": 0.0001191335740072202, + "loss": 0.0548, + "step": 2173 + }, + { + "epoch": 9.97, + "learning_rate": 0.00011902527075812273, + "loss": 0.1387, + "step": 2174 + }, + { + "epoch": 9.98, + "learning_rate": 0.00011891696750902527, + "loss": 0.1143, + "step": 2175 + }, + { + "epoch": 9.98, + "learning_rate": 0.00011880866425992779, + "loss": 0.0734, + "step": 2176 + }, + { + "epoch": 9.99, + "learning_rate": 0.00011870036101083032, + "loss": 0.0873, + "step": 2177 + }, + { + "epoch": 9.99, + "learning_rate": 0.00011859205776173285, + "loss": 0.1724, + "step": 2178 + }, + { + "epoch": 10.0, + "learning_rate": 0.00011848375451263536, + "loss": 0.0919, + "step": 2179 + }, + { + "epoch": 10.0, + "learning_rate": 0.0001183754512635379, + "loss": 0.2433, + "step": 2180 + }, + { + "epoch": 10.0, + "learning_rate": 0.00011826714801444042, + "loss": 0.0573, + "step": 2181 + }, + { + "epoch": 10.01, + "learning_rate": 0.00011815884476534295, + "loss": 0.0603, + "step": 2182 + }, + { + "epoch": 10.01, + "learning_rate": 0.00011805054151624547, + "loss": 0.0857, + "step": 2183 + }, + { + "epoch": 10.02, + "learning_rate": 0.000117942238267148, + "loss": 0.0444, + "step": 2184 + }, + { + "epoch": 10.02, + "learning_rate": 0.00011783393501805053, + "loss": 0.0726, + "step": 2185 + }, + { + "epoch": 10.03, + "learning_rate": 0.00011772563176895307, + "loss": 0.0773, + "step": 2186 + }, + { + "epoch": 10.03, + "learning_rate": 0.00011761732851985559, + "loss": 0.071, + "step": 2187 + }, + { + "epoch": 10.04, + "learning_rate": 0.00011750902527075812, + "loss": 0.0614, + "step": 2188 + }, + { + "epoch": 10.04, + "learning_rate": 0.00011740072202166065, + "loss": 0.0957, + "step": 2189 + }, + { + "epoch": 10.05, + "learning_rate": 0.00011729241877256316, + "loss": 0.1084, + "step": 2190 + }, + { + "epoch": 10.05, + "learning_rate": 0.0001171841155234657, + "loss": 0.0529, + "step": 2191 + }, + { + "epoch": 10.06, + "learning_rate": 0.00011707581227436822, + "loss": 0.1818, + "step": 2192 + }, + { + "epoch": 10.06, + "learning_rate": 0.00011696750902527074, + "loss": 0.1391, + "step": 2193 + }, + { + "epoch": 10.06, + "learning_rate": 0.00011685920577617327, + "loss": 0.0567, + "step": 2194 + }, + { + "epoch": 10.07, + "learning_rate": 0.0001167509025270758, + "loss": 0.0846, + "step": 2195 + }, + { + "epoch": 10.07, + "learning_rate": 0.00011664259927797831, + "loss": 0.0906, + "step": 2196 + }, + { + "epoch": 10.08, + "learning_rate": 0.00011653429602888086, + "loss": 0.0783, + "step": 2197 + }, + { + "epoch": 10.08, + "learning_rate": 0.00011642599277978339, + "loss": 0.0764, + "step": 2198 + }, + { + "epoch": 10.09, + "learning_rate": 0.00011631768953068592, + "loss": 0.0639, + "step": 2199 + }, + { + "epoch": 10.09, + "learning_rate": 0.00011620938628158845, + "loss": 0.1124, + "step": 2200 + }, + { + "epoch": 10.09, + "eval_loss": 0.3946552574634552, + "eval_runtime": 19.834, + "eval_samples_per_second": 83.039, + "eval_steps_per_second": 2.622, + "eval_wer": 0.35900316617301603, + "step": 2200 + }, + { + "epoch": 10.1, + "learning_rate": 0.00011610108303249096, + "loss": 0.083, + "step": 2201 + }, + { + "epoch": 10.1, + "learning_rate": 0.00011599277978339349, + "loss": 0.1369, + "step": 2202 + }, + { + "epoch": 10.11, + "learning_rate": 0.00011588447653429602, + "loss": 0.1721, + "step": 2203 + }, + { + "epoch": 10.11, + "learning_rate": 0.00011577617328519854, + "loss": 0.1586, + "step": 2204 + }, + { + "epoch": 10.11, + "learning_rate": 0.00011566787003610107, + "loss": 0.0972, + "step": 2205 + }, + { + "epoch": 10.12, + "learning_rate": 0.0001155595667870036, + "loss": 0.0555, + "step": 2206 + }, + { + "epoch": 10.12, + "learning_rate": 0.00011545126353790611, + "loss": 0.0368, + "step": 2207 + }, + { + "epoch": 10.13, + "learning_rate": 0.00011534296028880866, + "loss": 0.0728, + "step": 2208 + }, + { + "epoch": 10.13, + "learning_rate": 0.00011523465703971119, + "loss": 0.0581, + "step": 2209 + }, + { + "epoch": 10.14, + "learning_rate": 0.00011512635379061372, + "loss": 0.069, + "step": 2210 + }, + { + "epoch": 10.14, + "learning_rate": 0.00011501805054151623, + "loss": 0.113, + "step": 2211 + }, + { + "epoch": 10.15, + "learning_rate": 0.00011490974729241876, + "loss": 0.1064, + "step": 2212 + }, + { + "epoch": 10.15, + "learning_rate": 0.00011480144404332129, + "loss": 0.0824, + "step": 2213 + }, + { + "epoch": 10.16, + "learning_rate": 0.00011469314079422381, + "loss": 0.1239, + "step": 2214 + }, + { + "epoch": 10.16, + "learning_rate": 0.00011458483754512634, + "loss": 0.1385, + "step": 2215 + }, + { + "epoch": 10.17, + "learning_rate": 0.00011447653429602887, + "loss": 0.1078, + "step": 2216 + }, + { + "epoch": 10.17, + "learning_rate": 0.0001143682310469314, + "loss": 0.0481, + "step": 2217 + }, + { + "epoch": 10.17, + "learning_rate": 0.00011425992779783391, + "loss": 0.1172, + "step": 2218 + }, + { + "epoch": 10.18, + "learning_rate": 0.00011415162454873646, + "loss": 0.0694, + "step": 2219 + }, + { + "epoch": 10.18, + "learning_rate": 0.00011404332129963899, + "loss": 0.0764, + "step": 2220 + }, + { + "epoch": 10.19, + "learning_rate": 0.00011393501805054152, + "loss": 0.1115, + "step": 2221 + }, + { + "epoch": 10.19, + "learning_rate": 0.00011382671480144403, + "loss": 0.0933, + "step": 2222 + }, + { + "epoch": 10.2, + "learning_rate": 0.00011371841155234656, + "loss": 0.0593, + "step": 2223 + }, + { + "epoch": 10.2, + "learning_rate": 0.00011361010830324909, + "loss": 0.0678, + "step": 2224 + }, + { + "epoch": 10.21, + "learning_rate": 0.00011350180505415161, + "loss": 0.0794, + "step": 2225 + }, + { + "epoch": 10.21, + "learning_rate": 0.00011339350180505414, + "loss": 0.0907, + "step": 2226 + }, + { + "epoch": 10.22, + "learning_rate": 0.00011328519855595667, + "loss": 0.1233, + "step": 2227 + }, + { + "epoch": 10.22, + "learning_rate": 0.00011317689530685918, + "loss": 0.0812, + "step": 2228 + }, + { + "epoch": 10.22, + "learning_rate": 0.00011306859205776173, + "loss": 0.058, + "step": 2229 + }, + { + "epoch": 10.23, + "learning_rate": 0.00011296028880866426, + "loss": 0.1144, + "step": 2230 + }, + { + "epoch": 10.23, + "learning_rate": 0.00011285198555956679, + "loss": 0.0783, + "step": 2231 + }, + { + "epoch": 10.24, + "learning_rate": 0.0001127436823104693, + "loss": 0.0568, + "step": 2232 + }, + { + "epoch": 10.24, + "learning_rate": 0.00011263537906137183, + "loss": 0.0304, + "step": 2233 + }, + { + "epoch": 10.25, + "learning_rate": 0.00011252707581227436, + "loss": 0.0522, + "step": 2234 + }, + { + "epoch": 10.25, + "learning_rate": 0.00011241877256317689, + "loss": 0.0519, + "step": 2235 + }, + { + "epoch": 10.26, + "learning_rate": 0.00011231046931407941, + "loss": 0.1177, + "step": 2236 + }, + { + "epoch": 10.26, + "learning_rate": 0.00011220216606498194, + "loss": 0.0918, + "step": 2237 + }, + { + "epoch": 10.27, + "learning_rate": 0.00011209386281588447, + "loss": 0.1255, + "step": 2238 + }, + { + "epoch": 10.27, + "learning_rate": 0.00011198555956678698, + "loss": 0.1038, + "step": 2239 + }, + { + "epoch": 10.28, + "learning_rate": 0.00011187725631768953, + "loss": 0.0551, + "step": 2240 + }, + { + "epoch": 10.28, + "learning_rate": 0.00011176895306859206, + "loss": 0.1189, + "step": 2241 + }, + { + "epoch": 10.28, + "learning_rate": 0.00011166064981949458, + "loss": 0.1689, + "step": 2242 + }, + { + "epoch": 10.29, + "learning_rate": 0.0001115523465703971, + "loss": 0.1234, + "step": 2243 + }, + { + "epoch": 10.29, + "learning_rate": 0.00011144404332129963, + "loss": 0.0491, + "step": 2244 + }, + { + "epoch": 10.3, + "learning_rate": 0.00011133574007220216, + "loss": 0.0612, + "step": 2245 + }, + { + "epoch": 10.3, + "learning_rate": 0.00011122743682310468, + "loss": 0.075, + "step": 2246 + }, + { + "epoch": 10.31, + "learning_rate": 0.0001111191335740072, + "loss": 0.0539, + "step": 2247 + }, + { + "epoch": 10.31, + "learning_rate": 0.00011101083032490974, + "loss": 0.0573, + "step": 2248 + }, + { + "epoch": 10.32, + "learning_rate": 0.00011090252707581225, + "loss": 0.0668, + "step": 2249 + }, + { + "epoch": 10.32, + "learning_rate": 0.00011079422382671478, + "loss": 0.0437, + "step": 2250 + }, + { + "epoch": 10.33, + "learning_rate": 0.00011068592057761732, + "loss": 0.1596, + "step": 2251 + }, + { + "epoch": 10.33, + "learning_rate": 0.00011057761732851985, + "loss": 0.0589, + "step": 2252 + }, + { + "epoch": 10.33, + "learning_rate": 0.00011046931407942237, + "loss": 0.143, + "step": 2253 + }, + { + "epoch": 10.34, + "learning_rate": 0.0001103610108303249, + "loss": 0.142, + "step": 2254 + }, + { + "epoch": 10.34, + "learning_rate": 0.00011025270758122743, + "loss": 0.2014, + "step": 2255 + }, + { + "epoch": 10.35, + "learning_rate": 0.00011014440433212996, + "loss": 0.0469, + "step": 2256 + }, + { + "epoch": 10.35, + "learning_rate": 0.00011003610108303248, + "loss": 0.0433, + "step": 2257 + }, + { + "epoch": 10.36, + "learning_rate": 0.000109927797833935, + "loss": 0.0393, + "step": 2258 + }, + { + "epoch": 10.36, + "learning_rate": 0.00010981949458483754, + "loss": 0.0276, + "step": 2259 + }, + { + "epoch": 10.37, + "learning_rate": 0.00010971119133574005, + "loss": 0.033, + "step": 2260 + }, + { + "epoch": 10.37, + "learning_rate": 0.00010960288808664258, + "loss": 0.0889, + "step": 2261 + }, + { + "epoch": 10.38, + "learning_rate": 0.00010949458483754512, + "loss": 0.1641, + "step": 2262 + }, + { + "epoch": 10.38, + "learning_rate": 0.00010938628158844765, + "loss": 0.0916, + "step": 2263 + }, + { + "epoch": 10.39, + "learning_rate": 0.00010927797833935017, + "loss": 0.0207, + "step": 2264 + }, + { + "epoch": 10.39, + "learning_rate": 0.0001091696750902527, + "loss": 0.093, + "step": 2265 + }, + { + "epoch": 10.39, + "learning_rate": 0.00010906137184115523, + "loss": 0.1004, + "step": 2266 + }, + { + "epoch": 10.4, + "learning_rate": 0.00010895306859205775, + "loss": 0.1744, + "step": 2267 + }, + { + "epoch": 10.4, + "learning_rate": 0.00010884476534296028, + "loss": 0.0832, + "step": 2268 + }, + { + "epoch": 10.41, + "learning_rate": 0.0001087364620938628, + "loss": 0.057, + "step": 2269 + }, + { + "epoch": 10.41, + "learning_rate": 0.00010862815884476533, + "loss": 0.0547, + "step": 2270 + }, + { + "epoch": 10.42, + "learning_rate": 0.00010851985559566785, + "loss": 0.0537, + "step": 2271 + }, + { + "epoch": 10.42, + "learning_rate": 0.00010841155234657038, + "loss": 0.0928, + "step": 2272 + }, + { + "epoch": 10.43, + "learning_rate": 0.00010830324909747292, + "loss": 0.0645, + "step": 2273 + }, + { + "epoch": 10.43, + "learning_rate": 0.00010819494584837545, + "loss": 0.0599, + "step": 2274 + }, + { + "epoch": 10.44, + "learning_rate": 0.00010808664259927797, + "loss": 0.0697, + "step": 2275 + }, + { + "epoch": 10.44, + "learning_rate": 0.0001079783393501805, + "loss": 0.0781, + "step": 2276 + }, + { + "epoch": 10.44, + "learning_rate": 0.00010787003610108303, + "loss": 0.1216, + "step": 2277 + }, + { + "epoch": 10.45, + "learning_rate": 0.00010776173285198554, + "loss": 0.0708, + "step": 2278 + }, + { + "epoch": 10.45, + "learning_rate": 0.00010765342960288807, + "loss": 0.0761, + "step": 2279 + }, + { + "epoch": 10.46, + "learning_rate": 0.0001075451263537906, + "loss": 0.0533, + "step": 2280 + }, + { + "epoch": 10.46, + "learning_rate": 0.00010743682310469312, + "loss": 0.0854, + "step": 2281 + }, + { + "epoch": 10.47, + "learning_rate": 0.00010732851985559565, + "loss": 0.051, + "step": 2282 + }, + { + "epoch": 10.47, + "learning_rate": 0.0001072202166064982, + "loss": 0.0453, + "step": 2283 + }, + { + "epoch": 10.48, + "learning_rate": 0.00010711191335740072, + "loss": 0.0525, + "step": 2284 + }, + { + "epoch": 10.48, + "learning_rate": 0.00010700361010830324, + "loss": 0.0956, + "step": 2285 + }, + { + "epoch": 10.49, + "learning_rate": 0.00010689530685920577, + "loss": 0.0174, + "step": 2286 + }, + { + "epoch": 10.49, + "learning_rate": 0.0001067870036101083, + "loss": 0.0962, + "step": 2287 + }, + { + "epoch": 10.5, + "learning_rate": 0.00010667870036101083, + "loss": 0.156, + "step": 2288 + }, + { + "epoch": 10.5, + "learning_rate": 0.00010657039711191334, + "loss": 0.0889, + "step": 2289 + }, + { + "epoch": 10.5, + "learning_rate": 0.00010646209386281587, + "loss": 0.0327, + "step": 2290 + }, + { + "epoch": 10.51, + "learning_rate": 0.0001063537906137184, + "loss": 0.0514, + "step": 2291 + }, + { + "epoch": 10.51, + "learning_rate": 0.00010624548736462092, + "loss": 0.0672, + "step": 2292 + }, + { + "epoch": 10.52, + "learning_rate": 0.00010613718411552345, + "loss": 0.0475, + "step": 2293 + }, + { + "epoch": 10.52, + "learning_rate": 0.00010602888086642599, + "loss": 0.1079, + "step": 2294 + }, + { + "epoch": 10.53, + "learning_rate": 0.00010592057761732852, + "loss": 0.0894, + "step": 2295 + }, + { + "epoch": 10.53, + "learning_rate": 0.00010581227436823104, + "loss": 0.1625, + "step": 2296 + }, + { + "epoch": 10.54, + "learning_rate": 0.00010570397111913357, + "loss": 0.0996, + "step": 2297 + }, + { + "epoch": 10.54, + "learning_rate": 0.0001055956678700361, + "loss": 0.0618, + "step": 2298 + }, + { + "epoch": 10.55, + "learning_rate": 0.00010548736462093861, + "loss": 0.1074, + "step": 2299 + }, + { + "epoch": 10.55, + "learning_rate": 0.00010537906137184114, + "loss": 0.0965, + "step": 2300 + }, + { + "epoch": 10.55, + "eval_loss": 0.3952449858188629, + "eval_runtime": 20.0329, + "eval_samples_per_second": 82.215, + "eval_steps_per_second": 2.596, + "eval_wer": 0.35624553161066286, + "step": 2300 + }, + { + "epoch": 10.56, + "learning_rate": 0.00010527075812274367, + "loss": 0.0852, + "step": 2301 + }, + { + "epoch": 10.56, + "learning_rate": 0.00010516245487364619, + "loss": 0.1513, + "step": 2302 + }, + { + "epoch": 10.56, + "learning_rate": 0.00010505415162454872, + "loss": 0.0603, + "step": 2303 + }, + { + "epoch": 10.57, + "learning_rate": 0.00010494584837545125, + "loss": 0.1101, + "step": 2304 + }, + { + "epoch": 10.57, + "learning_rate": 0.00010483754512635379, + "loss": 0.1866, + "step": 2305 + }, + { + "epoch": 10.58, + "learning_rate": 0.00010472924187725631, + "loss": 0.07, + "step": 2306 + }, + { + "epoch": 10.58, + "learning_rate": 0.00010462093862815884, + "loss": 0.0655, + "step": 2307 + }, + { + "epoch": 10.59, + "learning_rate": 0.00010451263537906137, + "loss": 0.0576, + "step": 2308 + }, + { + "epoch": 10.59, + "learning_rate": 0.0001044043321299639, + "loss": 0.102, + "step": 2309 + }, + { + "epoch": 10.6, + "learning_rate": 0.00010429602888086641, + "loss": 0.1277, + "step": 2310 + }, + { + "epoch": 10.6, + "learning_rate": 0.00010418772563176894, + "loss": 0.0789, + "step": 2311 + }, + { + "epoch": 10.61, + "learning_rate": 0.00010407942238267147, + "loss": 0.0677, + "step": 2312 + }, + { + "epoch": 10.61, + "learning_rate": 0.00010397111913357399, + "loss": 0.0639, + "step": 2313 + }, + { + "epoch": 10.61, + "learning_rate": 0.00010386281588447652, + "loss": 0.0828, + "step": 2314 + }, + { + "epoch": 10.62, + "learning_rate": 0.00010375451263537905, + "loss": 0.1267, + "step": 2315 + }, + { + "epoch": 10.62, + "learning_rate": 0.00010364620938628159, + "loss": 0.0793, + "step": 2316 + }, + { + "epoch": 10.63, + "learning_rate": 0.00010353790613718411, + "loss": 0.1298, + "step": 2317 + }, + { + "epoch": 10.63, + "learning_rate": 0.00010342960288808664, + "loss": 0.0712, + "step": 2318 + }, + { + "epoch": 10.64, + "learning_rate": 0.00010332129963898917, + "loss": 0.0811, + "step": 2319 + }, + { + "epoch": 10.64, + "learning_rate": 0.00010321299638989168, + "loss": 0.0751, + "step": 2320 + }, + { + "epoch": 10.65, + "learning_rate": 0.00010310469314079421, + "loss": 0.0636, + "step": 2321 + }, + { + "epoch": 10.65, + "learning_rate": 0.00010299638989169674, + "loss": 0.1031, + "step": 2322 + }, + { + "epoch": 10.66, + "learning_rate": 0.00010288808664259927, + "loss": 0.136, + "step": 2323 + }, + { + "epoch": 10.66, + "learning_rate": 0.00010277978339350179, + "loss": 0.0561, + "step": 2324 + }, + { + "epoch": 10.67, + "learning_rate": 0.00010267148014440432, + "loss": 0.0839, + "step": 2325 + }, + { + "epoch": 10.67, + "learning_rate": 0.00010256317689530685, + "loss": 0.1188, + "step": 2326 + }, + { + "epoch": 10.67, + "learning_rate": 0.00010245487364620939, + "loss": 0.1294, + "step": 2327 + }, + { + "epoch": 10.68, + "learning_rate": 0.00010234657039711191, + "loss": 0.1334, + "step": 2328 + }, + { + "epoch": 10.68, + "learning_rate": 0.00010223826714801444, + "loss": 0.1386, + "step": 2329 + }, + { + "epoch": 10.69, + "learning_rate": 0.00010212996389891697, + "loss": 0.1955, + "step": 2330 + }, + { + "epoch": 10.69, + "learning_rate": 0.00010202166064981948, + "loss": 0.029, + "step": 2331 + }, + { + "epoch": 10.7, + "learning_rate": 0.00010191335740072201, + "loss": 0.1054, + "step": 2332 + }, + { + "epoch": 10.7, + "learning_rate": 0.00010180505415162454, + "loss": 0.0696, + "step": 2333 + }, + { + "epoch": 10.71, + "learning_rate": 0.00010169675090252706, + "loss": 0.0927, + "step": 2334 + }, + { + "epoch": 10.71, + "learning_rate": 0.00010158844765342959, + "loss": 0.103, + "step": 2335 + }, + { + "epoch": 10.72, + "learning_rate": 0.00010148014440433212, + "loss": 0.0703, + "step": 2336 + }, + { + "epoch": 10.72, + "learning_rate": 0.00010137184115523463, + "loss": 0.1277, + "step": 2337 + }, + { + "epoch": 10.72, + "learning_rate": 0.00010126353790613718, + "loss": 0.0836, + "step": 2338 + }, + { + "epoch": 10.73, + "learning_rate": 0.0001011552346570397, + "loss": 0.0965, + "step": 2339 + }, + { + "epoch": 10.73, + "learning_rate": 0.00010104693140794224, + "loss": 0.0577, + "step": 2340 + }, + { + "epoch": 10.74, + "learning_rate": 0.00010093862815884475, + "loss": 0.071, + "step": 2341 + }, + { + "epoch": 10.74, + "learning_rate": 0.00010083032490974728, + "loss": 0.0878, + "step": 2342 + }, + { + "epoch": 10.75, + "learning_rate": 0.00010072202166064981, + "loss": 0.1419, + "step": 2343 + }, + { + "epoch": 10.75, + "learning_rate": 0.00010061371841155234, + "loss": 0.0555, + "step": 2344 + }, + { + "epoch": 10.76, + "learning_rate": 0.00010050541516245486, + "loss": 0.0941, + "step": 2345 + }, + { + "epoch": 10.76, + "learning_rate": 0.00010039711191335739, + "loss": 0.0328, + "step": 2346 + }, + { + "epoch": 10.77, + "learning_rate": 0.00010028880866425992, + "loss": 0.0718, + "step": 2347 + }, + { + "epoch": 10.77, + "learning_rate": 0.00010018050541516246, + "loss": 0.0774, + "step": 2348 + }, + { + "epoch": 10.78, + "learning_rate": 0.00010007220216606498, + "loss": 0.0788, + "step": 2349 + }, + { + "epoch": 10.78, + "learning_rate": 9.99638989169675e-05, + "loss": 0.0892, + "step": 2350 + }, + { + "epoch": 10.78, + "learning_rate": 9.985559566787004e-05, + "loss": 0.1171, + "step": 2351 + }, + { + "epoch": 10.79, + "learning_rate": 9.974729241877255e-05, + "loss": 0.0917, + "step": 2352 + }, + { + "epoch": 10.79, + "learning_rate": 9.963898916967508e-05, + "loss": 0.1061, + "step": 2353 + }, + { + "epoch": 10.8, + "learning_rate": 9.953068592057761e-05, + "loss": 0.0849, + "step": 2354 + }, + { + "epoch": 10.8, + "learning_rate": 9.942238267148013e-05, + "loss": 0.2185, + "step": 2355 + }, + { + "epoch": 10.81, + "learning_rate": 9.931407942238266e-05, + "loss": 0.0425, + "step": 2356 + }, + { + "epoch": 10.81, + "learning_rate": 9.920577617328519e-05, + "loss": 0.091, + "step": 2357 + }, + { + "epoch": 10.82, + "learning_rate": 9.909747292418772e-05, + "loss": 0.0907, + "step": 2358 + }, + { + "epoch": 10.82, + "learning_rate": 9.898916967509025e-05, + "loss": 0.0751, + "step": 2359 + }, + { + "epoch": 10.83, + "learning_rate": 9.888086642599278e-05, + "loss": 0.083, + "step": 2360 + }, + { + "epoch": 10.83, + "learning_rate": 9.87725631768953e-05, + "loss": 0.063, + "step": 2361 + }, + { + "epoch": 10.83, + "learning_rate": 9.866425992779783e-05, + "loss": 0.1762, + "step": 2362 + }, + { + "epoch": 10.84, + "learning_rate": 9.855595667870035e-05, + "loss": 0.0844, + "step": 2363 + }, + { + "epoch": 10.84, + "learning_rate": 9.844765342960288e-05, + "loss": 0.1032, + "step": 2364 + }, + { + "epoch": 10.85, + "learning_rate": 9.833935018050541e-05, + "loss": 0.1372, + "step": 2365 + }, + { + "epoch": 10.85, + "learning_rate": 9.823104693140793e-05, + "loss": 0.1547, + "step": 2366 + }, + { + "epoch": 10.86, + "learning_rate": 9.812274368231046e-05, + "loss": 0.2023, + "step": 2367 + }, + { + "epoch": 10.86, + "learning_rate": 9.801444043321299e-05, + "loss": 0.0635, + "step": 2368 + }, + { + "epoch": 10.87, + "learning_rate": 9.79061371841155e-05, + "loss": 0.0716, + "step": 2369 + }, + { + "epoch": 10.87, + "learning_rate": 9.779783393501805e-05, + "loss": 0.0814, + "step": 2370 + }, + { + "epoch": 10.88, + "learning_rate": 9.768953068592057e-05, + "loss": 0.0666, + "step": 2371 + }, + { + "epoch": 10.88, + "learning_rate": 9.75812274368231e-05, + "loss": 0.0787, + "step": 2372 + }, + { + "epoch": 10.89, + "learning_rate": 9.747292418772562e-05, + "loss": 0.1062, + "step": 2373 + }, + { + "epoch": 10.89, + "learning_rate": 9.736462093862815e-05, + "loss": 0.0599, + "step": 2374 + }, + { + "epoch": 10.89, + "learning_rate": 9.725631768953068e-05, + "loss": 0.1157, + "step": 2375 + }, + { + "epoch": 10.9, + "learning_rate": 9.714801444043321e-05, + "loss": 0.1443, + "step": 2376 + }, + { + "epoch": 10.9, + "learning_rate": 9.703971119133573e-05, + "loss": 0.0812, + "step": 2377 + }, + { + "epoch": 10.91, + "learning_rate": 9.693140794223826e-05, + "loss": 0.1497, + "step": 2378 + }, + { + "epoch": 10.91, + "learning_rate": 9.682310469314079e-05, + "loss": 0.1307, + "step": 2379 + }, + { + "epoch": 10.92, + "learning_rate": 9.67148014440433e-05, + "loss": 0.2658, + "step": 2380 + }, + { + "epoch": 10.92, + "learning_rate": 9.660649819494584e-05, + "loss": 0.0666, + "step": 2381 + }, + { + "epoch": 10.93, + "learning_rate": 9.649819494584837e-05, + "loss": 0.0976, + "step": 2382 + }, + { + "epoch": 10.93, + "learning_rate": 9.63898916967509e-05, + "loss": 0.0587, + "step": 2383 + }, + { + "epoch": 10.94, + "learning_rate": 9.628158844765342e-05, + "loss": 0.0898, + "step": 2384 + }, + { + "epoch": 10.94, + "learning_rate": 9.617328519855595e-05, + "loss": 0.1123, + "step": 2385 + }, + { + "epoch": 10.94, + "learning_rate": 9.606498194945848e-05, + "loss": 0.0723, + "step": 2386 + }, + { + "epoch": 10.95, + "learning_rate": 9.5956678700361e-05, + "loss": 0.0891, + "step": 2387 + }, + { + "epoch": 10.95, + "learning_rate": 9.584837545126353e-05, + "loss": 0.09, + "step": 2388 + }, + { + "epoch": 10.96, + "learning_rate": 9.574007220216605e-05, + "loss": 0.0523, + "step": 2389 + }, + { + "epoch": 10.96, + "learning_rate": 9.563176895306857e-05, + "loss": 0.1646, + "step": 2390 + }, + { + "epoch": 10.97, + "learning_rate": 9.55234657039711e-05, + "loss": 0.1236, + "step": 2391 + }, + { + "epoch": 10.97, + "learning_rate": 9.541516245487364e-05, + "loss": 0.1521, + "step": 2392 + }, + { + "epoch": 10.98, + "learning_rate": 9.530685920577617e-05, + "loss": 0.1041, + "step": 2393 + }, + { + "epoch": 10.98, + "learning_rate": 9.519855595667869e-05, + "loss": 0.0945, + "step": 2394 + }, + { + "epoch": 10.99, + "learning_rate": 9.509025270758122e-05, + "loss": 0.0973, + "step": 2395 + }, + { + "epoch": 10.99, + "learning_rate": 9.498194945848375e-05, + "loss": 0.0753, + "step": 2396 + }, + { + "epoch": 11.0, + "learning_rate": 9.487364620938628e-05, + "loss": 0.1107, + "step": 2397 + }, + { + "epoch": 11.0, + "learning_rate": 9.47653429602888e-05, + "loss": 0.0432, + "step": 2398 + }, + { + "epoch": 11.0, + "learning_rate": 9.465703971119132e-05, + "loss": 0.0433, + "step": 2399 + }, + { + "epoch": 11.01, + "learning_rate": 9.454873646209385e-05, + "loss": 0.0612, + "step": 2400 + }, + { + "epoch": 11.01, + "eval_loss": 0.3809739351272583, + "eval_runtime": 19.8118, + "eval_samples_per_second": 83.132, + "eval_steps_per_second": 2.625, + "eval_wer": 0.34756408946992134, + "step": 2400 + }, + { + "epoch": 11.01, + "learning_rate": 9.444043321299637e-05, + "loss": 0.1233, + "step": 2401 + }, + { + "epoch": 11.02, + "learning_rate": 9.433212996389891e-05, + "loss": 0.0818, + "step": 2402 + }, + { + "epoch": 11.02, + "learning_rate": 9.422382671480144e-05, + "loss": 0.0699, + "step": 2403 + }, + { + "epoch": 11.03, + "learning_rate": 9.411552346570397e-05, + "loss": 0.0724, + "step": 2404 + }, + { + "epoch": 11.03, + "learning_rate": 9.400722021660649e-05, + "loss": 0.0877, + "step": 2405 + }, + { + "epoch": 11.04, + "learning_rate": 9.389891696750902e-05, + "loss": 0.0873, + "step": 2406 + }, + { + "epoch": 11.04, + "learning_rate": 9.379061371841155e-05, + "loss": 0.0881, + "step": 2407 + }, + { + "epoch": 11.05, + "learning_rate": 9.368231046931406e-05, + "loss": 0.0812, + "step": 2408 + }, + { + "epoch": 11.05, + "learning_rate": 9.35740072202166e-05, + "loss": 0.1183, + "step": 2409 + }, + { + "epoch": 11.06, + "learning_rate": 9.346570397111912e-05, + "loss": 0.1181, + "step": 2410 + }, + { + "epoch": 11.06, + "learning_rate": 9.335740072202165e-05, + "loss": 0.0816, + "step": 2411 + }, + { + "epoch": 11.06, + "learning_rate": 9.324909747292417e-05, + "loss": 0.071, + "step": 2412 + }, + { + "epoch": 11.07, + "learning_rate": 9.314079422382671e-05, + "loss": 0.0218, + "step": 2413 + }, + { + "epoch": 11.07, + "learning_rate": 9.303249097472924e-05, + "loss": 0.1017, + "step": 2414 + }, + { + "epoch": 11.08, + "learning_rate": 9.292418772563177e-05, + "loss": 0.0674, + "step": 2415 + }, + { + "epoch": 11.08, + "learning_rate": 9.281588447653429e-05, + "loss": 0.0352, + "step": 2416 + }, + { + "epoch": 11.09, + "learning_rate": 9.270758122743682e-05, + "loss": 0.1346, + "step": 2417 + }, + { + "epoch": 11.09, + "learning_rate": 9.259927797833935e-05, + "loss": 0.0708, + "step": 2418 + }, + { + "epoch": 11.1, + "learning_rate": 9.249097472924186e-05, + "loss": 0.1342, + "step": 2419 + }, + { + "epoch": 11.1, + "learning_rate": 9.23826714801444e-05, + "loss": 0.1233, + "step": 2420 + }, + { + "epoch": 11.11, + "learning_rate": 9.227436823104692e-05, + "loss": 0.1057, + "step": 2421 + }, + { + "epoch": 11.11, + "learning_rate": 9.216606498194944e-05, + "loss": 0.0898, + "step": 2422 + }, + { + "epoch": 11.11, + "learning_rate": 9.205776173285197e-05, + "loss": 0.1001, + "step": 2423 + }, + { + "epoch": 11.12, + "learning_rate": 9.194945848375451e-05, + "loss": 0.1079, + "step": 2424 + }, + { + "epoch": 11.12, + "learning_rate": 9.184115523465704e-05, + "loss": 0.063, + "step": 2425 + }, + { + "epoch": 11.13, + "learning_rate": 9.173285198555956e-05, + "loss": 0.0587, + "step": 2426 + }, + { + "epoch": 11.13, + "learning_rate": 9.162454873646209e-05, + "loss": 0.1096, + "step": 2427 + }, + { + "epoch": 11.14, + "learning_rate": 9.151624548736462e-05, + "loss": 0.1014, + "step": 2428 + }, + { + "epoch": 11.14, + "learning_rate": 9.140794223826713e-05, + "loss": 0.1042, + "step": 2429 + }, + { + "epoch": 11.15, + "learning_rate": 9.129963898916966e-05, + "loss": 0.0756, + "step": 2430 + }, + { + "epoch": 11.15, + "learning_rate": 9.119133574007219e-05, + "loss": 0.0579, + "step": 2431 + }, + { + "epoch": 11.16, + "learning_rate": 9.108303249097472e-05, + "loss": 0.0568, + "step": 2432 + }, + { + "epoch": 11.16, + "learning_rate": 9.097472924187724e-05, + "loss": 0.1529, + "step": 2433 + }, + { + "epoch": 11.17, + "learning_rate": 9.086642599277977e-05, + "loss": 0.106, + "step": 2434 + }, + { + "epoch": 11.17, + "learning_rate": 9.075812274368231e-05, + "loss": 0.1274, + "step": 2435 + }, + { + "epoch": 11.17, + "learning_rate": 9.064981949458484e-05, + "loss": 0.0524, + "step": 2436 + }, + { + "epoch": 11.18, + "learning_rate": 9.054151624548736e-05, + "loss": 0.0403, + "step": 2437 + }, + { + "epoch": 11.18, + "learning_rate": 9.043321299638989e-05, + "loss": 0.04, + "step": 2438 + }, + { + "epoch": 11.19, + "learning_rate": 9.032490974729242e-05, + "loss": 0.0982, + "step": 2439 + }, + { + "epoch": 11.19, + "learning_rate": 9.021660649819493e-05, + "loss": 0.0608, + "step": 2440 + }, + { + "epoch": 11.2, + "learning_rate": 9.010830324909746e-05, + "loss": 0.0594, + "step": 2441 + }, + { + "epoch": 11.2, + "learning_rate": 8.999999999999999e-05, + "loss": 0.048, + "step": 2442 + }, + { + "epoch": 11.21, + "learning_rate": 8.989169675090251e-05, + "loss": 0.085, + "step": 2443 + }, + { + "epoch": 11.21, + "learning_rate": 8.978339350180504e-05, + "loss": 0.1139, + "step": 2444 + }, + { + "epoch": 11.22, + "learning_rate": 8.967509025270757e-05, + "loss": 0.1235, + "step": 2445 + }, + { + "epoch": 11.22, + "learning_rate": 8.956678700361011e-05, + "loss": 0.1417, + "step": 2446 + }, + { + "epoch": 11.22, + "learning_rate": 8.945848375451263e-05, + "loss": 0.1003, + "step": 2447 + }, + { + "epoch": 11.23, + "learning_rate": 8.935018050541516e-05, + "loss": 0.0544, + "step": 2448 + }, + { + "epoch": 11.23, + "learning_rate": 8.924187725631769e-05, + "loss": 0.0745, + "step": 2449 + }, + { + "epoch": 11.24, + "learning_rate": 8.913357400722022e-05, + "loss": 0.0686, + "step": 2450 + }, + { + "epoch": 11.24, + "learning_rate": 8.902527075812273e-05, + "loss": 0.0589, + "step": 2451 + }, + { + "epoch": 11.25, + "learning_rate": 8.891696750902526e-05, + "loss": 0.092, + "step": 2452 + }, + { + "epoch": 11.25, + "learning_rate": 8.880866425992779e-05, + "loss": 0.0822, + "step": 2453 + }, + { + "epoch": 11.26, + "learning_rate": 8.870036101083031e-05, + "loss": 0.0555, + "step": 2454 + }, + { + "epoch": 11.26, + "learning_rate": 8.859205776173284e-05, + "loss": 0.1457, + "step": 2455 + }, + { + "epoch": 11.27, + "learning_rate": 8.848375451263537e-05, + "loss": 0.0784, + "step": 2456 + }, + { + "epoch": 11.27, + "learning_rate": 8.837545126353791e-05, + "loss": 0.0526, + "step": 2457 + }, + { + "epoch": 11.28, + "learning_rate": 8.826714801444043e-05, + "loss": 0.1147, + "step": 2458 + }, + { + "epoch": 11.28, + "learning_rate": 8.815884476534296e-05, + "loss": 0.1329, + "step": 2459 + }, + { + "epoch": 11.28, + "learning_rate": 8.805054151624549e-05, + "loss": 0.0948, + "step": 2460 + }, + { + "epoch": 11.29, + "learning_rate": 8.7942238267148e-05, + "loss": 0.1025, + "step": 2461 + }, + { + "epoch": 11.29, + "learning_rate": 8.783393501805053e-05, + "loss": 0.0469, + "step": 2462 + }, + { + "epoch": 11.3, + "learning_rate": 8.772563176895306e-05, + "loss": 0.1012, + "step": 2463 + }, + { + "epoch": 11.3, + "learning_rate": 8.761732851985559e-05, + "loss": 0.0554, + "step": 2464 + }, + { + "epoch": 11.31, + "learning_rate": 8.750902527075811e-05, + "loss": 0.0383, + "step": 2465 + }, + { + "epoch": 11.31, + "learning_rate": 8.740072202166064e-05, + "loss": 0.05, + "step": 2466 + }, + { + "epoch": 11.32, + "learning_rate": 8.729241877256318e-05, + "loss": 0.0684, + "step": 2467 + }, + { + "epoch": 11.32, + "learning_rate": 8.718411552346571e-05, + "loss": 0.1015, + "step": 2468 + }, + { + "epoch": 11.33, + "learning_rate": 8.707581227436823e-05, + "loss": 0.0963, + "step": 2469 + }, + { + "epoch": 11.33, + "learning_rate": 8.696750902527076e-05, + "loss": 0.1549, + "step": 2470 + }, + { + "epoch": 11.33, + "learning_rate": 8.685920577617329e-05, + "loss": 0.0823, + "step": 2471 + }, + { + "epoch": 11.34, + "learning_rate": 8.67509025270758e-05, + "loss": 0.1264, + "step": 2472 + }, + { + "epoch": 11.34, + "learning_rate": 8.664259927797833e-05, + "loss": 0.1072, + "step": 2473 + }, + { + "epoch": 11.35, + "learning_rate": 8.653429602888086e-05, + "loss": 0.0333, + "step": 2474 + }, + { + "epoch": 11.35, + "learning_rate": 8.642599277978338e-05, + "loss": 0.0421, + "step": 2475 + }, + { + "epoch": 11.36, + "learning_rate": 8.63176895306859e-05, + "loss": 0.0824, + "step": 2476 + }, + { + "epoch": 11.36, + "learning_rate": 8.620938628158844e-05, + "loss": 0.0802, + "step": 2477 + }, + { + "epoch": 11.37, + "learning_rate": 8.610108303249098e-05, + "loss": 0.0673, + "step": 2478 + }, + { + "epoch": 11.37, + "learning_rate": 8.59927797833935e-05, + "loss": 0.0403, + "step": 2479 + }, + { + "epoch": 11.38, + "learning_rate": 8.588447653429603e-05, + "loss": 0.1085, + "step": 2480 + }, + { + "epoch": 11.38, + "learning_rate": 8.577617328519855e-05, + "loss": 0.0698, + "step": 2481 + }, + { + "epoch": 11.39, + "learning_rate": 8.566787003610107e-05, + "loss": 0.1091, + "step": 2482 + }, + { + "epoch": 11.39, + "learning_rate": 8.55595667870036e-05, + "loss": 0.1215, + "step": 2483 + }, + { + "epoch": 11.39, + "learning_rate": 8.545126353790613e-05, + "loss": 0.1193, + "step": 2484 + }, + { + "epoch": 11.4, + "learning_rate": 8.534296028880866e-05, + "loss": 0.0636, + "step": 2485 + }, + { + "epoch": 11.4, + "learning_rate": 8.523465703971118e-05, + "loss": 0.08, + "step": 2486 + }, + { + "epoch": 11.41, + "learning_rate": 8.51263537906137e-05, + "loss": 0.0758, + "step": 2487 + }, + { + "epoch": 11.41, + "learning_rate": 8.501805054151624e-05, + "loss": 0.0939, + "step": 2488 + }, + { + "epoch": 11.42, + "learning_rate": 8.490974729241878e-05, + "loss": 0.0701, + "step": 2489 + }, + { + "epoch": 11.42, + "learning_rate": 8.48014440433213e-05, + "loss": 0.1779, + "step": 2490 + }, + { + "epoch": 11.43, + "learning_rate": 8.469314079422382e-05, + "loss": 0.0501, + "step": 2491 + }, + { + "epoch": 11.43, + "learning_rate": 8.458483754512635e-05, + "loss": 0.1288, + "step": 2492 + }, + { + "epoch": 11.44, + "learning_rate": 8.447653429602887e-05, + "loss": 0.0663, + "step": 2493 + }, + { + "epoch": 11.44, + "learning_rate": 8.43682310469314e-05, + "loss": 0.0862, + "step": 2494 + }, + { + "epoch": 11.44, + "learning_rate": 8.425992779783393e-05, + "loss": 0.0977, + "step": 2495 + }, + { + "epoch": 11.45, + "learning_rate": 8.415162454873645e-05, + "loss": 0.1128, + "step": 2496 + }, + { + "epoch": 11.45, + "learning_rate": 8.404332129963898e-05, + "loss": 0.1604, + "step": 2497 + }, + { + "epoch": 11.46, + "learning_rate": 8.39350180505415e-05, + "loss": 0.134, + "step": 2498 + }, + { + "epoch": 11.46, + "learning_rate": 8.382671480144403e-05, + "loss": 0.0899, + "step": 2499 + }, + { + "epoch": 11.47, + "learning_rate": 8.371841155234656e-05, + "loss": 0.0764, + "step": 2500 + }, + { + "epoch": 11.47, + "eval_loss": 0.373426616191864, + "eval_runtime": 19.8845, + "eval_samples_per_second": 82.828, + "eval_steps_per_second": 2.615, + "eval_wer": 0.3507302624859565, + "step": 2500 + }, + { + "epoch": 11.47, + "learning_rate": 8.36101083032491e-05, + "loss": 0.0673, + "step": 2501 + }, + { + "epoch": 11.48, + "learning_rate": 8.350180505415162e-05, + "loss": 0.0845, + "step": 2502 + }, + { + "epoch": 11.48, + "learning_rate": 8.339350180505415e-05, + "loss": 0.0639, + "step": 2503 + }, + { + "epoch": 11.49, + "learning_rate": 8.328519855595667e-05, + "loss": 0.072, + "step": 2504 + }, + { + "epoch": 11.49, + "learning_rate": 8.31768953068592e-05, + "loss": 0.1118, + "step": 2505 + }, + { + "epoch": 11.5, + "learning_rate": 8.306859205776173e-05, + "loss": 0.088, + "step": 2506 + }, + { + "epoch": 11.5, + "learning_rate": 8.296028880866425e-05, + "loss": 0.1168, + "step": 2507 + }, + { + "epoch": 11.5, + "learning_rate": 8.285198555956677e-05, + "loss": 0.0516, + "step": 2508 + }, + { + "epoch": 11.51, + "learning_rate": 8.27436823104693e-05, + "loss": 0.098, + "step": 2509 + }, + { + "epoch": 11.51, + "learning_rate": 8.263537906137182e-05, + "loss": 0.1277, + "step": 2510 + }, + { + "epoch": 11.52, + "learning_rate": 8.252707581227436e-05, + "loss": 0.0742, + "step": 2511 + }, + { + "epoch": 11.52, + "learning_rate": 8.24187725631769e-05, + "loss": 0.0688, + "step": 2512 + }, + { + "epoch": 11.53, + "learning_rate": 8.231046931407942e-05, + "loss": 0.0497, + "step": 2513 + }, + { + "epoch": 11.53, + "learning_rate": 8.220216606498194e-05, + "loss": 0.0399, + "step": 2514 + }, + { + "epoch": 11.54, + "learning_rate": 8.209386281588447e-05, + "loss": 0.0459, + "step": 2515 + }, + { + "epoch": 11.54, + "learning_rate": 8.1985559566787e-05, + "loss": 0.0295, + "step": 2516 + }, + { + "epoch": 11.55, + "learning_rate": 8.187725631768951e-05, + "loss": 0.0582, + "step": 2517 + }, + { + "epoch": 11.55, + "learning_rate": 8.176895306859204e-05, + "loss": 0.0554, + "step": 2518 + }, + { + "epoch": 11.56, + "learning_rate": 8.166064981949457e-05, + "loss": 0.1264, + "step": 2519 + }, + { + "epoch": 11.56, + "learning_rate": 8.15523465703971e-05, + "loss": 0.0685, + "step": 2520 + }, + { + "epoch": 11.56, + "learning_rate": 8.144404332129963e-05, + "loss": 0.1232, + "step": 2521 + }, + { + "epoch": 11.57, + "learning_rate": 8.133574007220216e-05, + "loss": 0.1014, + "step": 2522 + }, + { + "epoch": 11.57, + "learning_rate": 8.122743682310469e-05, + "loss": 0.0594, + "step": 2523 + }, + { + "epoch": 11.58, + "learning_rate": 8.111913357400722e-05, + "loss": 0.0662, + "step": 2524 + }, + { + "epoch": 11.58, + "learning_rate": 8.101083032490974e-05, + "loss": 0.0458, + "step": 2525 + }, + { + "epoch": 11.59, + "learning_rate": 8.090252707581227e-05, + "loss": 0.0872, + "step": 2526 + }, + { + "epoch": 11.59, + "learning_rate": 8.07942238267148e-05, + "loss": 0.0617, + "step": 2527 + }, + { + "epoch": 11.6, + "learning_rate": 8.068592057761731e-05, + "loss": 0.0626, + "step": 2528 + }, + { + "epoch": 11.6, + "learning_rate": 8.057761732851984e-05, + "loss": 0.0598, + "step": 2529 + }, + { + "epoch": 11.61, + "learning_rate": 8.046931407942237e-05, + "loss": 0.0699, + "step": 2530 + }, + { + "epoch": 11.61, + "learning_rate": 8.036101083032489e-05, + "loss": 0.0821, + "step": 2531 + }, + { + "epoch": 11.61, + "learning_rate": 8.025270758122743e-05, + "loss": 0.099, + "step": 2532 + }, + { + "epoch": 11.62, + "learning_rate": 8.014440433212996e-05, + "loss": 0.082, + "step": 2533 + }, + { + "epoch": 11.62, + "learning_rate": 8.003610108303249e-05, + "loss": 0.0381, + "step": 2534 + }, + { + "epoch": 11.63, + "learning_rate": 7.992779783393501e-05, + "loss": 0.1058, + "step": 2535 + }, + { + "epoch": 11.63, + "learning_rate": 7.981949458483754e-05, + "loss": 0.0506, + "step": 2536 + }, + { + "epoch": 11.64, + "learning_rate": 7.971119133574007e-05, + "loss": 0.0608, + "step": 2537 + }, + { + "epoch": 11.64, + "learning_rate": 7.96028880866426e-05, + "loss": 0.0586, + "step": 2538 + }, + { + "epoch": 11.65, + "learning_rate": 7.949458483754511e-05, + "loss": 0.0651, + "step": 2539 + }, + { + "epoch": 11.65, + "learning_rate": 7.938628158844764e-05, + "loss": 0.0963, + "step": 2540 + }, + { + "epoch": 11.66, + "learning_rate": 7.927797833935017e-05, + "loss": 0.1036, + "step": 2541 + }, + { + "epoch": 11.66, + "learning_rate": 7.916967509025269e-05, + "loss": 0.0293, + "step": 2542 + }, + { + "epoch": 11.67, + "learning_rate": 7.906137184115523e-05, + "loss": 0.133, + "step": 2543 + }, + { + "epoch": 11.67, + "learning_rate": 7.895306859205776e-05, + "loss": 0.0868, + "step": 2544 + }, + { + "epoch": 11.67, + "learning_rate": 7.884476534296029e-05, + "loss": 0.0679, + "step": 2545 + }, + { + "epoch": 11.68, + "learning_rate": 7.873646209386281e-05, + "loss": 0.0826, + "step": 2546 + }, + { + "epoch": 11.68, + "learning_rate": 7.862815884476534e-05, + "loss": 0.0697, + "step": 2547 + }, + { + "epoch": 11.69, + "learning_rate": 7.851985559566787e-05, + "loss": 0.1218, + "step": 2548 + }, + { + "epoch": 11.69, + "learning_rate": 7.841155234657038e-05, + "loss": 0.0452, + "step": 2549 + }, + { + "epoch": 11.7, + "learning_rate": 7.830324909747291e-05, + "loss": 0.0498, + "step": 2550 + }, + { + "epoch": 11.7, + "learning_rate": 7.819494584837544e-05, + "loss": 0.0546, + "step": 2551 + }, + { + "epoch": 11.71, + "learning_rate": 7.808664259927797e-05, + "loss": 0.0934, + "step": 2552 + }, + { + "epoch": 11.71, + "learning_rate": 7.797833935018049e-05, + "loss": 0.0559, + "step": 2553 + }, + { + "epoch": 11.72, + "learning_rate": 7.787003610108303e-05, + "loss": 0.0634, + "step": 2554 + }, + { + "epoch": 11.72, + "learning_rate": 7.776173285198556e-05, + "loss": 0.0361, + "step": 2555 + }, + { + "epoch": 11.72, + "learning_rate": 7.765342960288809e-05, + "loss": 0.0535, + "step": 2556 + }, + { + "epoch": 11.73, + "learning_rate": 7.754512635379061e-05, + "loss": 0.063, + "step": 2557 + }, + { + "epoch": 11.73, + "learning_rate": 7.743682310469314e-05, + "loss": 0.1123, + "step": 2558 + }, + { + "epoch": 11.74, + "learning_rate": 7.732851985559567e-05, + "loss": 0.1017, + "step": 2559 + }, + { + "epoch": 11.74, + "learning_rate": 7.722021660649818e-05, + "loss": 0.116, + "step": 2560 + }, + { + "epoch": 11.75, + "learning_rate": 7.711191335740071e-05, + "loss": 0.0512, + "step": 2561 + }, + { + "epoch": 11.75, + "learning_rate": 7.700361010830324e-05, + "loss": 0.0455, + "step": 2562 + }, + { + "epoch": 11.76, + "learning_rate": 7.689530685920576e-05, + "loss": 0.0091, + "step": 2563 + }, + { + "epoch": 11.76, + "learning_rate": 7.678700361010829e-05, + "loss": 0.0478, + "step": 2564 + }, + { + "epoch": 11.77, + "learning_rate": 7.667870036101083e-05, + "loss": 0.055, + "step": 2565 + }, + { + "epoch": 11.77, + "learning_rate": 7.657039711191336e-05, + "loss": 0.1064, + "step": 2566 + }, + { + "epoch": 11.78, + "learning_rate": 7.646209386281588e-05, + "loss": 0.0565, + "step": 2567 + }, + { + "epoch": 11.78, + "learning_rate": 7.63537906137184e-05, + "loss": 0.0666, + "step": 2568 + }, + { + "epoch": 11.78, + "learning_rate": 7.624548736462094e-05, + "loss": 0.0975, + "step": 2569 + }, + { + "epoch": 11.79, + "learning_rate": 7.613718411552345e-05, + "loss": 0.1109, + "step": 2570 + }, + { + "epoch": 11.79, + "learning_rate": 7.602888086642598e-05, + "loss": 0.1284, + "step": 2571 + }, + { + "epoch": 11.8, + "learning_rate": 7.592057761732851e-05, + "loss": 0.0694, + "step": 2572 + }, + { + "epoch": 11.8, + "learning_rate": 7.581227436823104e-05, + "loss": 0.1434, + "step": 2573 + }, + { + "epoch": 11.81, + "learning_rate": 7.570397111913356e-05, + "loss": 0.0444, + "step": 2574 + }, + { + "epoch": 11.81, + "learning_rate": 7.559566787003609e-05, + "loss": 0.0361, + "step": 2575 + }, + { + "epoch": 11.82, + "learning_rate": 7.548736462093863e-05, + "loss": 0.0986, + "step": 2576 + }, + { + "epoch": 11.82, + "learning_rate": 7.537906137184116e-05, + "loss": 0.055, + "step": 2577 + }, + { + "epoch": 11.83, + "learning_rate": 7.527075812274368e-05, + "loss": 0.119, + "step": 2578 + }, + { + "epoch": 11.83, + "learning_rate": 7.51624548736462e-05, + "loss": 0.0284, + "step": 2579 + }, + { + "epoch": 11.83, + "learning_rate": 7.505415162454874e-05, + "loss": 0.048, + "step": 2580 + }, + { + "epoch": 11.84, + "learning_rate": 7.494584837545125e-05, + "loss": 0.0361, + "step": 2581 + }, + { + "epoch": 11.84, + "learning_rate": 7.483754512635378e-05, + "loss": 0.0679, + "step": 2582 + }, + { + "epoch": 11.85, + "learning_rate": 7.472924187725631e-05, + "loss": 0.1195, + "step": 2583 + }, + { + "epoch": 11.85, + "learning_rate": 7.462093862815884e-05, + "loss": 0.1171, + "step": 2584 + }, + { + "epoch": 11.86, + "learning_rate": 7.451263537906137e-05, + "loss": 0.0753, + "step": 2585 + }, + { + "epoch": 11.86, + "learning_rate": 7.440433212996389e-05, + "loss": 0.0419, + "step": 2586 + }, + { + "epoch": 11.87, + "learning_rate": 7.429602888086642e-05, + "loss": 0.0489, + "step": 2587 + }, + { + "epoch": 11.87, + "learning_rate": 7.418772563176895e-05, + "loss": 0.0502, + "step": 2588 + }, + { + "epoch": 11.88, + "learning_rate": 7.407942238267148e-05, + "loss": 0.0699, + "step": 2589 + }, + { + "epoch": 11.88, + "learning_rate": 7.3971119133574e-05, + "loss": 0.0234, + "step": 2590 + }, + { + "epoch": 11.89, + "learning_rate": 7.386281588447653e-05, + "loss": 0.0402, + "step": 2591 + }, + { + "epoch": 11.89, + "learning_rate": 7.375451263537905e-05, + "loss": 0.0593, + "step": 2592 + }, + { + "epoch": 11.89, + "learning_rate": 7.364620938628158e-05, + "loss": 0.0686, + "step": 2593 + }, + { + "epoch": 11.9, + "learning_rate": 7.353790613718411e-05, + "loss": 0.1017, + "step": 2594 + }, + { + "epoch": 11.9, + "learning_rate": 7.342960288808664e-05, + "loss": 0.0612, + "step": 2595 + }, + { + "epoch": 11.91, + "learning_rate": 7.332129963898917e-05, + "loss": 0.0676, + "step": 2596 + }, + { + "epoch": 11.91, + "learning_rate": 7.321299638989169e-05, + "loss": 0.1205, + "step": 2597 + }, + { + "epoch": 11.92, + "learning_rate": 7.310469314079422e-05, + "loss": 0.1177, + "step": 2598 + }, + { + "epoch": 11.92, + "learning_rate": 7.299638989169675e-05, + "loss": 0.0446, + "step": 2599 + }, + { + "epoch": 11.93, + "learning_rate": 7.288808664259927e-05, + "loss": 0.0973, + "step": 2600 + }, + { + "epoch": 11.93, + "eval_loss": 0.3934902846813202, + "eval_runtime": 20.4281, + "eval_samples_per_second": 80.624, + "eval_steps_per_second": 2.546, + "eval_wer": 0.3471555510162394, + "step": 2600 + }, + { + "epoch": 11.93, + "learning_rate": 7.27797833935018e-05, + "loss": 0.0472, + "step": 2601 + }, + { + "epoch": 11.94, + "learning_rate": 7.267148014440432e-05, + "loss": 0.0756, + "step": 2602 + }, + { + "epoch": 11.94, + "learning_rate": 7.256317689530685e-05, + "loss": 0.0715, + "step": 2603 + }, + { + "epoch": 11.94, + "learning_rate": 7.245487364620938e-05, + "loss": 0.0708, + "step": 2604 + }, + { + "epoch": 11.95, + "learning_rate": 7.234657039711191e-05, + "loss": 0.0846, + "step": 2605 + }, + { + "epoch": 11.95, + "learning_rate": 7.223826714801444e-05, + "loss": 0.0689, + "step": 2606 + }, + { + "epoch": 11.96, + "learning_rate": 7.212996389891696e-05, + "loss": 0.1136, + "step": 2607 + }, + { + "epoch": 11.96, + "learning_rate": 7.202166064981949e-05, + "loss": 0.043, + "step": 2608 + }, + { + "epoch": 11.97, + "learning_rate": 7.191335740072201e-05, + "loss": 0.1078, + "step": 2609 + }, + { + "epoch": 11.97, + "learning_rate": 7.180505415162454e-05, + "loss": 0.2061, + "step": 2610 + }, + { + "epoch": 11.98, + "learning_rate": 7.169675090252707e-05, + "loss": 0.0788, + "step": 2611 + }, + { + "epoch": 11.98, + "learning_rate": 7.15884476534296e-05, + "loss": 0.0674, + "step": 2612 + }, + { + "epoch": 11.99, + "learning_rate": 7.148014440433212e-05, + "loss": 0.0592, + "step": 2613 + }, + { + "epoch": 11.99, + "learning_rate": 7.137184115523465e-05, + "loss": 0.0645, + "step": 2614 + }, + { + "epoch": 12.0, + "learning_rate": 7.126353790613718e-05, + "loss": 0.0469, + "step": 2615 + }, + { + "epoch": 12.0, + "learning_rate": 7.115523465703971e-05, + "loss": 0.0848, + "step": 2616 + }, + { + "epoch": 12.0, + "learning_rate": 7.104693140794224e-05, + "loss": 0.0584, + "step": 2617 + }, + { + "epoch": 12.01, + "learning_rate": 7.093862815884475e-05, + "loss": 0.0555, + "step": 2618 + }, + { + "epoch": 12.01, + "learning_rate": 7.083032490974728e-05, + "loss": 0.0717, + "step": 2619 + }, + { + "epoch": 12.02, + "learning_rate": 7.072202166064981e-05, + "loss": 0.053, + "step": 2620 + }, + { + "epoch": 12.02, + "learning_rate": 7.061371841155233e-05, + "loss": 0.0523, + "step": 2621 + }, + { + "epoch": 12.03, + "learning_rate": 7.050541516245487e-05, + "loss": 0.0985, + "step": 2622 + }, + { + "epoch": 12.03, + "learning_rate": 7.039711191335739e-05, + "loss": 0.1255, + "step": 2623 + }, + { + "epoch": 12.04, + "learning_rate": 7.028880866425992e-05, + "loss": 0.0561, + "step": 2624 + }, + { + "epoch": 12.04, + "learning_rate": 7.018050541516245e-05, + "loss": 0.0928, + "step": 2625 + }, + { + "epoch": 12.05, + "learning_rate": 7.007220216606498e-05, + "loss": 0.136, + "step": 2626 + }, + { + "epoch": 12.05, + "learning_rate": 6.996389891696751e-05, + "loss": 0.0891, + "step": 2627 + }, + { + "epoch": 12.06, + "learning_rate": 6.985559566787004e-05, + "loss": 0.0712, + "step": 2628 + }, + { + "epoch": 12.06, + "learning_rate": 6.974729241877255e-05, + "loss": 0.1849, + "step": 2629 + }, + { + "epoch": 12.06, + "learning_rate": 6.963898916967508e-05, + "loss": 0.076, + "step": 2630 + }, + { + "epoch": 12.07, + "learning_rate": 6.953068592057761e-05, + "loss": 0.0319, + "step": 2631 + }, + { + "epoch": 12.07, + "learning_rate": 6.942238267148014e-05, + "loss": 0.0873, + "step": 2632 + }, + { + "epoch": 12.08, + "learning_rate": 6.931407942238267e-05, + "loss": 0.0689, + "step": 2633 + }, + { + "epoch": 12.08, + "learning_rate": 6.920577617328519e-05, + "loss": 0.0772, + "step": 2634 + }, + { + "epoch": 12.09, + "learning_rate": 6.909747292418772e-05, + "loss": 0.082, + "step": 2635 + }, + { + "epoch": 12.09, + "learning_rate": 6.898916967509025e-05, + "loss": 0.1242, + "step": 2636 + }, + { + "epoch": 12.1, + "learning_rate": 6.888086642599276e-05, + "loss": 0.105, + "step": 2637 + }, + { + "epoch": 12.1, + "learning_rate": 6.877256317689531e-05, + "loss": 0.1563, + "step": 2638 + }, + { + "epoch": 12.11, + "learning_rate": 6.866425992779782e-05, + "loss": 0.0462, + "step": 2639 + }, + { + "epoch": 12.11, + "learning_rate": 6.855595667870035e-05, + "loss": 0.1554, + "step": 2640 + }, + { + "epoch": 12.11, + "learning_rate": 6.844765342960288e-05, + "loss": 0.0927, + "step": 2641 + }, + { + "epoch": 12.12, + "learning_rate": 6.833935018050541e-05, + "loss": 0.0689, + "step": 2642 + }, + { + "epoch": 12.12, + "learning_rate": 6.823104693140794e-05, + "loss": 0.0763, + "step": 2643 + }, + { + "epoch": 12.13, + "learning_rate": 6.812274368231047e-05, + "loss": 0.0486, + "step": 2644 + }, + { + "epoch": 12.13, + "learning_rate": 6.801444043321299e-05, + "loss": 0.0838, + "step": 2645 + }, + { + "epoch": 12.14, + "learning_rate": 6.790613718411552e-05, + "loss": 0.0754, + "step": 2646 + }, + { + "epoch": 12.14, + "learning_rate": 6.779783393501805e-05, + "loss": 0.0876, + "step": 2647 + }, + { + "epoch": 12.15, + "learning_rate": 6.768953068592056e-05, + "loss": 0.0613, + "step": 2648 + }, + { + "epoch": 12.15, + "learning_rate": 6.758122743682311e-05, + "loss": 0.0675, + "step": 2649 + }, + { + "epoch": 12.16, + "learning_rate": 6.747292418772562e-05, + "loss": 0.0653, + "step": 2650 + }, + { + "epoch": 12.16, + "learning_rate": 6.736462093862815e-05, + "loss": 0.0831, + "step": 2651 + }, + { + "epoch": 12.17, + "learning_rate": 6.725631768953068e-05, + "loss": 0.1811, + "step": 2652 + }, + { + "epoch": 12.17, + "learning_rate": 6.71480144404332e-05, + "loss": 0.1188, + "step": 2653 + }, + { + "epoch": 12.17, + "learning_rate": 6.703971119133574e-05, + "loss": 0.069, + "step": 2654 + }, + { + "epoch": 12.18, + "learning_rate": 6.693140794223826e-05, + "loss": 0.054, + "step": 2655 + }, + { + "epoch": 12.18, + "learning_rate": 6.682310469314079e-05, + "loss": 0.0336, + "step": 2656 + }, + { + "epoch": 12.19, + "learning_rate": 6.671480144404332e-05, + "loss": 0.0827, + "step": 2657 + }, + { + "epoch": 12.19, + "learning_rate": 6.660649819494583e-05, + "loss": 0.0499, + "step": 2658 + }, + { + "epoch": 12.2, + "learning_rate": 6.649819494584838e-05, + "loss": 0.0177, + "step": 2659 + }, + { + "epoch": 12.2, + "learning_rate": 6.638989169675089e-05, + "loss": 0.1054, + "step": 2660 + }, + { + "epoch": 12.21, + "learning_rate": 6.628158844765342e-05, + "loss": 0.051, + "step": 2661 + }, + { + "epoch": 12.21, + "learning_rate": 6.617328519855595e-05, + "loss": 0.057, + "step": 2662 + }, + { + "epoch": 12.22, + "learning_rate": 6.606498194945848e-05, + "loss": 0.0925, + "step": 2663 + }, + { + "epoch": 12.22, + "learning_rate": 6.5956678700361e-05, + "loss": 0.1569, + "step": 2664 + }, + { + "epoch": 12.22, + "learning_rate": 6.584837545126354e-05, + "loss": 0.0661, + "step": 2665 + }, + { + "epoch": 12.23, + "learning_rate": 6.574007220216606e-05, + "loss": 0.041, + "step": 2666 + }, + { + "epoch": 12.23, + "learning_rate": 6.563176895306859e-05, + "loss": 0.0762, + "step": 2667 + }, + { + "epoch": 12.24, + "learning_rate": 6.552346570397112e-05, + "loss": 0.0773, + "step": 2668 + }, + { + "epoch": 12.24, + "learning_rate": 6.541516245487363e-05, + "loss": 0.0771, + "step": 2669 + }, + { + "epoch": 12.25, + "learning_rate": 6.530685920577618e-05, + "loss": 0.0583, + "step": 2670 + }, + { + "epoch": 12.25, + "learning_rate": 6.519855595667869e-05, + "loss": 0.1068, + "step": 2671 + }, + { + "epoch": 12.26, + "learning_rate": 6.509025270758122e-05, + "loss": 0.0858, + "step": 2672 + }, + { + "epoch": 12.26, + "learning_rate": 6.498194945848375e-05, + "loss": 0.0981, + "step": 2673 + }, + { + "epoch": 12.27, + "learning_rate": 6.487364620938627e-05, + "loss": 0.101, + "step": 2674 + }, + { + "epoch": 12.27, + "learning_rate": 6.47653429602888e-05, + "loss": 0.0595, + "step": 2675 + }, + { + "epoch": 12.28, + "learning_rate": 6.465703971119133e-05, + "loss": 0.0937, + "step": 2676 + }, + { + "epoch": 12.28, + "learning_rate": 6.454873646209386e-05, + "loss": 0.0665, + "step": 2677 + }, + { + "epoch": 12.28, + "learning_rate": 6.444043321299639e-05, + "loss": 0.0827, + "step": 2678 + }, + { + "epoch": 12.29, + "learning_rate": 6.433212996389892e-05, + "loss": 0.0949, + "step": 2679 + }, + { + "epoch": 12.29, + "learning_rate": 6.422382671480143e-05, + "loss": 0.0601, + "step": 2680 + }, + { + "epoch": 12.3, + "learning_rate": 6.411552346570398e-05, + "loss": 0.0508, + "step": 2681 + }, + { + "epoch": 12.3, + "learning_rate": 6.400722021660649e-05, + "loss": 0.0899, + "step": 2682 + }, + { + "epoch": 12.31, + "learning_rate": 6.389891696750902e-05, + "loss": 0.0634, + "step": 2683 + }, + { + "epoch": 12.31, + "learning_rate": 6.379061371841155e-05, + "loss": 0.0732, + "step": 2684 + }, + { + "epoch": 12.32, + "learning_rate": 6.368231046931407e-05, + "loss": 0.083, + "step": 2685 + }, + { + "epoch": 12.32, + "learning_rate": 6.357400722021661e-05, + "loss": 0.0553, + "step": 2686 + }, + { + "epoch": 12.33, + "learning_rate": 6.346570397111913e-05, + "loss": 0.0693, + "step": 2687 + }, + { + "epoch": 12.33, + "learning_rate": 6.335740072202166e-05, + "loss": 0.0756, + "step": 2688 + }, + { + "epoch": 12.33, + "learning_rate": 6.324909747292419e-05, + "loss": 0.0924, + "step": 2689 + }, + { + "epoch": 12.34, + "learning_rate": 6.31407942238267e-05, + "loss": 0.1721, + "step": 2690 + }, + { + "epoch": 12.34, + "learning_rate": 6.303249097472923e-05, + "loss": 0.1924, + "step": 2691 + }, + { + "epoch": 12.35, + "learning_rate": 6.292418772563176e-05, + "loss": 0.069, + "step": 2692 + }, + { + "epoch": 12.35, + "learning_rate": 6.281588447653429e-05, + "loss": 0.061, + "step": 2693 + }, + { + "epoch": 12.36, + "learning_rate": 6.270758122743682e-05, + "loss": 0.0577, + "step": 2694 + }, + { + "epoch": 12.36, + "learning_rate": 6.259927797833934e-05, + "loss": 0.0789, + "step": 2695 + }, + { + "epoch": 12.37, + "learning_rate": 6.249097472924187e-05, + "loss": 0.0752, + "step": 2696 + }, + { + "epoch": 12.37, + "learning_rate": 6.23826714801444e-05, + "loss": 0.076, + "step": 2697 + }, + { + "epoch": 12.38, + "learning_rate": 6.227436823104693e-05, + "loss": 0.0596, + "step": 2698 + }, + { + "epoch": 12.38, + "learning_rate": 6.216606498194946e-05, + "loss": 0.0754, + "step": 2699 + }, + { + "epoch": 12.39, + "learning_rate": 6.205776173285199e-05, + "loss": 0.0649, + "step": 2700 + }, + { + "epoch": 12.39, + "eval_loss": 0.36723965406417847, + "eval_runtime": 21.047, + "eval_samples_per_second": 78.253, + "eval_steps_per_second": 2.471, + "eval_wer": 0.3413338780512716, + "step": 2700 + }, + { + "epoch": 12.39, + "learning_rate": 6.19494584837545e-05, + "loss": 0.0721, + "step": 2701 + }, + { + "epoch": 12.39, + "learning_rate": 6.184115523465703e-05, + "loss": 0.0654, + "step": 2702 + }, + { + "epoch": 12.4, + "learning_rate": 6.173285198555956e-05, + "loss": 0.2383, + "step": 2703 + }, + { + "epoch": 12.4, + "learning_rate": 6.162454873646209e-05, + "loss": 0.1634, + "step": 2704 + }, + { + "epoch": 12.41, + "learning_rate": 6.151624548736462e-05, + "loss": 0.0545, + "step": 2705 + }, + { + "epoch": 12.41, + "learning_rate": 6.140794223826714e-05, + "loss": 0.092, + "step": 2706 + }, + { + "epoch": 12.42, + "learning_rate": 6.129963898916967e-05, + "loss": 0.0653, + "step": 2707 + }, + { + "epoch": 12.42, + "learning_rate": 6.11913357400722e-05, + "loss": 0.062, + "step": 2708 + }, + { + "epoch": 12.43, + "learning_rate": 6.108303249097473e-05, + "loss": 0.0416, + "step": 2709 + }, + { + "epoch": 12.43, + "learning_rate": 6.0974729241877255e-05, + "loss": 0.0352, + "step": 2710 + }, + { + "epoch": 12.44, + "learning_rate": 6.086642599277978e-05, + "loss": 0.0469, + "step": 2711 + }, + { + "epoch": 12.44, + "learning_rate": 6.07581227436823e-05, + "loss": 0.0515, + "step": 2712 + }, + { + "epoch": 12.44, + "learning_rate": 6.064981949458483e-05, + "loss": 0.1064, + "step": 2713 + }, + { + "epoch": 12.45, + "learning_rate": 6.054151624548736e-05, + "loss": 0.0819, + "step": 2714 + }, + { + "epoch": 12.45, + "learning_rate": 6.043321299638989e-05, + "loss": 0.1183, + "step": 2715 + }, + { + "epoch": 12.46, + "learning_rate": 6.032490974729241e-05, + "loss": 0.0342, + "step": 2716 + }, + { + "epoch": 12.46, + "learning_rate": 6.0216606498194935e-05, + "loss": 0.0291, + "step": 2717 + }, + { + "epoch": 12.47, + "learning_rate": 6.0108303249097465e-05, + "loss": 0.0691, + "step": 2718 + }, + { + "epoch": 12.47, + "learning_rate": 5.9999999999999995e-05, + "loss": 0.0293, + "step": 2719 + }, + { + "epoch": 12.48, + "learning_rate": 5.9891696750902524e-05, + "loss": 0.0515, + "step": 2720 + }, + { + "epoch": 12.48, + "learning_rate": 5.978339350180505e-05, + "loss": 0.0881, + "step": 2721 + }, + { + "epoch": 12.49, + "learning_rate": 5.967509025270758e-05, + "loss": 0.1056, + "step": 2722 + }, + { + "epoch": 12.49, + "learning_rate": 5.95667870036101e-05, + "loss": 0.1101, + "step": 2723 + }, + { + "epoch": 12.5, + "learning_rate": 5.9458483754512636e-05, + "loss": 0.0711, + "step": 2724 + }, + { + "epoch": 12.5, + "learning_rate": 5.935018050541516e-05, + "loss": 0.0791, + "step": 2725 + }, + { + "epoch": 12.5, + "learning_rate": 5.924187725631768e-05, + "loss": 0.1092, + "step": 2726 + }, + { + "epoch": 12.51, + "learning_rate": 5.913357400722021e-05, + "loss": 0.0975, + "step": 2727 + }, + { + "epoch": 12.51, + "learning_rate": 5.9025270758122735e-05, + "loss": 0.1751, + "step": 2728 + }, + { + "epoch": 12.52, + "learning_rate": 5.8916967509025264e-05, + "loss": 0.0246, + "step": 2729 + }, + { + "epoch": 12.52, + "learning_rate": 5.8808664259927794e-05, + "loss": 0.0338, + "step": 2730 + }, + { + "epoch": 12.53, + "learning_rate": 5.8700361010830324e-05, + "loss": 0.052, + "step": 2731 + }, + { + "epoch": 12.53, + "learning_rate": 5.859205776173285e-05, + "loss": 0.0518, + "step": 2732 + }, + { + "epoch": 12.54, + "learning_rate": 5.848375451263537e-05, + "loss": 0.0806, + "step": 2733 + }, + { + "epoch": 12.54, + "learning_rate": 5.83754512635379e-05, + "loss": 0.0754, + "step": 2734 + }, + { + "epoch": 12.55, + "learning_rate": 5.826714801444043e-05, + "loss": 0.0954, + "step": 2735 + }, + { + "epoch": 12.55, + "learning_rate": 5.815884476534296e-05, + "loss": 0.0895, + "step": 2736 + }, + { + "epoch": 12.56, + "learning_rate": 5.805054151624548e-05, + "loss": 0.0556, + "step": 2737 + }, + { + "epoch": 12.56, + "learning_rate": 5.794223826714801e-05, + "loss": 0.0738, + "step": 2738 + }, + { + "epoch": 12.56, + "learning_rate": 5.7833935018050534e-05, + "loss": 0.0839, + "step": 2739 + }, + { + "epoch": 12.57, + "learning_rate": 5.772563176895306e-05, + "loss": 0.0304, + "step": 2740 + }, + { + "epoch": 12.57, + "learning_rate": 5.7617328519855593e-05, + "loss": 0.0756, + "step": 2741 + }, + { + "epoch": 12.58, + "learning_rate": 5.7509025270758116e-05, + "loss": 0.0529, + "step": 2742 + }, + { + "epoch": 12.58, + "learning_rate": 5.7400722021660646e-05, + "loss": 0.0569, + "step": 2743 + }, + { + "epoch": 12.59, + "learning_rate": 5.729241877256317e-05, + "loss": 0.0341, + "step": 2744 + }, + { + "epoch": 12.59, + "learning_rate": 5.71841155234657e-05, + "loss": 0.0606, + "step": 2745 + }, + { + "epoch": 12.6, + "learning_rate": 5.707581227436823e-05, + "loss": 0.0631, + "step": 2746 + }, + { + "epoch": 12.6, + "learning_rate": 5.696750902527076e-05, + "loss": 0.1039, + "step": 2747 + }, + { + "epoch": 12.61, + "learning_rate": 5.685920577617328e-05, + "loss": 0.1214, + "step": 2748 + }, + { + "epoch": 12.61, + "learning_rate": 5.6750902527075804e-05, + "loss": 0.0751, + "step": 2749 + }, + { + "epoch": 12.61, + "learning_rate": 5.6642599277978333e-05, + "loss": 0.0551, + "step": 2750 + }, + { + "epoch": 12.62, + "learning_rate": 5.653429602888086e-05, + "loss": 0.1064, + "step": 2751 + }, + { + "epoch": 12.62, + "learning_rate": 5.642599277978339e-05, + "loss": 0.118, + "step": 2752 + }, + { + "epoch": 12.63, + "learning_rate": 5.6317689530685916e-05, + "loss": 0.0615, + "step": 2753 + }, + { + "epoch": 12.63, + "learning_rate": 5.6209386281588445e-05, + "loss": 0.0645, + "step": 2754 + }, + { + "epoch": 12.64, + "learning_rate": 5.610108303249097e-05, + "loss": 0.0437, + "step": 2755 + }, + { + "epoch": 12.64, + "learning_rate": 5.599277978339349e-05, + "loss": 0.0308, + "step": 2756 + }, + { + "epoch": 12.65, + "learning_rate": 5.588447653429603e-05, + "loss": 0.0448, + "step": 2757 + }, + { + "epoch": 12.65, + "learning_rate": 5.577617328519855e-05, + "loss": 0.047, + "step": 2758 + }, + { + "epoch": 12.66, + "learning_rate": 5.566787003610108e-05, + "loss": 0.0691, + "step": 2759 + }, + { + "epoch": 12.66, + "learning_rate": 5.55595667870036e-05, + "loss": 0.0879, + "step": 2760 + }, + { + "epoch": 12.67, + "learning_rate": 5.5451263537906126e-05, + "loss": 0.0872, + "step": 2761 + }, + { + "epoch": 12.67, + "learning_rate": 5.534296028880866e-05, + "loss": 0.1469, + "step": 2762 + }, + { + "epoch": 12.67, + "learning_rate": 5.5234657039711185e-05, + "loss": 0.0499, + "step": 2763 + }, + { + "epoch": 12.68, + "learning_rate": 5.5126353790613715e-05, + "loss": 0.0586, + "step": 2764 + }, + { + "epoch": 12.68, + "learning_rate": 5.501805054151624e-05, + "loss": 0.1172, + "step": 2765 + }, + { + "epoch": 12.69, + "learning_rate": 5.490974729241877e-05, + "loss": 0.0901, + "step": 2766 + }, + { + "epoch": 12.69, + "learning_rate": 5.480144404332129e-05, + "loss": 0.06, + "step": 2767 + }, + { + "epoch": 12.7, + "learning_rate": 5.469314079422383e-05, + "loss": 0.1099, + "step": 2768 + }, + { + "epoch": 12.7, + "learning_rate": 5.458483754512635e-05, + "loss": 0.0549, + "step": 2769 + }, + { + "epoch": 12.71, + "learning_rate": 5.447653429602887e-05, + "loss": 0.043, + "step": 2770 + }, + { + "epoch": 12.71, + "learning_rate": 5.43682310469314e-05, + "loss": 0.0948, + "step": 2771 + }, + { + "epoch": 12.72, + "learning_rate": 5.4259927797833925e-05, + "loss": 0.088, + "step": 2772 + }, + { + "epoch": 12.72, + "learning_rate": 5.415162454873646e-05, + "loss": 0.0793, + "step": 2773 + }, + { + "epoch": 12.72, + "learning_rate": 5.4043321299638985e-05, + "loss": 0.0692, + "step": 2774 + }, + { + "epoch": 12.73, + "learning_rate": 5.3935018050541514e-05, + "loss": 0.0702, + "step": 2775 + }, + { + "epoch": 12.73, + "learning_rate": 5.382671480144404e-05, + "loss": 0.0644, + "step": 2776 + }, + { + "epoch": 12.74, + "learning_rate": 5.371841155234656e-05, + "loss": 0.096, + "step": 2777 + }, + { + "epoch": 12.74, + "learning_rate": 5.36101083032491e-05, + "loss": 0.0786, + "step": 2778 + }, + { + "epoch": 12.75, + "learning_rate": 5.350180505415162e-05, + "loss": 0.1135, + "step": 2779 + }, + { + "epoch": 12.75, + "learning_rate": 5.339350180505415e-05, + "loss": 0.1034, + "step": 2780 + }, + { + "epoch": 12.76, + "learning_rate": 5.328519855595667e-05, + "loss": 0.1115, + "step": 2781 + }, + { + "epoch": 12.76, + "learning_rate": 5.31768953068592e-05, + "loss": 0.0608, + "step": 2782 + }, + { + "epoch": 12.77, + "learning_rate": 5.3068592057761725e-05, + "loss": 0.076, + "step": 2783 + }, + { + "epoch": 12.77, + "learning_rate": 5.296028880866426e-05, + "loss": 0.0722, + "step": 2784 + }, + { + "epoch": 12.78, + "learning_rate": 5.2851985559566784e-05, + "loss": 0.0373, + "step": 2785 + }, + { + "epoch": 12.78, + "learning_rate": 5.274368231046931e-05, + "loss": 0.1194, + "step": 2786 + }, + { + "epoch": 12.78, + "learning_rate": 5.263537906137184e-05, + "loss": 0.0753, + "step": 2787 + }, + { + "epoch": 12.79, + "learning_rate": 5.252707581227436e-05, + "loss": 0.1701, + "step": 2788 + }, + { + "epoch": 12.79, + "learning_rate": 5.2418772563176896e-05, + "loss": 0.0455, + "step": 2789 + }, + { + "epoch": 12.8, + "learning_rate": 5.231046931407942e-05, + "loss": 0.1695, + "step": 2790 + }, + { + "epoch": 12.8, + "learning_rate": 5.220216606498195e-05, + "loss": 0.0908, + "step": 2791 + }, + { + "epoch": 12.81, + "learning_rate": 5.209386281588447e-05, + "loss": 0.0549, + "step": 2792 + }, + { + "epoch": 12.81, + "learning_rate": 5.1985559566786994e-05, + "loss": 0.0664, + "step": 2793 + }, + { + "epoch": 12.82, + "learning_rate": 5.1877256317689524e-05, + "loss": 0.0722, + "step": 2794 + }, + { + "epoch": 12.82, + "learning_rate": 5.1768953068592054e-05, + "loss": 0.0415, + "step": 2795 + }, + { + "epoch": 12.83, + "learning_rate": 5.1660649819494583e-05, + "loss": 0.0716, + "step": 2796 + }, + { + "epoch": 12.83, + "learning_rate": 5.1552346570397106e-05, + "loss": 0.0145, + "step": 2797 + }, + { + "epoch": 12.83, + "learning_rate": 5.1444043321299636e-05, + "loss": 0.0561, + "step": 2798 + }, + { + "epoch": 12.84, + "learning_rate": 5.133574007220216e-05, + "loss": 0.135, + "step": 2799 + }, + { + "epoch": 12.84, + "learning_rate": 5.1227436823104695e-05, + "loss": 0.0542, + "step": 2800 + }, + { + "epoch": 12.84, + "eval_loss": 0.37319043278694153, + "eval_runtime": 20.1025, + "eval_samples_per_second": 81.93, + "eval_steps_per_second": 2.587, + "eval_wer": 0.3369420896741906, + "step": 2800 + }, + { + "epoch": 12.85, + "learning_rate": 5.111913357400722e-05, + "loss": 0.0656, + "step": 2801 + }, + { + "epoch": 12.85, + "learning_rate": 5.101083032490974e-05, + "loss": 0.0415, + "step": 2802 + }, + { + "epoch": 12.86, + "learning_rate": 5.090252707581227e-05, + "loss": 0.18, + "step": 2803 + }, + { + "epoch": 12.86, + "learning_rate": 5.0794223826714794e-05, + "loss": 0.0508, + "step": 2804 + }, + { + "epoch": 12.87, + "learning_rate": 5.068592057761732e-05, + "loss": 0.0283, + "step": 2805 + }, + { + "epoch": 12.87, + "learning_rate": 5.057761732851985e-05, + "loss": 0.0346, + "step": 2806 + }, + { + "epoch": 12.88, + "learning_rate": 5.0469314079422376e-05, + "loss": 0.0542, + "step": 2807 + }, + { + "epoch": 12.88, + "learning_rate": 5.0361010830324906e-05, + "loss": 0.0466, + "step": 2808 + }, + { + "epoch": 12.89, + "learning_rate": 5.025270758122743e-05, + "loss": 0.0626, + "step": 2809 + }, + { + "epoch": 12.89, + "learning_rate": 5.014440433212996e-05, + "loss": 0.0827, + "step": 2810 + }, + { + "epoch": 12.89, + "learning_rate": 5.003610108303249e-05, + "loss": 0.1091, + "step": 2811 + }, + { + "epoch": 12.9, + "learning_rate": 4.992779783393502e-05, + "loss": 0.0769, + "step": 2812 + }, + { + "epoch": 12.9, + "learning_rate": 4.981949458483754e-05, + "loss": 0.0883, + "step": 2813 + }, + { + "epoch": 12.91, + "learning_rate": 4.9711191335740063e-05, + "loss": 0.0841, + "step": 2814 + }, + { + "epoch": 12.91, + "learning_rate": 4.960288808664259e-05, + "loss": 0.0924, + "step": 2815 + }, + { + "epoch": 12.92, + "learning_rate": 4.949458483754512e-05, + "loss": 0.0721, + "step": 2816 + }, + { + "epoch": 12.92, + "learning_rate": 4.938628158844765e-05, + "loss": 0.0571, + "step": 2817 + }, + { + "epoch": 12.93, + "learning_rate": 4.9277978339350175e-05, + "loss": 0.0466, + "step": 2818 + }, + { + "epoch": 12.93, + "learning_rate": 4.9169675090252705e-05, + "loss": 0.0829, + "step": 2819 + }, + { + "epoch": 12.94, + "learning_rate": 4.906137184115523e-05, + "loss": 0.0997, + "step": 2820 + }, + { + "epoch": 12.94, + "learning_rate": 4.895306859205775e-05, + "loss": 0.0782, + "step": 2821 + }, + { + "epoch": 12.94, + "learning_rate": 4.884476534296029e-05, + "loss": 0.0493, + "step": 2822 + }, + { + "epoch": 12.95, + "learning_rate": 4.873646209386281e-05, + "loss": 0.1088, + "step": 2823 + }, + { + "epoch": 12.95, + "learning_rate": 4.862815884476534e-05, + "loss": 0.0779, + "step": 2824 + }, + { + "epoch": 12.96, + "learning_rate": 4.851985559566786e-05, + "loss": 0.099, + "step": 2825 + }, + { + "epoch": 12.96, + "learning_rate": 4.841155234657039e-05, + "loss": 0.0749, + "step": 2826 + }, + { + "epoch": 12.97, + "learning_rate": 4.830324909747292e-05, + "loss": 0.1671, + "step": 2827 + }, + { + "epoch": 12.97, + "learning_rate": 4.819494584837545e-05, + "loss": 0.0566, + "step": 2828 + }, + { + "epoch": 12.98, + "learning_rate": 4.8086642599277975e-05, + "loss": 0.101, + "step": 2829 + }, + { + "epoch": 12.98, + "learning_rate": 4.79783393501805e-05, + "loss": 0.0305, + "step": 2830 + }, + { + "epoch": 12.99, + "learning_rate": 4.787003610108303e-05, + "loss": 0.0697, + "step": 2831 + }, + { + "epoch": 12.99, + "learning_rate": 4.776173285198555e-05, + "loss": 0.0395, + "step": 2832 + }, + { + "epoch": 13.0, + "learning_rate": 4.765342960288809e-05, + "loss": 0.1571, + "step": 2833 + }, + { + "epoch": 13.0, + "learning_rate": 4.754512635379061e-05, + "loss": 0.0794, + "step": 2834 + }, + { + "epoch": 13.0, + "learning_rate": 4.743682310469314e-05, + "loss": 0.0535, + "step": 2835 + }, + { + "epoch": 13.01, + "learning_rate": 4.732851985559566e-05, + "loss": 0.0589, + "step": 2836 + }, + { + "epoch": 13.01, + "learning_rate": 4.7220216606498185e-05, + "loss": 0.0685, + "step": 2837 + }, + { + "epoch": 13.02, + "learning_rate": 4.711191335740072e-05, + "loss": 0.0505, + "step": 2838 + }, + { + "epoch": 13.02, + "learning_rate": 4.7003610108303244e-05, + "loss": 0.0278, + "step": 2839 + }, + { + "epoch": 13.03, + "learning_rate": 4.6895306859205774e-05, + "loss": 0.1048, + "step": 2840 + }, + { + "epoch": 13.03, + "learning_rate": 4.67870036101083e-05, + "loss": 0.0414, + "step": 2841 + }, + { + "epoch": 13.04, + "learning_rate": 4.667870036101083e-05, + "loss": 0.0968, + "step": 2842 + }, + { + "epoch": 13.04, + "learning_rate": 4.6570397111913356e-05, + "loss": 0.0644, + "step": 2843 + }, + { + "epoch": 13.05, + "learning_rate": 4.6462093862815886e-05, + "loss": 0.0722, + "step": 2844 + }, + { + "epoch": 13.05, + "learning_rate": 4.635379061371841e-05, + "loss": 0.0452, + "step": 2845 + }, + { + "epoch": 13.06, + "learning_rate": 4.624548736462093e-05, + "loss": 0.0775, + "step": 2846 + }, + { + "epoch": 13.06, + "learning_rate": 4.613718411552346e-05, + "loss": 0.0658, + "step": 2847 + }, + { + "epoch": 13.06, + "learning_rate": 4.6028880866425984e-05, + "loss": 0.0396, + "step": 2848 + }, + { + "epoch": 13.07, + "learning_rate": 4.592057761732852e-05, + "loss": 0.0545, + "step": 2849 + }, + { + "epoch": 13.07, + "learning_rate": 4.5812274368231044e-05, + "loss": 0.0982, + "step": 2850 + }, + { + "epoch": 13.08, + "learning_rate": 4.570397111913357e-05, + "loss": 0.0641, + "step": 2851 + }, + { + "epoch": 13.08, + "learning_rate": 4.5595667870036096e-05, + "loss": 0.043, + "step": 2852 + }, + { + "epoch": 13.09, + "learning_rate": 4.548736462093862e-05, + "loss": 0.1075, + "step": 2853 + }, + { + "epoch": 13.09, + "learning_rate": 4.5379061371841156e-05, + "loss": 0.0813, + "step": 2854 + }, + { + "epoch": 13.1, + "learning_rate": 4.527075812274368e-05, + "loss": 0.0331, + "step": 2855 + }, + { + "epoch": 13.1, + "learning_rate": 4.516245487364621e-05, + "loss": 0.1345, + "step": 2856 + }, + { + "epoch": 13.11, + "learning_rate": 4.505415162454873e-05, + "loss": 0.0575, + "step": 2857 + }, + { + "epoch": 13.11, + "learning_rate": 4.4945848375451254e-05, + "loss": 0.0455, + "step": 2858 + }, + { + "epoch": 13.11, + "learning_rate": 4.4837545126353784e-05, + "loss": 0.1655, + "step": 2859 + }, + { + "epoch": 13.12, + "learning_rate": 4.4729241877256313e-05, + "loss": 0.0206, + "step": 2860 + }, + { + "epoch": 13.12, + "learning_rate": 4.462093862815884e-05, + "loss": 0.0471, + "step": 2861 + }, + { + "epoch": 13.13, + "learning_rate": 4.4512635379061366e-05, + "loss": 0.0704, + "step": 2862 + }, + { + "epoch": 13.13, + "learning_rate": 4.4404332129963896e-05, + "loss": 0.1134, + "step": 2863 + }, + { + "epoch": 13.14, + "learning_rate": 4.429602888086642e-05, + "loss": 0.0229, + "step": 2864 + }, + { + "epoch": 13.14, + "learning_rate": 4.4187725631768955e-05, + "loss": 0.0359, + "step": 2865 + }, + { + "epoch": 13.15, + "learning_rate": 4.407942238267148e-05, + "loss": 0.0609, + "step": 2866 + }, + { + "epoch": 13.15, + "learning_rate": 4.3971119133574e-05, + "loss": 0.0834, + "step": 2867 + }, + { + "epoch": 13.16, + "learning_rate": 4.386281588447653e-05, + "loss": 0.0558, + "step": 2868 + }, + { + "epoch": 13.16, + "learning_rate": 4.3754512635379053e-05, + "loss": 0.0374, + "step": 2869 + }, + { + "epoch": 13.17, + "learning_rate": 4.364620938628159e-05, + "loss": 0.0873, + "step": 2870 + }, + { + "epoch": 13.17, + "learning_rate": 4.353790613718411e-05, + "loss": 0.1664, + "step": 2871 + }, + { + "epoch": 13.17, + "learning_rate": 4.342960288808664e-05, + "loss": 0.1264, + "step": 2872 + }, + { + "epoch": 13.18, + "learning_rate": 4.3321299638989165e-05, + "loss": 0.0616, + "step": 2873 + }, + { + "epoch": 13.18, + "learning_rate": 4.321299638989169e-05, + "loss": 0.0303, + "step": 2874 + }, + { + "epoch": 13.19, + "learning_rate": 4.310469314079422e-05, + "loss": 0.0298, + "step": 2875 + }, + { + "epoch": 13.19, + "learning_rate": 4.299638989169675e-05, + "loss": 0.0548, + "step": 2876 + }, + { + "epoch": 13.2, + "learning_rate": 4.288808664259928e-05, + "loss": 0.0301, + "step": 2877 + }, + { + "epoch": 13.2, + "learning_rate": 4.27797833935018e-05, + "loss": 0.0555, + "step": 2878 + }, + { + "epoch": 13.21, + "learning_rate": 4.267148014440433e-05, + "loss": 0.0913, + "step": 2879 + }, + { + "epoch": 13.21, + "learning_rate": 4.256317689530685e-05, + "loss": 0.071, + "step": 2880 + }, + { + "epoch": 13.22, + "learning_rate": 4.245487364620939e-05, + "loss": 0.045, + "step": 2881 + }, + { + "epoch": 13.22, + "learning_rate": 4.234657039711191e-05, + "loss": 0.1279, + "step": 2882 + }, + { + "epoch": 13.22, + "learning_rate": 4.2238267148014435e-05, + "loss": 0.1088, + "step": 2883 + }, + { + "epoch": 13.23, + "learning_rate": 4.2129963898916965e-05, + "loss": 0.0999, + "step": 2884 + }, + { + "epoch": 13.23, + "learning_rate": 4.202166064981949e-05, + "loss": 0.0763, + "step": 2885 + }, + { + "epoch": 13.24, + "learning_rate": 4.191335740072202e-05, + "loss": 0.0463, + "step": 2886 + }, + { + "epoch": 13.24, + "learning_rate": 4.180505415162455e-05, + "loss": 0.0388, + "step": 2887 + }, + { + "epoch": 13.25, + "learning_rate": 4.169675090252708e-05, + "loss": 0.0583, + "step": 2888 + }, + { + "epoch": 13.25, + "learning_rate": 4.15884476534296e-05, + "loss": 0.0922, + "step": 2889 + }, + { + "epoch": 13.26, + "learning_rate": 4.148014440433212e-05, + "loss": 0.0753, + "step": 2890 + }, + { + "epoch": 13.26, + "learning_rate": 4.137184115523465e-05, + "loss": 0.0633, + "step": 2891 + }, + { + "epoch": 13.27, + "learning_rate": 4.126353790613718e-05, + "loss": 0.0909, + "step": 2892 + }, + { + "epoch": 13.27, + "learning_rate": 4.115523465703971e-05, + "loss": 0.0469, + "step": 2893 + }, + { + "epoch": 13.28, + "learning_rate": 4.1046931407942234e-05, + "loss": 0.1607, + "step": 2894 + }, + { + "epoch": 13.28, + "learning_rate": 4.093862815884476e-05, + "loss": 0.0348, + "step": 2895 + }, + { + "epoch": 13.28, + "learning_rate": 4.083032490974729e-05, + "loss": 0.1298, + "step": 2896 + }, + { + "epoch": 13.29, + "learning_rate": 4.072202166064982e-05, + "loss": 0.1057, + "step": 2897 + }, + { + "epoch": 13.29, + "learning_rate": 4.0613718411552346e-05, + "loss": 0.0537, + "step": 2898 + }, + { + "epoch": 13.3, + "learning_rate": 4.050541516245487e-05, + "loss": 0.0374, + "step": 2899 + }, + { + "epoch": 13.3, + "learning_rate": 4.03971119133574e-05, + "loss": 0.087, + "step": 2900 + }, + { + "epoch": 13.3, + "eval_loss": 0.38328906893730164, + "eval_runtime": 19.961, + "eval_samples_per_second": 82.511, + "eval_steps_per_second": 2.605, + "eval_wer": 0.3458278010417731, + "step": 2900 + }, + { + "epoch": 13.31, + "learning_rate": 4.028880866425992e-05, + "loss": 0.0776, + "step": 2901 + }, + { + "epoch": 13.31, + "learning_rate": 4.0180505415162445e-05, + "loss": 0.0662, + "step": 2902 + }, + { + "epoch": 13.32, + "learning_rate": 4.007220216606498e-05, + "loss": 0.0494, + "step": 2903 + }, + { + "epoch": 13.32, + "learning_rate": 3.9963898916967504e-05, + "loss": 0.069, + "step": 2904 + }, + { + "epoch": 13.33, + "learning_rate": 3.9855595667870034e-05, + "loss": 0.111, + "step": 2905 + }, + { + "epoch": 13.33, + "learning_rate": 3.974729241877256e-05, + "loss": 0.0702, + "step": 2906 + }, + { + "epoch": 13.33, + "learning_rate": 3.9638989169675086e-05, + "loss": 0.0616, + "step": 2907 + }, + { + "epoch": 13.34, + "learning_rate": 3.9530685920577616e-05, + "loss": 0.0807, + "step": 2908 + }, + { + "epoch": 13.34, + "learning_rate": 3.9422382671480146e-05, + "loss": 0.0778, + "step": 2909 + }, + { + "epoch": 13.35, + "learning_rate": 3.931407942238267e-05, + "loss": 0.0305, + "step": 2910 + }, + { + "epoch": 13.35, + "learning_rate": 3.920577617328519e-05, + "loss": 0.0691, + "step": 2911 + }, + { + "epoch": 13.36, + "learning_rate": 3.909747292418772e-05, + "loss": 0.0359, + "step": 2912 + }, + { + "epoch": 13.36, + "learning_rate": 3.8989169675090244e-05, + "loss": 0.0577, + "step": 2913 + }, + { + "epoch": 13.37, + "learning_rate": 3.888086642599278e-05, + "loss": 0.0657, + "step": 2914 + }, + { + "epoch": 13.37, + "learning_rate": 3.8772563176895303e-05, + "loss": 0.0312, + "step": 2915 + }, + { + "epoch": 13.38, + "learning_rate": 3.866425992779783e-05, + "loss": 0.0512, + "step": 2916 + }, + { + "epoch": 13.38, + "learning_rate": 3.8555956678700356e-05, + "loss": 0.0727, + "step": 2917 + }, + { + "epoch": 13.39, + "learning_rate": 3.844765342960288e-05, + "loss": 0.0254, + "step": 2918 + }, + { + "epoch": 13.39, + "learning_rate": 3.8339350180505415e-05, + "loss": 0.0503, + "step": 2919 + }, + { + "epoch": 13.39, + "learning_rate": 3.823104693140794e-05, + "loss": 0.0875, + "step": 2920 + }, + { + "epoch": 13.4, + "learning_rate": 3.812274368231047e-05, + "loss": 0.0687, + "step": 2921 + }, + { + "epoch": 13.4, + "learning_rate": 3.801444043321299e-05, + "loss": 0.1056, + "step": 2922 + }, + { + "epoch": 13.41, + "learning_rate": 3.790613718411552e-05, + "loss": 0.0377, + "step": 2923 + }, + { + "epoch": 13.41, + "learning_rate": 3.7797833935018043e-05, + "loss": 0.0725, + "step": 2924 + }, + { + "epoch": 13.42, + "learning_rate": 3.768953068592058e-05, + "loss": 0.0364, + "step": 2925 + }, + { + "epoch": 13.42, + "learning_rate": 3.75812274368231e-05, + "loss": 0.0411, + "step": 2926 + }, + { + "epoch": 13.43, + "learning_rate": 3.7472924187725626e-05, + "loss": 0.0672, + "step": 2927 + }, + { + "epoch": 13.43, + "learning_rate": 3.7364620938628155e-05, + "loss": 0.0144, + "step": 2928 + }, + { + "epoch": 13.44, + "learning_rate": 3.7256317689530685e-05, + "loss": 0.0276, + "step": 2929 + }, + { + "epoch": 13.44, + "learning_rate": 3.714801444043321e-05, + "loss": 0.0665, + "step": 2930 + }, + { + "epoch": 13.44, + "learning_rate": 3.703971119133574e-05, + "loss": 0.1397, + "step": 2931 + }, + { + "epoch": 13.45, + "learning_rate": 3.693140794223827e-05, + "loss": 0.0711, + "step": 2932 + }, + { + "epoch": 13.45, + "learning_rate": 3.682310469314079e-05, + "loss": 0.0663, + "step": 2933 + }, + { + "epoch": 13.46, + "learning_rate": 3.671480144404332e-05, + "loss": 0.1321, + "step": 2934 + }, + { + "epoch": 13.46, + "learning_rate": 3.660649819494584e-05, + "loss": 0.0376, + "step": 2935 + }, + { + "epoch": 13.47, + "learning_rate": 3.649819494584837e-05, + "loss": 0.0829, + "step": 2936 + }, + { + "epoch": 13.47, + "learning_rate": 3.63898916967509e-05, + "loss": 0.0685, + "step": 2937 + }, + { + "epoch": 13.48, + "learning_rate": 3.6281588447653425e-05, + "loss": 0.0764, + "step": 2938 + }, + { + "epoch": 13.48, + "learning_rate": 3.6173285198555955e-05, + "loss": 0.0972, + "step": 2939 + }, + { + "epoch": 13.49, + "learning_rate": 3.606498194945848e-05, + "loss": 0.0701, + "step": 2940 + }, + { + "epoch": 13.49, + "learning_rate": 3.595667870036101e-05, + "loss": 0.074, + "step": 2941 + }, + { + "epoch": 13.5, + "learning_rate": 3.584837545126354e-05, + "loss": 0.1365, + "step": 2942 + }, + { + "epoch": 13.5, + "learning_rate": 3.574007220216606e-05, + "loss": 0.093, + "step": 2943 + }, + { + "epoch": 13.5, + "learning_rate": 3.563176895306859e-05, + "loss": 0.0414, + "step": 2944 + }, + { + "epoch": 13.51, + "learning_rate": 3.552346570397112e-05, + "loss": 0.0771, + "step": 2945 + }, + { + "epoch": 13.51, + "learning_rate": 3.541516245487364e-05, + "loss": 0.1401, + "step": 2946 + }, + { + "epoch": 13.52, + "learning_rate": 3.5306859205776165e-05, + "loss": 0.1222, + "step": 2947 + }, + { + "epoch": 13.52, + "learning_rate": 3.5198555956678695e-05, + "loss": 0.0676, + "step": 2948 + }, + { + "epoch": 13.53, + "learning_rate": 3.5090252707581224e-05, + "loss": 0.0417, + "step": 2949 + }, + { + "epoch": 13.53, + "learning_rate": 3.4981949458483754e-05, + "loss": 0.0797, + "step": 2950 + }, + { + "epoch": 13.54, + "learning_rate": 3.487364620938628e-05, + "loss": 0.0992, + "step": 2951 + }, + { + "epoch": 13.54, + "learning_rate": 3.476534296028881e-05, + "loss": 0.0453, + "step": 2952 + }, + { + "epoch": 13.55, + "learning_rate": 3.4657039711191336e-05, + "loss": 0.0486, + "step": 2953 + }, + { + "epoch": 13.55, + "learning_rate": 3.454873646209386e-05, + "loss": 0.0549, + "step": 2954 + }, + { + "epoch": 13.56, + "learning_rate": 3.444043321299638e-05, + "loss": 0.0634, + "step": 2955 + }, + { + "epoch": 13.56, + "learning_rate": 3.433212996389891e-05, + "loss": 0.0518, + "step": 2956 + }, + { + "epoch": 13.56, + "learning_rate": 3.422382671480144e-05, + "loss": 0.1083, + "step": 2957 + }, + { + "epoch": 13.57, + "learning_rate": 3.411552346570397e-05, + "loss": 0.0784, + "step": 2958 + }, + { + "epoch": 13.57, + "learning_rate": 3.4007220216606494e-05, + "loss": 0.1415, + "step": 2959 + }, + { + "epoch": 13.58, + "learning_rate": 3.3898916967509024e-05, + "loss": 0.0682, + "step": 2960 + }, + { + "epoch": 13.58, + "learning_rate": 3.3790613718411553e-05, + "loss": 0.0762, + "step": 2961 + }, + { + "epoch": 13.59, + "learning_rate": 3.3682310469314076e-05, + "loss": 0.0798, + "step": 2962 + }, + { + "epoch": 13.59, + "learning_rate": 3.35740072202166e-05, + "loss": 0.0488, + "step": 2963 + }, + { + "epoch": 13.6, + "learning_rate": 3.346570397111913e-05, + "loss": 0.0929, + "step": 2964 + }, + { + "epoch": 13.6, + "learning_rate": 3.335740072202166e-05, + "loss": 0.0601, + "step": 2965 + }, + { + "epoch": 13.61, + "learning_rate": 3.324909747292419e-05, + "loss": 0.0388, + "step": 2966 + }, + { + "epoch": 13.61, + "learning_rate": 3.314079422382671e-05, + "loss": 0.0586, + "step": 2967 + }, + { + "epoch": 13.61, + "learning_rate": 3.303249097472924e-05, + "loss": 0.119, + "step": 2968 + }, + { + "epoch": 13.62, + "learning_rate": 3.292418772563177e-05, + "loss": 0.1002, + "step": 2969 + }, + { + "epoch": 13.62, + "learning_rate": 3.2815884476534293e-05, + "loss": 0.0713, + "step": 2970 + }, + { + "epoch": 13.63, + "learning_rate": 3.2707581227436816e-05, + "loss": 0.1808, + "step": 2971 + }, + { + "epoch": 13.63, + "learning_rate": 3.2599277978339346e-05, + "loss": 0.0564, + "step": 2972 + }, + { + "epoch": 13.64, + "learning_rate": 3.2490974729241876e-05, + "loss": 0.0165, + "step": 2973 + }, + { + "epoch": 13.64, + "learning_rate": 3.23826714801444e-05, + "loss": 0.021, + "step": 2974 + }, + { + "epoch": 13.65, + "learning_rate": 3.227436823104693e-05, + "loss": 0.0444, + "step": 2975 + }, + { + "epoch": 13.65, + "learning_rate": 3.216606498194946e-05, + "loss": 0.0236, + "step": 2976 + }, + { + "epoch": 13.66, + "learning_rate": 3.205776173285199e-05, + "loss": 0.0643, + "step": 2977 + }, + { + "epoch": 13.66, + "learning_rate": 3.194945848375451e-05, + "loss": 0.0632, + "step": 2978 + }, + { + "epoch": 13.67, + "learning_rate": 3.1841155234657033e-05, + "loss": 0.076, + "step": 2979 + }, + { + "epoch": 13.67, + "learning_rate": 3.173285198555956e-05, + "loss": 0.074, + "step": 2980 + }, + { + "epoch": 13.67, + "learning_rate": 3.162454873646209e-05, + "loss": 0.0304, + "step": 2981 + }, + { + "epoch": 13.68, + "learning_rate": 3.1516245487364616e-05, + "loss": 0.0381, + "step": 2982 + }, + { + "epoch": 13.68, + "learning_rate": 3.1407942238267145e-05, + "loss": 0.0555, + "step": 2983 + }, + { + "epoch": 13.69, + "learning_rate": 3.129963898916967e-05, + "loss": 0.1642, + "step": 2984 + }, + { + "epoch": 13.69, + "learning_rate": 3.11913357400722e-05, + "loss": 0.0571, + "step": 2985 + }, + { + "epoch": 13.7, + "learning_rate": 3.108303249097473e-05, + "loss": 0.0335, + "step": 2986 + }, + { + "epoch": 13.7, + "learning_rate": 3.097472924187725e-05, + "loss": 0.0435, + "step": 2987 + }, + { + "epoch": 13.71, + "learning_rate": 3.086642599277978e-05, + "loss": 0.0615, + "step": 2988 + }, + { + "epoch": 13.71, + "learning_rate": 3.075812274368231e-05, + "loss": 0.0849, + "step": 2989 + }, + { + "epoch": 13.72, + "learning_rate": 3.064981949458483e-05, + "loss": 0.0696, + "step": 2990 + }, + { + "epoch": 13.72, + "learning_rate": 3.054151624548736e-05, + "loss": 0.0776, + "step": 2991 + }, + { + "epoch": 13.72, + "learning_rate": 3.043321299638989e-05, + "loss": 0.0713, + "step": 2992 + }, + { + "epoch": 13.73, + "learning_rate": 3.0324909747292415e-05, + "loss": 0.0676, + "step": 2993 + }, + { + "epoch": 13.73, + "learning_rate": 3.0216606498194945e-05, + "loss": 0.0543, + "step": 2994 + }, + { + "epoch": 13.74, + "learning_rate": 3.0108303249097468e-05, + "loss": 0.1155, + "step": 2995 + }, + { + "epoch": 13.74, + "learning_rate": 2.9999999999999997e-05, + "loss": 0.1157, + "step": 2996 + }, + { + "epoch": 13.75, + "learning_rate": 2.9891696750902524e-05, + "loss": 0.0546, + "step": 2997 + }, + { + "epoch": 13.75, + "learning_rate": 2.978339350180505e-05, + "loss": 0.0806, + "step": 2998 + }, + { + "epoch": 13.76, + "learning_rate": 2.967509025270758e-05, + "loss": 0.0529, + "step": 2999 + }, + { + "epoch": 13.76, + "learning_rate": 2.9566787003610106e-05, + "loss": 0.0196, + "step": 3000 + }, + { + "epoch": 13.76, + "eval_loss": 0.3761161267757416, + "eval_runtime": 20.0645, + "eval_samples_per_second": 82.085, + "eval_steps_per_second": 2.592, + "eval_wer": 0.33030333980185883, + "step": 3000 + }, + { + "epoch": 13.77, + "learning_rate": 2.9458483754512632e-05, + "loss": 0.0384, + "step": 3001 + }, + { + "epoch": 13.77, + "learning_rate": 2.9350180505415162e-05, + "loss": 0.0398, + "step": 3002 + }, + { + "epoch": 13.78, + "learning_rate": 2.9241877256317685e-05, + "loss": 0.0691, + "step": 3003 + }, + { + "epoch": 13.78, + "learning_rate": 2.9133574007220214e-05, + "loss": 0.037, + "step": 3004 + }, + { + "epoch": 13.78, + "learning_rate": 2.902527075812274e-05, + "loss": 0.0655, + "step": 3005 + }, + { + "epoch": 13.79, + "learning_rate": 2.8916967509025267e-05, + "loss": 0.0894, + "step": 3006 + }, + { + "epoch": 13.79, + "learning_rate": 2.8808664259927797e-05, + "loss": 0.0754, + "step": 3007 + }, + { + "epoch": 13.8, + "learning_rate": 2.8700361010830323e-05, + "loss": 0.0806, + "step": 3008 + }, + { + "epoch": 13.8, + "learning_rate": 2.859205776173285e-05, + "loss": 0.1085, + "step": 3009 + }, + { + "epoch": 13.81, + "learning_rate": 2.848375451263538e-05, + "loss": 0.0815, + "step": 3010 + }, + { + "epoch": 13.81, + "learning_rate": 2.8375451263537902e-05, + "loss": 0.0432, + "step": 3011 + }, + { + "epoch": 13.82, + "learning_rate": 2.826714801444043e-05, + "loss": 0.0665, + "step": 3012 + }, + { + "epoch": 13.82, + "learning_rate": 2.8158844765342958e-05, + "loss": 0.0431, + "step": 3013 + }, + { + "epoch": 13.83, + "learning_rate": 2.8050541516245484e-05, + "loss": 0.0304, + "step": 3014 + }, + { + "epoch": 13.83, + "learning_rate": 2.7942238267148014e-05, + "loss": 0.0393, + "step": 3015 + }, + { + "epoch": 13.83, + "learning_rate": 2.783393501805054e-05, + "loss": 0.0851, + "step": 3016 + }, + { + "epoch": 13.84, + "learning_rate": 2.7725631768953063e-05, + "loss": 0.1234, + "step": 3017 + }, + { + "epoch": 13.84, + "learning_rate": 2.7617328519855593e-05, + "loss": 0.0342, + "step": 3018 + }, + { + "epoch": 13.85, + "learning_rate": 2.750902527075812e-05, + "loss": 0.0602, + "step": 3019 + }, + { + "epoch": 13.85, + "learning_rate": 2.7400722021660645e-05, + "loss": 0.1423, + "step": 3020 + }, + { + "epoch": 13.86, + "learning_rate": 2.7292418772563175e-05, + "loss": 0.0605, + "step": 3021 + }, + { + "epoch": 13.86, + "learning_rate": 2.71841155234657e-05, + "loss": 0.0793, + "step": 3022 + }, + { + "epoch": 13.87, + "learning_rate": 2.707581227436823e-05, + "loss": 0.0255, + "step": 3023 + }, + { + "epoch": 13.87, + "learning_rate": 2.6967509025270757e-05, + "loss": 0.0505, + "step": 3024 + }, + { + "epoch": 13.88, + "learning_rate": 2.685920577617328e-05, + "loss": 0.024, + "step": 3025 + }, + { + "epoch": 13.88, + "learning_rate": 2.675090252707581e-05, + "loss": 0.0139, + "step": 3026 + }, + { + "epoch": 13.89, + "learning_rate": 2.6642599277978336e-05, + "loss": 0.0241, + "step": 3027 + }, + { + "epoch": 13.89, + "learning_rate": 2.6534296028880862e-05, + "loss": 0.0386, + "step": 3028 + }, + { + "epoch": 13.89, + "learning_rate": 2.6425992779783392e-05, + "loss": 0.0941, + "step": 3029 + }, + { + "epoch": 13.9, + "learning_rate": 2.631768953068592e-05, + "loss": 0.0349, + "step": 3030 + }, + { + "epoch": 13.9, + "learning_rate": 2.6209386281588448e-05, + "loss": 0.0372, + "step": 3031 + }, + { + "epoch": 13.91, + "learning_rate": 2.6101083032490974e-05, + "loss": 0.0815, + "step": 3032 + }, + { + "epoch": 13.91, + "learning_rate": 2.5992779783393497e-05, + "loss": 0.0378, + "step": 3033 + }, + { + "epoch": 13.92, + "learning_rate": 2.5884476534296027e-05, + "loss": 0.0808, + "step": 3034 + }, + { + "epoch": 13.92, + "learning_rate": 2.5776173285198553e-05, + "loss": 0.0574, + "step": 3035 + }, + { + "epoch": 13.93, + "learning_rate": 2.566787003610108e-05, + "loss": 0.0676, + "step": 3036 + }, + { + "epoch": 13.93, + "learning_rate": 2.555956678700361e-05, + "loss": 0.0315, + "step": 3037 + }, + { + "epoch": 13.94, + "learning_rate": 2.5451263537906135e-05, + "loss": 0.0472, + "step": 3038 + }, + { + "epoch": 13.94, + "learning_rate": 2.534296028880866e-05, + "loss": 0.0556, + "step": 3039 + }, + { + "epoch": 13.94, + "learning_rate": 2.5234657039711188e-05, + "loss": 0.0721, + "step": 3040 + }, + { + "epoch": 13.95, + "learning_rate": 2.5126353790613714e-05, + "loss": 0.0684, + "step": 3041 + }, + { + "epoch": 13.95, + "learning_rate": 2.5018050541516244e-05, + "loss": 0.0842, + "step": 3042 + }, + { + "epoch": 13.96, + "learning_rate": 2.490974729241877e-05, + "loss": 0.1156, + "step": 3043 + }, + { + "epoch": 13.96, + "learning_rate": 2.4801444043321297e-05, + "loss": 0.0559, + "step": 3044 + }, + { + "epoch": 13.97, + "learning_rate": 2.4693140794223826e-05, + "loss": 0.1107, + "step": 3045 + }, + { + "epoch": 13.97, + "learning_rate": 2.4584837545126353e-05, + "loss": 0.0723, + "step": 3046 + }, + { + "epoch": 13.98, + "learning_rate": 2.4476534296028875e-05, + "loss": 0.0682, + "step": 3047 + }, + { + "epoch": 13.98, + "learning_rate": 2.4368231046931405e-05, + "loss": 0.0194, + "step": 3048 + }, + { + "epoch": 13.99, + "learning_rate": 2.425992779783393e-05, + "loss": 0.069, + "step": 3049 + }, + { + "epoch": 13.99, + "learning_rate": 2.415162454873646e-05, + "loss": 0.1006, + "step": 3050 + }, + { + "epoch": 14.0, + "learning_rate": 2.4043321299638987e-05, + "loss": 0.0284, + "step": 3051 + }, + { + "epoch": 14.0, + "learning_rate": 2.3935018050541514e-05, + "loss": 0.0632, + "step": 3052 + }, + { + "epoch": 14.0, + "learning_rate": 2.3826714801444043e-05, + "loss": 0.0161, + "step": 3053 + }, + { + "epoch": 14.01, + "learning_rate": 2.371841155234657e-05, + "loss": 0.0362, + "step": 3054 + }, + { + "epoch": 14.01, + "learning_rate": 2.3610108303249093e-05, + "loss": 0.0349, + "step": 3055 + }, + { + "epoch": 14.02, + "learning_rate": 2.3501805054151622e-05, + "loss": 0.0544, + "step": 3056 + }, + { + "epoch": 14.02, + "learning_rate": 2.339350180505415e-05, + "loss": 0.077, + "step": 3057 + }, + { + "epoch": 14.03, + "learning_rate": 2.3285198555956678e-05, + "loss": 0.055, + "step": 3058 + }, + { + "epoch": 14.03, + "learning_rate": 2.3176895306859204e-05, + "loss": 0.125, + "step": 3059 + }, + { + "epoch": 14.04, + "learning_rate": 2.306859205776173e-05, + "loss": 0.0445, + "step": 3060 + }, + { + "epoch": 14.04, + "learning_rate": 2.296028880866426e-05, + "loss": 0.0457, + "step": 3061 + }, + { + "epoch": 14.05, + "learning_rate": 2.2851985559566783e-05, + "loss": 0.0615, + "step": 3062 + }, + { + "epoch": 14.05, + "learning_rate": 2.274368231046931e-05, + "loss": 0.0982, + "step": 3063 + }, + { + "epoch": 14.06, + "learning_rate": 2.263537906137184e-05, + "loss": 0.0663, + "step": 3064 + }, + { + "epoch": 14.06, + "learning_rate": 2.2527075812274366e-05, + "loss": 0.1101, + "step": 3065 + }, + { + "epoch": 14.06, + "learning_rate": 2.2418772563176892e-05, + "loss": 0.0254, + "step": 3066 + }, + { + "epoch": 14.07, + "learning_rate": 2.231046931407942e-05, + "loss": 0.0414, + "step": 3067 + }, + { + "epoch": 14.07, + "learning_rate": 2.2202166064981948e-05, + "loss": 0.0144, + "step": 3068 + }, + { + "epoch": 14.08, + "learning_rate": 2.2093862815884478e-05, + "loss": 0.0466, + "step": 3069 + }, + { + "epoch": 14.08, + "learning_rate": 2.1985559566787e-05, + "loss": 0.052, + "step": 3070 + }, + { + "epoch": 14.09, + "learning_rate": 2.1877256317689527e-05, + "loss": 0.0548, + "step": 3071 + }, + { + "epoch": 14.09, + "learning_rate": 2.1768953068592056e-05, + "loss": 0.0454, + "step": 3072 + }, + { + "epoch": 14.1, + "learning_rate": 2.1660649819494583e-05, + "loss": 0.0501, + "step": 3073 + }, + { + "epoch": 14.1, + "learning_rate": 2.155234657039711e-05, + "loss": 0.1312, + "step": 3074 + }, + { + "epoch": 14.11, + "learning_rate": 2.144404332129964e-05, + "loss": 0.1228, + "step": 3075 + }, + { + "epoch": 14.11, + "learning_rate": 2.1335740072202165e-05, + "loss": 0.1152, + "step": 3076 + }, + { + "epoch": 14.11, + "learning_rate": 2.1227436823104695e-05, + "loss": 0.0633, + "step": 3077 + }, + { + "epoch": 14.12, + "learning_rate": 2.1119133574007218e-05, + "loss": 0.0562, + "step": 3078 + }, + { + "epoch": 14.12, + "learning_rate": 2.1010830324909744e-05, + "loss": 0.061, + "step": 3079 + }, + { + "epoch": 14.13, + "learning_rate": 2.0902527075812274e-05, + "loss": 0.0507, + "step": 3080 + }, + { + "epoch": 14.13, + "learning_rate": 2.07942238267148e-05, + "loss": 0.0589, + "step": 3081 + }, + { + "epoch": 14.14, + "learning_rate": 2.0685920577617326e-05, + "loss": 0.0231, + "step": 3082 + }, + { + "epoch": 14.14, + "learning_rate": 2.0577617328519856e-05, + "loss": 0.0494, + "step": 3083 + }, + { + "epoch": 14.15, + "learning_rate": 2.046931407942238e-05, + "loss": 0.0495, + "step": 3084 + }, + { + "epoch": 14.15, + "learning_rate": 2.036101083032491e-05, + "loss": 0.0713, + "step": 3085 + }, + { + "epoch": 14.16, + "learning_rate": 2.0252707581227435e-05, + "loss": 0.0539, + "step": 3086 + }, + { + "epoch": 14.16, + "learning_rate": 2.014440433212996e-05, + "loss": 0.0824, + "step": 3087 + }, + { + "epoch": 14.17, + "learning_rate": 2.003610108303249e-05, + "loss": 0.1065, + "step": 3088 + }, + { + "epoch": 14.17, + "learning_rate": 1.9927797833935017e-05, + "loss": 0.2171, + "step": 3089 + }, + { + "epoch": 14.17, + "learning_rate": 1.9819494584837543e-05, + "loss": 0.0801, + "step": 3090 + }, + { + "epoch": 14.18, + "learning_rate": 1.9711191335740073e-05, + "loss": 0.0367, + "step": 3091 + }, + { + "epoch": 14.18, + "learning_rate": 1.9602888086642596e-05, + "loss": 0.0314, + "step": 3092 + }, + { + "epoch": 14.19, + "learning_rate": 1.9494584837545122e-05, + "loss": 0.0612, + "step": 3093 + }, + { + "epoch": 14.19, + "learning_rate": 1.9386281588447652e-05, + "loss": 0.0184, + "step": 3094 + }, + { + "epoch": 14.2, + "learning_rate": 1.9277978339350178e-05, + "loss": 0.073, + "step": 3095 + }, + { + "epoch": 14.2, + "learning_rate": 1.9169675090252708e-05, + "loss": 0.0487, + "step": 3096 + }, + { + "epoch": 14.21, + "learning_rate": 1.9061371841155234e-05, + "loss": 0.0827, + "step": 3097 + }, + { + "epoch": 14.21, + "learning_rate": 1.895306859205776e-05, + "loss": 0.1148, + "step": 3098 + }, + { + "epoch": 14.22, + "learning_rate": 1.884476534296029e-05, + "loss": 0.0997, + "step": 3099 + }, + { + "epoch": 14.22, + "learning_rate": 1.8736462093862813e-05, + "loss": 0.0548, + "step": 3100 + }, + { + "epoch": 14.22, + "eval_loss": 0.3855121433734894, + "eval_runtime": 19.9538, + "eval_samples_per_second": 82.54, + "eval_steps_per_second": 2.606, + "eval_wer": 0.3274435706260852, + "step": 3100 + }, + { + "epoch": 14.22, + "learning_rate": 1.8628158844765343e-05, + "loss": 0.0913, + "step": 3101 + }, + { + "epoch": 14.23, + "learning_rate": 1.851985559566787e-05, + "loss": 0.0907, + "step": 3102 + }, + { + "epoch": 14.23, + "learning_rate": 1.8411552346570395e-05, + "loss": 0.0219, + "step": 3103 + }, + { + "epoch": 14.24, + "learning_rate": 1.830324909747292e-05, + "loss": 0.0236, + "step": 3104 + }, + { + "epoch": 14.24, + "learning_rate": 1.819494584837545e-05, + "loss": 0.0939, + "step": 3105 + }, + { + "epoch": 14.25, + "learning_rate": 1.8086642599277977e-05, + "loss": 0.1082, + "step": 3106 + }, + { + "epoch": 14.25, + "learning_rate": 1.7978339350180504e-05, + "loss": 0.0165, + "step": 3107 + }, + { + "epoch": 14.26, + "learning_rate": 1.787003610108303e-05, + "loss": 0.0451, + "step": 3108 + }, + { + "epoch": 14.26, + "learning_rate": 1.776173285198556e-05, + "loss": 0.0661, + "step": 3109 + }, + { + "epoch": 14.27, + "learning_rate": 1.7653429602888083e-05, + "loss": 0.0851, + "step": 3110 + }, + { + "epoch": 14.27, + "learning_rate": 1.7545126353790612e-05, + "loss": 0.0783, + "step": 3111 + }, + { + "epoch": 14.28, + "learning_rate": 1.743682310469314e-05, + "loss": 0.0925, + "step": 3112 + }, + { + "epoch": 14.28, + "learning_rate": 1.7328519855595668e-05, + "loss": 0.1523, + "step": 3113 + }, + { + "epoch": 14.28, + "learning_rate": 1.722021660649819e-05, + "loss": 0.0802, + "step": 3114 + }, + { + "epoch": 14.29, + "learning_rate": 1.711191335740072e-05, + "loss": 0.1751, + "step": 3115 + }, + { + "epoch": 14.29, + "learning_rate": 1.7003610108303247e-05, + "loss": 0.0301, + "step": 3116 + }, + { + "epoch": 14.3, + "learning_rate": 1.6895306859205777e-05, + "loss": 0.0652, + "step": 3117 + }, + { + "epoch": 14.3, + "learning_rate": 1.67870036101083e-05, + "loss": 0.0463, + "step": 3118 + }, + { + "epoch": 14.31, + "learning_rate": 1.667870036101083e-05, + "loss": 0.051, + "step": 3119 + }, + { + "epoch": 14.31, + "learning_rate": 1.6570397111913356e-05, + "loss": 0.0528, + "step": 3120 + }, + { + "epoch": 14.32, + "learning_rate": 1.6462093862815885e-05, + "loss": 0.0801, + "step": 3121 + }, + { + "epoch": 14.32, + "learning_rate": 1.6353790613718408e-05, + "loss": 0.0716, + "step": 3122 + }, + { + "epoch": 14.33, + "learning_rate": 1.6245487364620938e-05, + "loss": 0.1213, + "step": 3123 + }, + { + "epoch": 14.33, + "learning_rate": 1.6137184115523464e-05, + "loss": 0.0473, + "step": 3124 + }, + { + "epoch": 14.33, + "learning_rate": 1.6028880866425994e-05, + "loss": 0.0557, + "step": 3125 + }, + { + "epoch": 14.34, + "learning_rate": 1.5920577617328517e-05, + "loss": 0.0715, + "step": 3126 + }, + { + "epoch": 14.34, + "learning_rate": 1.5812274368231046e-05, + "loss": 0.1077, + "step": 3127 + }, + { + "epoch": 14.35, + "learning_rate": 1.5703971119133573e-05, + "loss": 0.0281, + "step": 3128 + }, + { + "epoch": 14.35, + "learning_rate": 1.55956678700361e-05, + "loss": 0.0396, + "step": 3129 + }, + { + "epoch": 14.36, + "learning_rate": 1.5487364620938625e-05, + "loss": 0.0678, + "step": 3130 + }, + { + "epoch": 14.36, + "learning_rate": 1.5379061371841155e-05, + "loss": 0.0443, + "step": 3131 + }, + { + "epoch": 14.37, + "learning_rate": 1.527075812274368e-05, + "loss": 0.047, + "step": 3132 + }, + { + "epoch": 14.37, + "learning_rate": 1.5162454873646208e-05, + "loss": 0.0401, + "step": 3133 + }, + { + "epoch": 14.38, + "learning_rate": 1.5054151624548734e-05, + "loss": 0.0366, + "step": 3134 + }, + { + "epoch": 14.38, + "learning_rate": 1.4945848375451262e-05, + "loss": 0.0634, + "step": 3135 + }, + { + "epoch": 14.39, + "learning_rate": 1.483754512635379e-05, + "loss": 0.074, + "step": 3136 + }, + { + "epoch": 14.39, + "learning_rate": 1.4729241877256316e-05, + "loss": 0.0786, + "step": 3137 + }, + { + "epoch": 14.39, + "learning_rate": 1.4620938628158842e-05, + "loss": 0.0648, + "step": 3138 + }, + { + "epoch": 14.4, + "learning_rate": 1.451263537906137e-05, + "loss": 0.0846, + "step": 3139 + }, + { + "epoch": 14.4, + "learning_rate": 1.4404332129963898e-05, + "loss": 0.0572, + "step": 3140 + }, + { + "epoch": 14.41, + "learning_rate": 1.4296028880866425e-05, + "loss": 0.0445, + "step": 3141 + }, + { + "epoch": 14.41, + "learning_rate": 1.4187725631768951e-05, + "loss": 0.0353, + "step": 3142 + }, + { + "epoch": 14.42, + "learning_rate": 1.4079422382671479e-05, + "loss": 0.0481, + "step": 3143 + }, + { + "epoch": 14.42, + "learning_rate": 1.3971119133574007e-05, + "loss": 0.0185, + "step": 3144 + }, + { + "epoch": 14.43, + "learning_rate": 1.3862815884476532e-05, + "loss": 0.0448, + "step": 3145 + }, + { + "epoch": 14.43, + "learning_rate": 1.375451263537906e-05, + "loss": 0.0191, + "step": 3146 + }, + { + "epoch": 14.44, + "learning_rate": 1.3646209386281587e-05, + "loss": 0.0894, + "step": 3147 + }, + { + "epoch": 14.44, + "learning_rate": 1.3537906137184115e-05, + "loss": 0.0547, + "step": 3148 + }, + { + "epoch": 14.44, + "learning_rate": 1.342960288808664e-05, + "loss": 0.036, + "step": 3149 + }, + { + "epoch": 14.45, + "learning_rate": 1.3321299638989168e-05, + "loss": 0.085, + "step": 3150 + }, + { + "epoch": 14.45, + "learning_rate": 1.3212996389891696e-05, + "loss": 0.0693, + "step": 3151 + }, + { + "epoch": 14.46, + "learning_rate": 1.3104693140794224e-05, + "loss": 0.073, + "step": 3152 + }, + { + "epoch": 14.46, + "learning_rate": 1.2996389891696749e-05, + "loss": 0.0522, + "step": 3153 + }, + { + "epoch": 14.47, + "learning_rate": 1.2888086642599277e-05, + "loss": 0.048, + "step": 3154 + }, + { + "epoch": 14.47, + "learning_rate": 1.2779783393501805e-05, + "loss": 0.0469, + "step": 3155 + }, + { + "epoch": 14.48, + "learning_rate": 1.267148014440433e-05, + "loss": 0.0283, + "step": 3156 + }, + { + "epoch": 14.48, + "learning_rate": 1.2563176895306857e-05, + "loss": 0.0536, + "step": 3157 + }, + { + "epoch": 14.49, + "learning_rate": 1.2454873646209385e-05, + "loss": 0.0589, + "step": 3158 + }, + { + "epoch": 14.49, + "learning_rate": 1.2346570397111913e-05, + "loss": 0.0753, + "step": 3159 + }, + { + "epoch": 14.5, + "learning_rate": 1.2238267148014438e-05, + "loss": 0.1248, + "step": 3160 + }, + { + "epoch": 14.5, + "learning_rate": 1.2129963898916966e-05, + "loss": 0.0726, + "step": 3161 + }, + { + "epoch": 14.5, + "learning_rate": 1.2021660649819494e-05, + "loss": 0.0383, + "step": 3162 + }, + { + "epoch": 14.51, + "learning_rate": 1.1913357400722022e-05, + "loss": 0.031, + "step": 3163 + }, + { + "epoch": 14.51, + "learning_rate": 1.1805054151624546e-05, + "loss": 0.0466, + "step": 3164 + }, + { + "epoch": 14.52, + "learning_rate": 1.1696750902527074e-05, + "loss": 0.0599, + "step": 3165 + }, + { + "epoch": 14.52, + "learning_rate": 1.1588447653429602e-05, + "loss": 0.0356, + "step": 3166 + }, + { + "epoch": 14.53, + "learning_rate": 1.148014440433213e-05, + "loss": 0.0836, + "step": 3167 + }, + { + "epoch": 14.53, + "learning_rate": 1.1371841155234655e-05, + "loss": 0.0864, + "step": 3168 + }, + { + "epoch": 14.54, + "learning_rate": 1.1263537906137183e-05, + "loss": 0.056, + "step": 3169 + }, + { + "epoch": 14.54, + "learning_rate": 1.115523465703971e-05, + "loss": 0.0131, + "step": 3170 + }, + { + "epoch": 14.55, + "learning_rate": 1.1046931407942239e-05, + "loss": 0.0322, + "step": 3171 + }, + { + "epoch": 14.55, + "learning_rate": 1.0938628158844763e-05, + "loss": 0.054, + "step": 3172 + }, + { + "epoch": 14.56, + "learning_rate": 1.0830324909747291e-05, + "loss": 0.0317, + "step": 3173 + }, + { + "epoch": 14.56, + "learning_rate": 1.072202166064982e-05, + "loss": 0.0741, + "step": 3174 + }, + { + "epoch": 14.56, + "learning_rate": 1.0613718411552347e-05, + "loss": 0.0579, + "step": 3175 + }, + { + "epoch": 14.57, + "learning_rate": 1.0505415162454872e-05, + "loss": 0.1368, + "step": 3176 + }, + { + "epoch": 14.57, + "learning_rate": 1.03971119133574e-05, + "loss": 0.0491, + "step": 3177 + }, + { + "epoch": 14.58, + "learning_rate": 1.0288808664259928e-05, + "loss": 0.0711, + "step": 3178 + }, + { + "epoch": 14.58, + "learning_rate": 1.0180505415162454e-05, + "loss": 0.0457, + "step": 3179 + }, + { + "epoch": 14.59, + "learning_rate": 1.007220216606498e-05, + "loss": 0.0521, + "step": 3180 + }, + { + "epoch": 14.59, + "learning_rate": 9.963898916967508e-06, + "loss": 0.0348, + "step": 3181 + }, + { + "epoch": 14.6, + "learning_rate": 9.855595667870036e-06, + "loss": 0.0271, + "step": 3182 + }, + { + "epoch": 14.6, + "learning_rate": 9.747292418772561e-06, + "loss": 0.0431, + "step": 3183 + }, + { + "epoch": 14.61, + "learning_rate": 9.638989169675089e-06, + "loss": 0.0579, + "step": 3184 + }, + { + "epoch": 14.61, + "learning_rate": 9.530685920577617e-06, + "loss": 0.0699, + "step": 3185 + }, + { + "epoch": 14.61, + "learning_rate": 9.422382671480145e-06, + "loss": 0.0526, + "step": 3186 + }, + { + "epoch": 14.62, + "learning_rate": 9.314079422382671e-06, + "loss": 0.0583, + "step": 3187 + }, + { + "epoch": 14.62, + "learning_rate": 9.205776173285198e-06, + "loss": 0.0759, + "step": 3188 + }, + { + "epoch": 14.63, + "learning_rate": 9.097472924187726e-06, + "loss": 0.1015, + "step": 3189 + }, + { + "epoch": 14.63, + "learning_rate": 8.989169675090252e-06, + "loss": 0.0552, + "step": 3190 + }, + { + "epoch": 14.64, + "learning_rate": 8.88086642599278e-06, + "loss": 0.0393, + "step": 3191 + }, + { + "epoch": 14.64, + "learning_rate": 8.772563176895306e-06, + "loss": 0.0453, + "step": 3192 + }, + { + "epoch": 14.65, + "learning_rate": 8.664259927797834e-06, + "loss": 0.0432, + "step": 3193 + }, + { + "epoch": 14.65, + "learning_rate": 8.55595667870036e-06, + "loss": 0.0236, + "step": 3194 + }, + { + "epoch": 14.66, + "learning_rate": 8.447653429602888e-06, + "loss": 0.0537, + "step": 3195 + }, + { + "epoch": 14.66, + "learning_rate": 8.339350180505415e-06, + "loss": 0.0697, + "step": 3196 + }, + { + "epoch": 14.67, + "learning_rate": 8.231046931407943e-06, + "loss": 0.0397, + "step": 3197 + }, + { + "epoch": 14.67, + "learning_rate": 8.122743682310469e-06, + "loss": 0.0984, + "step": 3198 + }, + { + "epoch": 14.67, + "learning_rate": 8.014440433212997e-06, + "loss": 0.0292, + "step": 3199 + }, + { + "epoch": 14.68, + "learning_rate": 7.906137184115523e-06, + "loss": 0.0577, + "step": 3200 + }, + { + "epoch": 14.68, + "eval_loss": 0.3892526924610138, + "eval_runtime": 20.1653, + "eval_samples_per_second": 81.675, + "eval_steps_per_second": 2.579, + "eval_wer": 0.3237667245429476, + "step": 3200 + }, + { + "epoch": 14.68, + "learning_rate": 7.79783393501805e-06, + "loss": 0.0626, + "step": 3201 + }, + { + "epoch": 14.69, + "learning_rate": 7.689530685920577e-06, + "loss": 0.1146, + "step": 3202 + }, + { + "epoch": 14.69, + "learning_rate": 7.581227436823104e-06, + "loss": 0.0531, + "step": 3203 + }, + { + "epoch": 14.7, + "learning_rate": 7.472924187725631e-06, + "loss": 0.0284, + "step": 3204 + }, + { + "epoch": 14.7, + "learning_rate": 7.364620938628158e-06, + "loss": 0.042, + "step": 3205 + }, + { + "epoch": 14.71, + "learning_rate": 7.256317689530685e-06, + "loss": 0.0759, + "step": 3206 + }, + { + "epoch": 14.71, + "learning_rate": 7.148014440433212e-06, + "loss": 0.044, + "step": 3207 + }, + { + "epoch": 14.72, + "learning_rate": 7.0397111913357395e-06, + "loss": 0.1005, + "step": 3208 + }, + { + "epoch": 14.72, + "learning_rate": 6.931407942238266e-06, + "loss": 0.0498, + "step": 3209 + }, + { + "epoch": 14.72, + "learning_rate": 6.823104693140794e-06, + "loss": 0.1059, + "step": 3210 + }, + { + "epoch": 14.73, + "learning_rate": 6.71480144404332e-06, + "loss": 0.0423, + "step": 3211 + }, + { + "epoch": 14.73, + "learning_rate": 6.606498194945848e-06, + "loss": 0.0979, + "step": 3212 + }, + { + "epoch": 14.74, + "learning_rate": 6.498194945848374e-06, + "loss": 0.0609, + "step": 3213 + }, + { + "epoch": 14.74, + "learning_rate": 6.389891696750902e-06, + "loss": 0.1065, + "step": 3214 + }, + { + "epoch": 14.75, + "learning_rate": 6.281588447653429e-06, + "loss": 0.0699, + "step": 3215 + }, + { + "epoch": 14.75, + "learning_rate": 6.1732851985559566e-06, + "loss": 0.0256, + "step": 3216 + }, + { + "epoch": 14.76, + "learning_rate": 6.064981949458483e-06, + "loss": 0.0249, + "step": 3217 + }, + { + "epoch": 14.76, + "learning_rate": 5.956678700361011e-06, + "loss": 0.0444, + "step": 3218 + }, + { + "epoch": 14.77, + "learning_rate": 5.848375451263537e-06, + "loss": 0.0891, + "step": 3219 + }, + { + "epoch": 14.77, + "learning_rate": 5.740072202166065e-06, + "loss": 0.0694, + "step": 3220 + }, + { + "epoch": 14.78, + "learning_rate": 5.631768953068591e-06, + "loss": 0.0481, + "step": 3221 + }, + { + "epoch": 14.78, + "learning_rate": 5.523465703971119e-06, + "loss": 0.0626, + "step": 3222 + }, + { + "epoch": 14.78, + "learning_rate": 5.415162454873646e-06, + "loss": 0.0358, + "step": 3223 + }, + { + "epoch": 14.79, + "learning_rate": 5.306859205776174e-06, + "loss": 0.0595, + "step": 3224 + }, + { + "epoch": 14.79, + "learning_rate": 5.1985559566787e-06, + "loss": 0.0943, + "step": 3225 + }, + { + "epoch": 14.8, + "learning_rate": 5.090252707581227e-06, + "loss": 0.1334, + "step": 3226 + }, + { + "epoch": 14.8, + "learning_rate": 4.981949458483754e-06, + "loss": 0.1458, + "step": 3227 + }, + { + "epoch": 14.81, + "learning_rate": 4.8736462093862805e-06, + "loss": 0.0443, + "step": 3228 + }, + { + "epoch": 14.81, + "learning_rate": 4.7653429602888085e-06, + "loss": 0.0442, + "step": 3229 + }, + { + "epoch": 14.82, + "learning_rate": 4.657039711191336e-06, + "loss": 0.0542, + "step": 3230 + }, + { + "epoch": 14.82, + "learning_rate": 4.548736462093863e-06, + "loss": 0.0882, + "step": 3231 + }, + { + "epoch": 14.83, + "learning_rate": 4.44043321299639e-06, + "loss": 0.0776, + "step": 3232 + }, + { + "epoch": 14.83, + "learning_rate": 4.332129963898917e-06, + "loss": 0.0594, + "step": 3233 + }, + { + "epoch": 14.83, + "learning_rate": 4.223826714801444e-06, + "loss": 0.0368, + "step": 3234 + }, + { + "epoch": 14.84, + "learning_rate": 4.115523465703971e-06, + "loss": 0.0625, + "step": 3235 + }, + { + "epoch": 14.84, + "learning_rate": 4.0072202166064985e-06, + "loss": 0.052, + "step": 3236 + }, + { + "epoch": 14.85, + "learning_rate": 3.898916967509025e-06, + "loss": 0.0525, + "step": 3237 + }, + { + "epoch": 14.85, + "learning_rate": 3.790613718411552e-06, + "loss": 0.0845, + "step": 3238 + }, + { + "epoch": 14.86, + "learning_rate": 3.682310469314079e-06, + "loss": 0.079, + "step": 3239 + }, + { + "epoch": 14.86, + "learning_rate": 3.574007220216606e-06, + "loss": 0.089, + "step": 3240 + }, + { + "epoch": 14.87, + "learning_rate": 3.465703971119133e-06, + "loss": 0.0164, + "step": 3241 + }, + { + "epoch": 14.87, + "learning_rate": 3.35740072202166e-06, + "loss": 0.0755, + "step": 3242 + }, + { + "epoch": 14.88, + "learning_rate": 3.249097472924187e-06, + "loss": 0.0309, + "step": 3243 + }, + { + "epoch": 14.88, + "learning_rate": 3.1407942238267143e-06, + "loss": 0.0394, + "step": 3244 + }, + { + "epoch": 14.89, + "learning_rate": 3.0324909747292414e-06, + "loss": 0.0306, + "step": 3245 + }, + { + "epoch": 14.89, + "learning_rate": 2.9241877256317686e-06, + "loss": 0.0657, + "step": 3246 + }, + { + "epoch": 14.89, + "learning_rate": 2.8158844765342957e-06, + "loss": 0.0905, + "step": 3247 + }, + { + "epoch": 14.9, + "learning_rate": 2.707581227436823e-06, + "loss": 0.0592, + "step": 3248 + }, + { + "epoch": 14.9, + "learning_rate": 2.59927797833935e-06, + "loss": 0.059, + "step": 3249 + }, + { + "epoch": 14.91, + "learning_rate": 2.490974729241877e-06, + "loss": 0.0542, + "step": 3250 + }, + { + "epoch": 14.91, + "learning_rate": 2.3826714801444043e-06, + "loss": 0.0481, + "step": 3251 + }, + { + "epoch": 14.92, + "learning_rate": 2.2743682310469314e-06, + "loss": 0.0558, + "step": 3252 + }, + { + "epoch": 14.92, + "learning_rate": 2.1660649819494585e-06, + "loss": 0.0393, + "step": 3253 + }, + { + "epoch": 14.93, + "learning_rate": 2.0577617328519857e-06, + "loss": 0.0599, + "step": 3254 + }, + { + "epoch": 14.93, + "learning_rate": 1.9494584837545124e-06, + "loss": 0.0199, + "step": 3255 + }, + { + "epoch": 14.94, + "learning_rate": 1.8411552346570395e-06, + "loss": 0.0636, + "step": 3256 + }, + { + "epoch": 14.94, + "learning_rate": 1.7328519855595664e-06, + "loss": 0.0324, + "step": 3257 + }, + { + "epoch": 14.94, + "learning_rate": 1.6245487364620936e-06, + "loss": 0.1272, + "step": 3258 + }, + { + "epoch": 14.95, + "learning_rate": 1.5162454873646207e-06, + "loss": 0.0669, + "step": 3259 + }, + { + "epoch": 14.95, + "learning_rate": 1.4079422382671479e-06, + "loss": 0.0416, + "step": 3260 + }, + { + "epoch": 14.96, + "learning_rate": 1.299638989169675e-06, + "loss": 0.0985, + "step": 3261 + }, + { + "epoch": 14.96, + "learning_rate": 1.1913357400722021e-06, + "loss": 0.0722, + "step": 3262 + }, + { + "epoch": 14.97, + "learning_rate": 1.0830324909747293e-06, + "loss": 0.0635, + "step": 3263 + }, + { + "epoch": 14.97, + "learning_rate": 9.747292418772562e-07, + "loss": 0.0622, + "step": 3264 + }, + { + "epoch": 14.98, + "learning_rate": 8.664259927797832e-07, + "loss": 0.0782, + "step": 3265 + }, + { + "epoch": 14.98, + "learning_rate": 7.581227436823104e-07, + "loss": 0.0621, + "step": 3266 + }, + { + "epoch": 14.99, + "learning_rate": 6.498194945848375e-07, + "loss": 0.0507, + "step": 3267 + }, + { + "epoch": 14.99, + "learning_rate": 5.415162454873646e-07, + "loss": 0.1, + "step": 3268 + }, + { + "epoch": 15.0, + "learning_rate": 4.332129963898916e-07, + "loss": 0.0268, + "step": 3269 + }, + { + "epoch": 15.0, + "learning_rate": 3.2490974729241875e-07, + "loss": 0.0816, + "step": 3270 + }, + { + "epoch": 15.0, + "step": 3270, + "total_flos": 6.705896706040398e+18, + "train_loss": 0.6689931568703885, + "train_runtime": 2436.2567, + "train_samples_per_second": 21.414, + "train_steps_per_second": 1.342 + } + ], + "max_steps": 3270, + "num_train_epochs": 15, + "total_flos": 6.705896706040398e+18, + "trial_name": null, + "trial_params": null +}